dotfiles/bin/transcribe-audio

#!/usr/bin/env bash

if which tput >/dev/null 2>&1; then
    ncolors=$(tput colors)
fi
if [ -t 1 ] && [ -n "$ncolors" ] && [ "$ncolors" -ge 8 ]; then
    RED="$(tput setaf 1)"
    GREEN="$(tput setaf 2)"
    YELLOW="$(tput setaf 3)"
    BLUE="$(tput setaf 4)"
    MAGENTA="$(tput setaf 5)"
    CYAN="$(tput setaf 6)"
    BOLD="$(tput bold)"
    NORMAL="$(tput sgr0)"
else
    RED=""
    GREEN=""
    YELLOW=""
    BLUE=""
    MAGENTA=""
    CYAN=""
    BOLD=""
    NORMAL=""
fi

input_wav="$1"
output_name_without_ext="$2"
model="$3"
threads=$4

# 4 seems to be the sweet spot.
default_thread_count=4

if [[ $input_wav == "" || $output_name_without_ext == "" || $model == "" ]]; then
    printf "${BOLD}${RED}Usage: $0 <input.wav> <output name without extension> <model name> <optional: thread count>${NORMAL}\n"
    exit 1
fi

if [[ ! -f "$input_wav" ]]; then
    printf "${RED}${BOLD}Input file \"$input_wav\" doesn't exist!\n${NORMAL}"
    exit 1
fi

if [[ $threads == "" ]]; then
    threads=$default_thread_count
fi

output_name="$output_name_without_ext.${model}"

printf "\n${YELLOW}${BOLD}Transcribing $input_wav | model: $model | threads: $threads | output: $output_name ${NORMAL}\n"

whisper.exe --threads ${threads} -m $JELLYPIXEL_OPENSOURCE_DEV/whisper.cpp/models/ggml-${model}.en.bin -otxt -osrt -f "$input_wav" -of "$output_name" --print-colors

printf "${GREEN}${BOLD}Done transcribing $input_wav | model: $model | threads: $threads | output: $output_name${NORMAL}\n"
Add scripts for audio transcription using whisper.cpp 2023-06-03 21:21:16 +00:00			`#!/usr/bin/env bash`

			`if which tput >/dev/null 2>&1; then`
			`ncolors=$(tput colors)`
			`fi`
			`if [ -t 1 ] && [ -n "$ncolors" ] && [ "$ncolors" -ge 8 ]; then`
			`RED="$(tput setaf 1)"`
			`GREEN="$(tput setaf 2)"`
			`YELLOW="$(tput setaf 3)"`
			`BLUE="$(tput setaf 4)"`
			`MAGENTA="$(tput setaf 5)"`
			`CYAN="$(tput setaf 6)"`
			`BOLD="$(tput bold)"`
			`NORMAL="$(tput sgr0)"`
			`else`
			`RED=""`
			`GREEN=""`
			`YELLOW=""`
			`BLUE=""`
			`MAGENTA=""`
			`CYAN=""`
			`BOLD=""`
			`NORMAL=""`
			`fi`

			`input_wav="$1"`
			`output_name_without_ext="$2"`
			`model="$3"`
			`threads=$4`

			`# 4 seems to be the sweet spot.`
			`default_thread_count=4`

			`if [[ $input_wav == "" \|\| $output_name_without_ext == "" \|\| $model == "" ]]; then`
			`printf "${BOLD}${RED}Usage: $0 <input.wav> <output name without extension> <model name> <optional: thread count>${NORMAL}\n"`
			`exit 1`
			`fi`

			`if [[ ! -f "$input_wav" ]]; then`
			`printf "${RED}${BOLD}Input file \"$input_wav\" doesn't exist!\n${NORMAL}"`
			`exit 1`
			`fi`

			`if [[ $threads == "" ]]; then`
			`threads=$default_thread_count`
			`fi`

			`output_name="$output_name_without_ext.${model}"`

			`printf "\n${YELLOW}${BOLD}Transcribing $input_wav \| model: $model \| threads: $threads \| output: $output_name ${NORMAL}\n"`

			`whisper.exe --threads ${threads} -m $JELLYPIXEL_OPENSOURCE_DEV/whisper.cpp/models/ggml-${model}.en.bin -otxt -osrt -f "$input_wav" -of "$output_name" --print-colors`

			`printf "${GREEN}${BOLD}Done transcribing $input_wav \| model: $model \| threads: $threads \| output: $output_name${NORMAL}\n"`