Add scripts for audio transcription using whisper.cpp

2023-06-03 17:21:16 -04:00
parent 06bbc0c995
commit 173bda9eb0
9 changed files with 242 additions and 2 deletions
--- a/bin/transcribe-audio
+++ b/bin/transcribe-audio
@@ -0,0 +1,54 @@
+#!/usr/bin/env bash
+
+if which tput >/dev/null 2>&1; then
+    ncolors=$(tput colors)
+fi
+if [ -t 1 ] && [ -n "$ncolors" ] && [ "$ncolors" -ge 8 ]; then
+    RED="$(tput setaf 1)"
+    GREEN="$(tput setaf 2)"
+    YELLOW="$(tput setaf 3)"
+    BLUE="$(tput setaf 4)"
+    MAGENTA="$(tput setaf 5)"
+    CYAN="$(tput setaf 6)"
+    BOLD="$(tput bold)"
+    NORMAL="$(tput sgr0)"
+else
+    RED=""
+    GREEN=""
+    YELLOW=""
+    BLUE=""
+    MAGENTA=""
+    CYAN=""
+    BOLD=""
+    NORMAL=""
+fi
+
+input_wav="$1"
+output_name_without_ext="$2"
+model="$3"
+threads=$4
+
+# 4 seems to be the sweet spot.
+default_thread_count=4
+
+if [[ $input_wav == "" || $output_name_without_ext == "" || $model == "" ]]; then
+    printf "${BOLD}${RED}Usage: $0 <input.wav> <output name without extension> <model name> <optional: thread count>${NORMAL}\n"
+    exit 1
+fi
+
+if [[ ! -f "$input_wav" ]]; then
+    printf "${RED}${BOLD}Input file \"$input_wav\" doesn't exist!\n${NORMAL}"
+    exit 1
+fi
+
+if [[ $threads == "" ]]; then
+    threads=$default_thread_count
+fi
+
+output_name="$output_name_without_ext.${model}"
+
+printf "\n${YELLOW}${BOLD}Transcribing $input_wav | model: $model | threads: $threads | output: $output_name ${NORMAL}\n"
+
+whisper.exe --threads ${threads} -m $JELLYPIXEL_OPENSOURCE_DEV/whisper.cpp/models/ggml-${model}.en.bin -otxt -osrt -f "$input_wav" -of "$output_name" --print-colors
+
+printf "${GREEN}${BOLD}Done transcribing $input_wav | model: $model | threads: $threads | output: $output_name${NORMAL}\n"