Speech to Text

OpenAI Whisper
https://github.com/openai/whisper

https://hub.docker.com/r/fedirz/faster-whisper-server

https://github.com/speaches-ai/speaches

Example Python script: uses the OpenAI client library with base_url changed to point at a self-hosted Whisper server

# Create a working directory with its own virtual environment and install
# the OpenAI client library into it.
mkdir transcribe
cd transcribe
python -m venv venv
source venv/bin/activate
pip install openai

# Write the script with '>' (overwrite) rather than '>>' so that re-running
# these commands does not append a second copy to trans.py. The heredoc
# delimiter is quoted so the shell copies the script body literally.
cat > trans.py << 'EOD'
#!/home/user/transcribe/venv/bin/python3
from openai import OpenAI
import sys,os
 
def usage():
    """Print command-line usage help to stdout and exit with status 1."""
    print("Usage: "+os.path.basename(__file__)+" inputfile [outputfile]")
    print(" inputfile \t\tInput file to transcribe")
    print(" outputfile\tOptional: Filename to store transcription to")
    # Use sys.exit rather than the bare exit() helper: exit() is installed by
    # the site module for interactive sessions and is not guaranteed to exist.
    sys.exit(1)
 
# The input path is mandatory; show the usage text and exit when it is missing.
if len(sys.argv) < 2:
    usage()
inputfile = sys.argv[1]
# The output path is optional; None means the transcript goes to stdout.
outputfile = sys.argv[2] if len(sys.argv) > 2 else None

# Send requests to the server at base_url instead of the client's default
# endpoint. The api_key value is only a placeholder string.
client = OpenAI(base_url="http://192.168.xx.xx:8010/v1", api_key="not needed")

# Open the audio inside a with-block so the handle is closed once the
# request has finished, even if the request raises.
with open(inputfile, "rb") as audio_file:
    transcription = client.audio.transcriptions.create(
        model="Systran/faster-whisper-large-v3",
        file=audio_file,
    )

if outputfile is None:
    print(transcription.text)
else:
    try:
        with open(outputfile, "w", encoding="utf-8") as text_file:
            text_file.write(transcription.text)
    except OSError as err:
        # Keep the fallback of printing the transcript so the result is not
        # lost, but report the failure instead of hiding it.
        print("Could not write " + outputfile + ": " + str(err), file=sys.stderr)
        print(transcription.text)
        sys.exit(1)
EOD