transcription/conversion_simple_en.py

31 lines
733 B
Python
Raw Permalink Normal View History

2021-03-23 12:54:17 +01:00
#!/usr/bin/env python3
from vosk import Model, KaldiRecognizer, SetLogLevel
import sys
import os
import wave
# Transcribe a mono 16-bit PCM WAV file (path given as the first command-line
# argument) with a Vosk model and print the recognizer's results to stdout.

# Vosk log verbosity. NOTE(review): confirm the meaning of level 0 in the
# Vosk documentation.
SetLogLevel(0)

# Directory the model is loaded from. Shared by the existence check and the
# Model constructor so the two cannot drift apart.
MODEL_PATH = "models/en"

# Number of audio frames handed to the recognizer per loop iteration.
FRAMES_PER_CHUNK = 4000

if not os.path.exists(MODEL_PATH):
    # The message names the exact directory that is checked above, so that
    # following the instruction actually makes the check pass.
    print("Please download the model from https://alphacephei.com/vosk/models "
          "and unpack as '{}' in the current folder.".format(MODEL_PATH))
    sys.exit(1)

if len(sys.argv) < 2:
    # Without this guard a missing argument surfaces as a bare IndexError.
    print("Usage: {} <audio.wav>".format(sys.argv[0]))
    sys.exit(1)

# The context manager closes the WAV file on every exit path, including the
# sys.exit() below (SystemExit propagates through the with-block).
with wave.open(sys.argv[1], "rb") as wf:
    is_mono = wf.getnchannels() == 1
    is_16_bit = wf.getsampwidth() == 2
    is_uncompressed = wf.getcomptype() == "NONE"
    if not (is_mono and is_16_bit and is_uncompressed):
        print("Audio file must be WAV format mono PCM.")
        sys.exit(1)

    # The model is loaded only after the input has been validated, as in the
    # original statement order.
    model = Model(MODEL_PATH)
    rec = KaldiRecognizer(model, wf.getframerate())

    while True:
        data = wf.readframes(FRAMES_PER_CHUNK)
        if not data:
            # readframes() returns empty bytes once the file is exhausted.
            break
        # Print an intermediate result whenever the recognizer reports one
        # (presumably at the end of an utterance -- see the Vosk API docs).
        if rec.AcceptWaveform(data):
            print(rec.Result())

    # Emit the result for whatever audio remains after the last chunk.
    print(rec.FinalResult())