python语音识别whisper
程序猿和攻城狮:
import whisper
import stable_whisper as whisper
class WhisperTranscriber:
    """Thin wrapper that loads a Whisper model once and turns audio into text."""

    def __init__(self, model_name):
        """Load the model identified by *model_name* via ``whisper.load_model``.

        Args:
            model_name: Model identifier forwarded unchanged to
                ``whisper.load_model`` (the demo below uses ``"tiny"``).
        """
        self.model = whisper.load_model(model_name)

    def whisper_transcribe(self, audio_path, language='Chinese'):
        """Transcribe *audio_path* and return the recognized text.

        Each recognized word is followed by a single space and each segment
        is followed by a comma; leading and trailing commas are stripped
        from the final string.

        Args:
            audio_path: Path of the audio file, forwarded to
                ``self.model.transcribe``.
            language: Language forwarded to ``self.model.transcribe``.
                Defaults to ``'Chinese'``, the value that was previously
                hard-coded.

        Returns:
            The joined transcription as a single string (empty when the
            model yields no segments).
        """
        # fp16=False is kept from the original call.
        # NOTE(review): presumably this forces FP32 for CPU-only machines - confirm.
        result = self.model.transcribe(audio_path, fp16=False, language=language)

        # Assumes the result iterates as segments, each exposing ``.words``
        # whose items carry a ``.word`` string (stable_whisper result
        # objects) - TODO confirm against the installed version.
        segment_texts = (
            "".join(word_timing.word + " " for word_timing in segment.words) + ","
            for segment in result
        )
        return "".join(segment_texts).strip(",")
if __name__ == "__main__":
    # Demo entry point: load the "tiny" model, transcribe test.mp3 and
    # print the resulting text.
    print(WhisperTranscriber("tiny").whisper_transcribe("test.mp3"))
这是最新的代码,运行后不会出错。
|