import whisper
# Load the Whisper checkpoint named "large-v3-turbo".
model = whisper.load_model("large-v3-turbo")

# Transcribe the audio file. `fp16` must be a real boolean: the string
# "False" is non-empty and therefore truthy, so it would not switch
# half-precision off as intended.
result = model.transcribe("./driven_audio/chinese_poem1.wav", fp16=False)

# Print the transcribed text stored under the "text" key of the result.
print(result["text"])