"""Transcribe a single audio file with OpenAI Whisper and print the text."""

import whisper

# Checkpoint name handed to whisper.load_model().
MODEL_NAME = "large-v3-turbo"
# Audio file to transcribe, relative to the current working directory.
AUDIO_PATH = "./driven_audio/chinese_poem1.wav"

model = whisper.load_model(MODEL_NAME)

# fp16 must be the boolean False, not the string "False": a non-empty string
# is truthy, so the string form would be treated as "enabled" by any boolean
# check and silently request half precision instead of disabling it.
result = model.transcribe(AUDIO_PATH, fp16=False)

# The transcription result is indexed by key; "text" holds the transcript.
print(result["text"])