# whisper_asr.py
import functools

import whisper
from zhconv import convert
  3. def get_whisper_asr(audio, model='medium'):
  4. try:
  5. model = whisper.load_model(model, device='cuda')
  6. result = model.transcribe(audio, language='Chinese')
  7. # 简繁转换
  8. # zh-cn 大陆简体
  9. # zh-hant 繁体
  10. return convert(result['text'], 'zh-cn')
  11. except Exception as e:
  12. print(f'asr error: {audio}. e: {e}')
  13. return ''