funasr/utils/asr_utils.py
@@ -5,6 +5,7 @@ from typing import Any, Dict, List, Union import torchaudio import soundfile import numpy as np import pkg_resources from modelscope.utils.logger import get_logger @@ -135,7 +136,10 @@ if support_audio_type == "pcm": fs = None else: audio, fs = torchaudio.load(fname) try: audio, fs = torchaudio.load(fname) except: audio, fs = soundfile.read(fname) break if audio_type.rfind(".scp") >= 0: with open(fname, encoding="utf-8") as f: