python/FunASR-XL.git

			@@ -9,6 +9,7 @@
			from torch import nn

			import whisper

			# import whisper_timestamped as whisper

			from funasr.utils.load_utils import load_audio_text_image_video, extract_fbank
			@@ -112,7 +113,7 @@
			# decode the audio
			options = whisper.DecodingOptions(**kwargs.get("DecodingOptions", {}))

			result = whisper.decode(self.model, speech, language='english')
			result = whisper.decode(self.model, speech, options=options)
			# result = whisper.transcribe(self.model, speech)

			results = []