funasr/models/sense_voice/model.py
@@ -91,7 +91,11 @@ # decode the audio # initial_prompt = kwargs.get("initial_prompt", "<|startoftranscript|><|ASR|>") options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt) vocab_path = kwargs.get("vocab_path", None) options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt, vocab_path=vocab_path) result = whisper.decode(self.model, speech, options) results = []