zhifu gao
2024-04-08 d19f48e17478be273584853568ac101c994c37e5
funasr/models/sense_voice/model.py
@@ -91,7 +91,11 @@
        # decode the audio
        
        # initial_prompt = kwargs.get("initial_prompt", "<|startoftranscript|><|ASR|>")
        options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt)
        vocab_path = kwargs.get("vocab_path", None)
        options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt, vocab_path=vocab_path)
        result = whisper.decode(self.model, speech, options)
        results = []