zhifu gao
2024-04-08 6ddd383370c3b264c5c56a8fafb33e5cde20cfc5
funasr/models/sense_voice/model.py
@@ -91,7 +91,11 @@
        # decode the audio
        
        # initial_prompt = kwargs.get("initial_prompt", "<|startoftranscript|><|ASR|>")
        options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt)
        vocab_path = kwargs.get("vocab_path", None)
        options = whisper.DecodingOptions(language=language, fp16=False, without_timestamps=True, initial_prompt=initial_prompt, vocab_path=vocab_path)
        result = whisper.decode(self.model, speech, options)
        results = []