funasr/models/paraformer_streaming/model.py
@@ -428,7 +428,8 @@ **kwargs, ): cache = kwargs.get("cache", {}) speech.to(device=kwargs["device"]), speech_lengths.to(device=kwargs["device"]) speech = speech.to(device=kwargs["device"]) speech_lengths = speech_lengths.to(device=kwargs["device"]) # Encoder encoder_out, encoder_out_lens = self.encode_chunk(speech, speech_lengths, cache=cache, is_final=kwargs.get("is_final", False))