Yuekai Zhang
2023-03-06 80e6c258cf89b5f11f4e52a4cc5a9cf2e95aa7be
funasr/models/e2e_uni_asr.py
@@ -206,7 +206,7 @@
            with torch.no_grad():
                speech_raw, encoder_out, encoder_out_lens = self.encode(speech, speech_lengths, ind=ind)
        else:
            speech_raw, encoder_out_lens = self.encode(speech, speech_lengths, ind=ind)
            speech_raw, encoder_out, encoder_out_lens = self.encode(speech, speech_lengths, ind=ind)
        intermediate_outs = None
        if isinstance(encoder_out, tuple):