zhifu gao
2024-03-29 320c7ff2c2dfbce13ee01589a64b515bf2d7857b
funasr/models/fsmn_vad_streaming/model.py
@@ -543,6 +543,11 @@
      cache["frontend"] = {}
      cache["prev_samples"] = torch.empty(0)
      cache["encoder"] = {}
      if kwargs.get("max_end_silence_time") is not None:
         # Override the configured max_end_silence_time with the caller-supplied value (this mutates self.vad_opts).
         self.vad_opts.max_end_silence_time = kwargs.get("max_end_silence_time")
      windows_detector = WindowDetector(self.vad_opts.window_size_ms,
                                        self.vad_opts.sil_to_speech_time_thres,
                                        self.vad_opts.speech_to_sil_time_thres,