yhliang
2023-04-27 32d2b3ec153e53176da710ebcc0aba5669effd8a
funasr/runtime/python/onnxruntime/funasr_onnx/utils/e2e_vad.py
@@ -1,3 +1,7 @@
# -*- encoding: utf-8 -*-
# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
#  MIT License  (https://opensource.org/licenses/MIT)
from enum import Enum
from typing import List, Tuple, Dict, Any
@@ -189,6 +193,11 @@
class E2EVadModel():
    """
    Author: Speech Lab of DAMO Academy, Alibaba Group
    Deep-FSMN for Large Vocabulary Continuous Speech Recognition
    https://arxiv.org/abs/1803.05030
    """
    def __init__(self, vad_post_args: Dict[str, Any]):
        """Set up the VAD post-processing options for this model.

        Args:
            vad_post_args: Mapping that is unpacked as keyword arguments
                into ``VADXOptions``; the result is stored on
                ``self.vad_opts``.
        """
        super(E2EVadModel, self).__init__()
        # Unpack the dict into keyword arguments for VADXOptions
        # (VADXOptions is defined outside this excerpt).
        self.vad_opts = VADXOptions(**vad_post_args)
@@ -470,8 +479,8 @@
                            end_ms = -1
                            self.next_seg = False
                    else:
                        if not self.output_data_buf[i].contain_seg_start_point or not self.output_data_buf[
                            i].contain_seg_end_point:
                        if not is_final and (not self.output_data_buf[i].contain_seg_start_point or not self.output_data_buf[
                            i].contain_seg_end_point):
                            continue
                        start_ms = self.output_data_buf[i].start_ms
                        end_ms = self.output_data_buf[i].end_ms