From 273d0d6015a4655cb34cc77cee2c3267a23d7d03 Mon Sep 17 00:00:00 2001
From: 九耳 <mengzhe.cmz@alibaba-inc.com>
Date: Fri, 03 Feb 2023 13:09:05 +0800
Subject: [PATCH] update punc and asr_inference_paraformer_vad_punc

---
 funasr/punctuation/text_preprocessor.py |   21 ---------------------
 1 files changed, 0 insertions(+), 21 deletions(-)

diff --git a/funasr/punctuation/text_preprocessor.py b/funasr/punctuation/text_preprocessor.py
index 3d2c19e..c9c4bac 100644
--- a/funasr/punctuation/text_preprocessor.py
+++ b/funasr/punctuation/text_preprocessor.py
@@ -1,24 +1,3 @@
-def split_words(text: str):
-    words = []
-    segs = text.split()
-    for seg in segs:
-        # There is no space in seg.
-        current_word = ""
-        for c in seg:
-            if len(c.encode()) == 1:
-                # This is an ASCII char.
-                current_word += c
-            else:
-                # This is a Chinese char.
-                if len(current_word) > 0:
-                    words.append(current_word)
-                    current_word = ""
-                words.append(c)
-        if len(current_word) > 0:
-            words.append(current_word)
-    return words
-
-
 def split_to_mini_sentence(words: list, word_limit: int = 20):
     assert word_limit > 1
     if len(words) <= word_limit:

--
Gitblit v1.9.1