From 810046e3df4910c8f5c1a90e4b53aca45b3397e8 Mon Sep 17 00:00:00 2001
From: wuhongsheng <664116298@qq.com>
Date: 星期一, 01 七月 2024 10:42:58 +0800
Subject: [PATCH] 优化merge segments 参数,解决新闻联播男女主持人“晚上好”合并一个speakid问题 (#1861)

---
 fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py |    4 +---
 1 files changed, 1 insertions(+), 3 deletions(-)

diff --git a/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py b/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
index 0a08a7b..4574121 100644
--- a/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
+++ b/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
@@ -1,5 +1,3 @@
-
-
 import pynini
 from fun_text_processing.inverse_text_normalization.vi.graph_utils import (
     DAMO_CHAR,
@@ -25,5 +23,5 @@
             + pynini.closure(DAMO_CHAR - " ", 1)
             + pynutil.delete('"')
         )
-        graph = graph @ pynini.cdrewrite(pynini.cross(u"\u00A0", " "), "", "", DAMO_SIGMA)
+        graph = graph @ pynini.cdrewrite(pynini.cross("\u00A0", " "), "", "", DAMO_SIGMA)
         self.fst = graph.optimize()

--
Gitblit v1.9.1