From 810046e3df4910c8f5c1a90e4b53aca45b3397e8 Mon Sep 17 00:00:00 2001
From: wuhongsheng <664116298@qq.com>
Date: Mon, 01 Jul 2024 10:42:58 +0800
Subject: [PATCH] 优化merge segments 参数,解决新闻联播男女主持人“晚上好”合并一个speakid问题 (#1861)
---
fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py | 4 +---
1 file changed, 1 insertion(+), 3 deletions(-)
diff --git a/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py b/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
index 0a08a7b..4574121 100644
--- a/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
+++ b/fun_text_processing/inverse_text_normalization/vi/verbalizers/whitelist.py
@@ -1,5 +1,3 @@
-
-
import pynini
from fun_text_processing.inverse_text_normalization.vi.graph_utils import (
DAMO_CHAR,
@@ -25,5 +23,5 @@
+ pynini.closure(DAMO_CHAR - " ", 1)
+ pynutil.delete('"')
)
- graph = graph @ pynini.cdrewrite(pynini.cross(u"\u00A0", " "), "", "", DAMO_SIGMA)
+ graph = graph @ pynini.cdrewrite(pynini.cross("\u00A0", " "), "", "", DAMO_SIGMA)
self.fst = graph.optimize()
--
Gitblit v1.9.1