From 1cdb3cc28d4d89a576cc06e5cd8eb80da1f3a3aa Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Fri, 26 Apr 2024 11:27:39 +0800
Subject: [PATCH] Dev gzf exp (#1665)
---
fun_text_processing/inverse_text_normalization/id/verbalizers/whitelist.py | 13 +++++++++----
1 file changed, 9 insertions(+), 4 deletions(-)
diff --git a/fun_text_processing/inverse_text_normalization/id/verbalizers/whitelist.py b/fun_text_processing/inverse_text_normalization/id/verbalizers/whitelist.py
index f1ced47..4450202 100644
--- a/fun_text_processing/inverse_text_normalization/id/verbalizers/whitelist.py
+++ b/fun_text_processing/inverse_text_normalization/id/verbalizers/whitelist.py
@@ -1,5 +1,10 @@
import pynini
-from fun_text_processing.inverse_text_normalization.id.graph_utils import DAMO_CHAR, DAMO_SIGMA, GraphFst, delete_space
+from fun_text_processing.inverse_text_normalization.id.graph_utils import (
+ DAMO_CHAR,
+ DAMO_SIGMA,
+ GraphFst,
+ delete_space,
+)
from pynini.lib import pynutil
@@ -14,9 +19,9 @@
graph = (
pynutil.delete("name:")
+ delete_space
- + pynutil.delete("\"")
+ + pynutil.delete('"')
+ pynini.closure(DAMO_CHAR - " ", 1)
- + pynutil.delete("\"")
+ + pynutil.delete('"')
)
- graph = graph @ pynini.cdrewrite(pynini.cross(u"\u00A0", " "), "", "", DAMO_SIGMA)
+ graph = graph @ pynini.cdrewrite(pynini.cross("\u00A0", " "), "", "", DAMO_SIGMA)
self.fst = graph.optimize()
--
Gitblit v1.9.1