From 3a4281f4959534b1bf5d01acf0085f4f8e6f2ec8 Mon Sep 17 00:00:00 2001
From: wuhongsheng <664116298@qq.com>
Date: 星期五, 05 七月 2024 00:55:32 +0800
Subject: [PATCH] 优化speakid和语句匹配逻辑,部分解决speakid不从0递增问题 (#1870)
---
fun_text_processing/text_normalization/ru/verbalizers/time.py | 24 ++++++++++++++++--------
1 files changed, 16 insertions(+), 8 deletions(-)
diff --git a/fun_text_processing/text_normalization/ru/verbalizers/time.py b/fun_text_processing/text_normalization/ru/verbalizers/time.py
index 55289cc..cdabfac 100644
--- a/fun_text_processing/text_normalization/ru/verbalizers/time.py
+++ b/fun_text_processing/text_normalization/ru/verbalizers/time.py
@@ -1,7 +1,10 @@
-
-
import pynini
-from fun_text_processing.text_normalization.en.graph_utils import DAMO_NOT_QUOTE, GraphFst, delete_space, insert_space
+from fun_text_processing.text_normalization.en.graph_utils import (
+ DAMO_NOT_QUOTE,
+ GraphFst,
+ delete_space,
+ insert_space,
+)
from pynini.lib import pynutil
@@ -21,20 +24,25 @@
hour = (
pynutil.delete("hours:")
+ delete_space
- + pynutil.delete("\"")
+ + pynutil.delete('"')
+ pynini.closure(DAMO_NOT_QUOTE, 1)
- + pynutil.delete("\"")
+ + pynutil.delete('"')
)
minutes = (
pynutil.delete("minutes:")
+ delete_space
- + pynutil.delete("\"")
+ + pynutil.delete('"')
+ pynini.closure(DAMO_NOT_QUOTE, 1)
- + pynutil.delete("\"")
+ + pynutil.delete('"')
)
self.graph = (
- hour + delete_space + insert_space + minutes + delete_space + pynutil.delete("preserve_order: true")
+ hour
+ + delete_space
+ + insert_space
+ + minutes
+ + delete_space
+ + pynutil.delete("preserve_order: true")
)
self.graph |= hour + delete_space
self.graph |= minutes + delete_space + insert_space + hour + delete_space
--
Gitblit v1.9.1