wuhongsheng
2024-07-05 3a4281f4959534b1bf5d01acf0085f4f8e6f2ec8
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from fun_text_processing.text_normalization.zh.graph_utils import GraphFst
from fun_text_processing.text_normalization.zh.taggers.cardinal import Cardinal
from pynini.lib import pynutil
 
 
class Fraction(GraphFst):
    """
    tokens { fraction { denominator: "5" numerator: "1" } } -> 五分之一
    """
 
    def __init__(self, deterministic: bool = True, lm: bool = False):
        super().__init__(name="fraction", kind="verbalize", deterministic=deterministic)
 
        denominator = (
            pynutil.delete('denominator: "') + Cardinal().graph_cardinal + pynutil.delete('"')
        )
        numerator = pynutil.delete('numerator: "') + Cardinal().graph_cardinal + pynutil.delete('"')
        graph = denominator + pynutil.delete(" ") + pynutil.insert("分之") + numerator
 
        self.fst = self.delete_tokens(graph).optimize()