# Djraemon
# 2024-10-21 a76f15c78527edf47a68dd67e2c4d894bc252398
from fun_text_processing.text_normalization.zh.graph_utils import FUN_NOT_QUOTE, GraphFst
from pynini.lib import pynutil
 
 
class Char(GraphFst):
    """
    Verbalizer graph for "char" tokens: drops the serialized field wrapper and
    keeps only the quoted payload.
        name: "你" -> 你

    Args:
        deterministic: forwarded unchanged to the GraphFst constructor.
        lm: accepted for signature compatibility; not read in this constructor.
    """

    def __init__(self, deterministic: bool = True, lm: bool = False):
        super().__init__(name="char", kind="verbalize", deterministic=deterministic)

        # Delete the opening `name: "` and the closing quote; whatever
        # FUN_NOT_QUOTE accepts in between is emitted as-is.
        # NOTE(review): FUN_NOT_QUOTE presumably matches non-quote characters;
        # confirm its exact definition in graph_utils.
        opening = pynutil.delete('name: "')
        closing = pynutil.delete('"')
        verbalizer = opening + FUN_NOT_QUOTE + closing
        self.fst = verbalizer.optimize()