|
|
import pynini
|
from fun_text_processing.text_normalization.zh.graph_utils import FUN_NOT_QUOTE, GraphFst
|
from pynini.lib import pynutil
|
|
|
class Whitelist(GraphFst):
|
'''
|
tokens { whitelist: "ATM" } -> A T M
|
'''
|
|
def __init__(self, deterministic: bool = True, lm: bool = False):
|
super().__init__(name="whitelist", kind="verbalize", deterministic=deterministic)
|
remove_erhua = pynutil.delete("erhua: \"") + pynutil.delete("儿") + pynutil.delete("\"")
|
whitelist = pynutil.delete("name: \"") + pynini.closure(FUN_NOT_QUOTE) + pynutil.delete("\"")
|
graph = remove_erhua | whitelist
|
self.fst = graph.optimize()
|