kongdeqiang
10 天以前 28ccfbfc51068a663a80764e14074df5edf2b5ba
fun_text_processing/inverse_text_normalization/ko/verbalizers/time.py
@@ -1,4 +1,3 @@
import pynini
from fun_text_processing.inverse_text_normalization.ko.graph_utils import (
    DAMO_CHAR,
@@ -20,40 +19,42 @@
    def __init__(self):
        super().__init__(name="time", kind="verbalize")
        add_leading_zero_to_double_digit = (DAMO_DIGIT + DAMO_DIGIT) | (pynutil.insert("0") + DAMO_DIGIT)
        #hour
        add_leading_zero_to_double_digit = (DAMO_DIGIT + DAMO_DIGIT) | (
            pynutil.insert("0") + DAMO_DIGIT
        )
        # hour
        hour = (
            pynutil.delete("hours:")
            + delete_space
            + pynutil.delete("\"")
            + pynutil.delete('"')
            + pynini.closure(DAMO_DIGIT, 1)
            + pynutil.delete("\"")
            + pynutil.delete('"')
        )
        #minute
        # minute
        minute = (
            pynutil.delete("minutes:")
            + delete_space
            + pynutil.delete("\"")
            + pynutil.delete('"')
            + pynini.closure(DAMO_DIGIT, 1)
            + pynutil.delete("\"")
            + pynutil.delete('"')
        )
        #seconds
        # seconds
        second = (
            pynutil.delete("seconds:")
            + delete_space
            + pynutil.delete("\"")
            + pynutil.delete('"')
            + pynini.closure(DAMO_DIGIT, 1)
            + pynutil.delete("\"")
            + pynutil.delete('"')
        )
        suffix = (
            delete_space
            + insert_space
            + pynutil.delete("suffix:")
            + delete_space
            + pynutil.delete("\"")
            + pynutil.delete('"')
            + pynini.closure(DAMO_CHAR - " ", 1)
            + pynutil.delete("\"")
            + pynutil.delete('"')
        )
        optional_suffix = pynini.closure(suffix, 0, 1)
        zone = (
@@ -61,18 +62,31 @@
            + insert_space
            + pynutil.delete("zone:")
            + delete_space
            + pynutil.delete("\"")
            + pynutil.delete('"')
            + pynini.closure(DAMO_CHAR - " ", 1)
            + pynutil.delete("\"")
            + pynutil.delete('"')
        )
        optional_zone = pynini.closure(zone, 0, 1)
        #hms
        graph_hms = (hour @ add_leading_zero_to_double_digit) + delete_space + pynutil.insert(":") + (minute @ add_leading_zero_to_double_digit) + delete_space + pynutil.insert(":") + second
        #hm
        graph_hm = (hour @ add_leading_zero_to_double_digit) + delete_space + pynutil.insert(":") + (minute @ add_leading_zero_to_double_digit)
        graph = ( (graph_hms | graph_hm) + optional_suffix + optional_zone )
        # hms
        graph_hms = (
            (hour @ add_leading_zero_to_double_digit)
            + delete_space
            + pynutil.insert(":")
            + (minute @ add_leading_zero_to_double_digit)
            + delete_space
            + pynutil.insert(":")
            + second
        )
        # hm
        graph_hm = (
            (hour @ add_leading_zero_to_double_digit)
            + delete_space
            + pynutil.insert(":")
            + (minute @ add_leading_zero_to_double_digit)
        )
        graph = (graph_hms | graph_hm) + optional_suffix + optional_zone
        delete_tokens = self.delete_tokens(graph)
        self.fst = delete_tokens.optimize()