| | |
| | | # Copyright NeMo (https://github.com/NVIDIA/NeMo). All Rights Reserved. |
| | | # |
| | | # Licensed under the Apache License, Version 2.0 (the "License"); |
| | | # you may not use this file except in compliance with the License. |
| | | # You may obtain a copy of the License at |
| | | # |
| | | # http://www.apache.org/licenses/LICENSE-2.0 |
| | | # |
| | | # Unless required by applicable law or agreed to in writing, software |
| | | # distributed under the License is distributed on an "AS IS" BASIS, |
| | | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| | | # See the License for the specific language governing permissions and |
| | | # limitations under the License. |
| | | |
| | | import pynini |
| | | from fun_text_processing.text_normalization.en.graph_utils import DAMO_NOT_QUOTE, GraphFst, delete_preserve_order |
| | | from fun_text_processing.text_normalization.en.graph_utils import ( |
| | | DAMO_NOT_QUOTE, |
| | | GraphFst, |
| | | delete_preserve_order, |
| | | ) |
| | | from pynini.lib import pynutil |
| | | |
| | | |
| | | class TelephoneFst(GraphFst): |
| | | """ |
| | | Finite state transducer for verbalizing telephone, e.g. |
| | | telephone { country_code: "plus neun und vierzig" number_part: "null eins eins eins null null null" } |
| | | telephone { country_code: "plus neun und vierzig" number_part: "null eins eins eins null null null" } |
| | | -> "plus neun und vierzig null eins eins eins null null null" |
| | | |
| | | Args: |
| | |
| | | def __init__(self, deterministic: bool = True): |
| | | super().__init__(name="telephone", kind="verbalize", deterministic=deterministic) |
| | | |
| | | country_code = pynutil.delete("country_code: \"") + pynini.closure(DAMO_NOT_QUOTE, 1) + pynutil.delete("\"") |
| | | country_code = ( |
| | | pynutil.delete('country_code: "') |
| | | + pynini.closure(DAMO_NOT_QUOTE, 1) |
| | | + pynutil.delete('"') |
| | | ) |
| | | |
| | | number_part = pynutil.delete("number_part: \"") + pynini.closure(DAMO_NOT_QUOTE, 1) + pynutil.delete("\"") |
| | | number_part = ( |
| | | pynutil.delete('number_part: "') |
| | | + pynini.closure(DAMO_NOT_QUOTE, 1) |
| | | + pynutil.delete('"') |
| | | ) |
| | | |
| | | self.graph = country_code + pynini.accep(" ") + number_part |
| | | |