游雁
2023-12-06 e98e10639d90c55a4b7e498d0d87837ad9c4173d
funasr/tokenizer/phoneme_tokenizer.py
@@ -363,6 +363,7 @@
        non_linguistic_symbols: Union[Path, str, Iterable[str]] = None,
        space_symbol: str = "<space>",
        remove_non_linguistic_symbols: bool = False,
        **kwargs,
    ):
        if g2p_type is None:
            self.g2p = split_by_space