From 65676c0aaefacff0dfbfb7e1785dda516460d9eb Mon Sep 17 00:00:00 2001
From: Yabin Li <wucong.lyb@alibaba-inc.com>
Date: Mon, 18 Dec 2023 09:39:47 +0800
Subject: [PATCH] Update readme.md
---
funasr/tokenizer/char_tokenizer.py | 6 ++----
1 file changed, 2 insertions(+), 4 deletions(-)
diff --git a/funasr/tokenizer/char_tokenizer.py b/funasr/tokenizer/char_tokenizer.py
index 80528a2..6c9a5a5 100644
--- a/funasr/tokenizer/char_tokenizer.py
+++ b/funasr/tokenizer/char_tokenizer.py
@@ -6,17 +6,15 @@
from funasr.tokenizer.abs_tokenizer import AbsTokenizer
-from funasr.tokenizer.abs_tokenizer import BaseTokenizer
-class CharTokenizer(BaseTokenizer):
+
+class CharTokenizer(AbsTokenizer):
def __init__(
self,
non_linguistic_symbols: Union[Path, str, Iterable[str]] = None,
space_symbol: str = "<space>",
remove_non_linguistic_symbols: bool = False,
- **kwargs,
):
- super().__init__(**kwargs)
self.space_symbol = space_symbol
if non_linguistic_symbols is None:
self.non_linguistic_symbols = set()
--
Gitblit v1.9.1