游雁
2024-10-31 e6f58e7bc74a2dc4b371a4045b1a8d86e39333bb
funasr/tokenizer/sentencepiece_tokenizer.py
@@ -49,3 +49,9 @@
    def get_vocab_size(self):
        return self.sp.GetPieceSize()
    def ids2tokens(self, *args, **kwargs):
        return self.decode(*args, **kwargs)
    def tokens2ids(self, *args, **kwargs):
        return self.encode(*args, **kwargs)