jaluik
2024-01-09 27e8ba254adbe9f0df50b4969c5d2e66e0c7c0de
funasr/datasets/small_datasets/preprocessor.py
@@ -361,7 +361,6 @@
                    tokens = seg_tokenize(tokens, self.seg_dict)
            else:
                tokens = self.tokenizer.text2tokens(text)
            text_ints = self.token_id_converter.tokens2ids(tokens)
            data[self.text_name] = np.array(text_ints, dtype=np.int64)
        return data