yhliang
2023-05-11 d788b6d5a61df918b65b6914f87a7482778df5f5
funasr/datasets/large_datasets/utils/tokenize.py
@@ -57,7 +57,7 @@
    length = len(text)
    if 'hw_tag' in data:
        hotword_indxs = sample_hotword(length, **hw_config)
        data[hotword_indxs] = hotword_indxs
        data['hotword_indxs'] = hotword_indxs
        del data['hw_tag']
    for i in range(length):
        x = text[i]