| | |
| | | format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s", |
| | | ) |
| | | |
| | | if sv_model_file is None: |
| | | sv_model_file = "{}/damo/speech_paraformer-large-vad-punc-spk_asr_nat-zh-cn/campplus_cn_common.bin".format(get_cache_dir(None)) |
| | | sv_model_file = asr_model_file.replace("model.pb", "campplus_cn_common.bin") |
| | | |
| | | if param_dict is not None: |
| | | hotword_list_or_file = param_dict.get('hotword') |
| | |
| | | |
| | | ncpu = kwargs.get("ncpu", 1) |
| | | torch.set_num_threads(ncpu) |
| | | if param_dict: |
| | | language = param_dict.get("language", None) |
| | | task = param_dict.get("task", "transcribe") |
| | | else: |
| | | language = None |
| | | task = "transcribe" |
| | | if batch_size > 1: |
| | | raise NotImplementedError("batch decoding is not implemented") |
| | | if word_lm_train_config is not None: |
| | |
| | | penalty=penalty, |
| | | nbest=nbest, |
| | | streaming=streaming, |
| | | language=language, |
| | | task=task, |
| | | ) |
| | | logging.info("speech2text_kwargs: {}".format(speech2text_kwargs)) |
| | | speech2text = Speech2TextWhisper(**speech2text_kwargs) |