speech_asr
2023-04-20 c452b2a3c77059b7bc6cfbc8d480eac15cf38095
update
1个文件已修改
35 ■■■■ 已修改文件
funasr/utils/build_asr_model.py 35 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/utils/build_asr_model.py
@@ -253,7 +253,34 @@
        odim=vocab_size, encoder_output_size=encoder.output_size(), **args.ctc_conf
    )
    if args.model == "asr":
        model
    if args.model in ["asr", "mfcca"]:
        model_class = model_choices.get_class(args.model)
        model = model_class(
            vocab_size=vocab_size,
            frontend=frontend,
            specaug=specaug,
            normalize=normalize,
            encoder=encoder,
            decoder=decoder,
            ctc=ctc,
            token_list=token_list,
            **args.model_conf,
        )
    elif args.model == "paraformer":
        # predictor
        predictor_class = predictor_choices.get_class(args.predictor)
        predictor = predictor_class(**args.predictor_conf)
        model_class = model_choices.get_class(args.model)
        model = model_class(
            vocab_size=vocab_size,
            frontend=frontend,
            specaug=specaug,
            normalize=normalize,
            encoder=encoder,
            decoder=decoder,
            ctc=ctc,
            token_list=token_list,
            predictor=predictor,
            **args.model_conf,
        )
    elif