游雁
2023-12-27 fddb28f026f7eddd1a23341253256e96cfa0328c
Merge branch 'dev_gzf_funasr2' of github.com:alibaba-damo-academy/FunASR into dev_gzf_funasr2
add
2个文件已添加
5个文件已重命名
1个文件已删除
1个文件已复制
52 ■■■■■ 已修改文件
examples/industrial_data_pretraining/contextual_paraformer/demo.py 12 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
examples/industrial_data_pretraining/contextual_paraformer/infer.sh 2 ●●● 补丁 | 查看 | 原始文档 | blame | 历史
examples/industrial_data_pretraining/neat_contextual_paraformer/demo.py 12 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
examples/industrial_data_pretraining/seaco_paraformer/demo.py 12 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
examples/industrial_data_pretraining/seaco_paraformer/infer.sh 4 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/models/contextual_paraformer/__init__.py 补丁 | 查看 | 原始文档 | blame | 历史
funasr/models/contextual_paraformer/decoder.py 补丁 | 查看 | 原始文档 | blame | 历史
funasr/models/contextual_paraformer/model.py 8 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/models/contextual_paraformer/template.yaml 2 ●●● 补丁 | 查看 | 原始文档 | blame | 历史
examples/industrial_data_pretraining/contextual_paraformer/demo.py
New file
@@ -0,0 +1,12 @@
#!/usr/bin/env python3
# -*- encoding: utf-8 -*-
# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
#  MIT License  (https://opensource.org/licenses/MIT)
from funasr import AutoModel
# Local checkout of the contextual Paraformer model; it must already exist on
# disk (relative to the directory this demo is run from) before the script runs.
model_dir = "../modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404"
model = AutoModel(model=model_dir)

# Run recognition on the example clip bundled with the model, passing two
# hotwords in one string (presumably space-separated -- confirm against the
# AutoModel hotword handling).
# NOTE: "达摩院" (DAMO Academy) is the correct spelling; the earlier "达魔院"
# was a typo, so the hotword did not name the intended term.
res = model(
    input=f"{model_dir}/example/asr_example.wav",
    hotword='达摩院 魔搭',
)
print(res)
examples/industrial_data_pretraining/contextual_paraformer/infer.sh
File was renamed from examples/industrial_data_pretraining/neat_contextual_paraformer/infer.sh
@@ -1,6 +1,6 @@
# download model
local_path_root=./modelscope_models
local_path_root=../modelscope_models
mkdir -p ${local_path_root}
local_path=${local_path_root}/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404
git clone https://www.modelscope.cn/damo/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404.git ${local_path}
examples/industrial_data_pretraining/neat_contextual_paraformer/demo.py
File was deleted
examples/industrial_data_pretraining/seaco_paraformer/demo.py
New file
@@ -0,0 +1,12 @@
#!/usr/bin/env python3
# -*- encoding: utf-8 -*-
# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
#  MIT License  (https://opensource.org/licenses/MIT)
from funasr import AutoModel
# Local model checkout used by this demo; it must already exist on disk
# (relative to the directory this demo is run from) before the script runs.
# NOTE(review): the directory name refers to the contextual Paraformer model,
# not a SeACo-specific one -- confirm this is the directory the SeACo model is
# actually downloaded into.
model_dir = "../modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404"
model = AutoModel(model=model_dir)

# Run recognition on the example clip bundled with the model, passing two
# hotwords in one string (presumably space-separated -- confirm against the
# AutoModel hotword handling).
# NOTE: "达摩院" (DAMO Academy) is the correct spelling; the earlier "达魔院"
# was a typo, so the hotword did not name the intended term.
res = model(
    input=f"{model_dir}/example/asr_example.wav",
    hotword='达摩院 魔搭',
)
print(res)
examples/industrial_data_pretraining/seaco_paraformer/infer.sh
copy from examples/industrial_data_pretraining/neat_contextual_paraformer/infer.sh copy to examples/industrial_data_pretraining/seaco_paraformer/infer.sh
File was copied from examples/industrial_data_pretraining/neat_contextual_paraformer/infer.sh
@@ -1,9 +1,9 @@
# download model
local_path_root=./modelscope_models
local_path_root=../modelscope_models
mkdir -p ${local_path_root}
local_path=${local_path_root}/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404
git clone https://www.modelscope.cn/damo/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404.git ${local_path}
git clone https://www.modelscope.cn/damo/speech_seaco_paraformer_large_asr_nat-zh-cn-16k-common-vocab8404-pytorch.git ${local_path}
python funasr/bin/inference.py \
funasr/models/contextual_paraformer/__init__.py
funasr/models/contextual_paraformer/decoder.py
funasr/models/contextual_paraformer/model.py
File was renamed from funasr/models/neat_contextual_paraformer/model.py
@@ -55,12 +55,12 @@
from funasr.register import tables
@tables.register("model_classes", "NeatContextualParaformer")
class NeatContextualParaformer(Paraformer):
@tables.register("model_classes", "ContextualParaformer")
class ContextualParaformer(Paraformer):
    """
    Author: Speech Lab of DAMO Academy, Alibaba Group
    Paraformer: Fast and Accurate Parallel Transformer for Non-autoregressive End-to-End Speech Recognition
    https://arxiv.org/abs/2206.08317
    FunASR: A Fundamental End-to-End Speech Recognition Toolkit
    https://arxiv.org/abs/2305.11013
    """
    
    def __init__(
funasr/models/contextual_paraformer/template.yaml
File was renamed from funasr/models/neat_contextual_paraformer/template.yaml
@@ -6,7 +6,7 @@
# tables.print()
# network architecture
model: NeatContextualParaformer
model: ContextualParaformer
model_conf:
    ctc_weight: 0.0
    lsm_weight: 0.1