From 3c349ac0531b07239f37b81254f8568ab80e3f6a Mon Sep 17 00:00:00 2001
From: Han Zhang <45134013+holazzer@users.noreply.github.com>
Date: Tue, 18 Mar 2025 11:45:37 +0800
Subject: [PATCH] fix: use converted token_ids for alignment for sensevoice model with timestamp output (#2429)
---
examples/industrial_data_pretraining/fsmn_kws_mt/convert.py | 4 ----
1 file changed, 0 insertions(+), 4 deletions(-)
diff --git a/examples/industrial_data_pretraining/fsmn_kws_mt/convert.py b/examples/industrial_data_pretraining/fsmn_kws_mt/convert.py
index e63e689..a6ef0f8 100644
--- a/examples/industrial_data_pretraining/fsmn_kws_mt/convert.py
+++ b/examples/industrial_data_pretraining/fsmn_kws_mt/convert.py
@@ -49,8 +49,6 @@
copyfile(network_file, os.path.join(model_dir, 'origin.torch.pt'))
model = FsmnKWSMTConvert(
- vocab_size=configs['encoder_conf']['output_dim'],
- vocab_size2=configs['encoder_conf']['output_dim2'],
encoder='FSMNMTConvert',
encoder_conf=configs['encoder_conf'],
ctc_conf=configs['ctc_conf'],
@@ -82,8 +80,6 @@
model_name="convert.torch.pt"
):
model = FsmnKWSMTConvert(
- vocab_size=configs['encoder_conf']['output_dim'],
- vocab_size2=configs['encoder_conf']['output_dim2'],
encoder='FSMNMTConvert',
encoder_conf=configs['encoder_conf'],
ctc_conf=configs['ctc_conf'],
--
Gitblit v1.9.1