From 7a7ead00bccc3de7b542332f7dcdf84086ab74a9 Mon Sep 17 00:00:00 2001
From: 凌匀 <ailsa.zly@alibaba-inc.com>
Date: Fri, 21 Apr 2023 21:40:11 +0800
Subject: [PATCH] vad bug fix
---
funasr/bin/vad_inference.py | 4 ++--
funasr/models/frontend/wav_frontend.py | 2 +-
2 files changed, 3 insertions(+), 3 deletions(-)
diff --git a/funasr/bin/vad_inference.py b/funasr/bin/vad_inference.py
index 1e19f5f..387b622 100644
--- a/funasr/bin/vad_inference.py
+++ b/funasr/bin/vad_inference.py
@@ -109,7 +109,7 @@
fbanks, fbanks_len = self.frontend.forward_fbank(speech, speech_lengths)
feats, feats_len = self.frontend.forward_lfr_cmvn(fbanks, fbanks_len)
fbanks = to_device(fbanks, device=self.device)
- # feats = to_device(feats, device=self.device)
+ feats = to_device(feats, device=self.device)
feats_len = feats_len.int()
else:
raise Exception("Need to extract feats first, please configure frontend configuration")
@@ -131,7 +131,7 @@
"in_cache": in_cache
}
# a. To device
- batch = to_device(batch, device=self.device)
+ #batch = to_device(batch, device=self.device)
segments_part, in_cache = self.vad_model(**batch)
if segments_part:
for batch_num in range(0, self.batch_size):
diff --git a/funasr/models/frontend/wav_frontend.py b/funasr/models/frontend/wav_frontend.py
index 3661f6b..1dbf490 100644
--- a/funasr/models/frontend/wav_frontend.py
+++ b/funasr/models/frontend/wav_frontend.py
@@ -34,7 +34,7 @@
means = np.array(means_list).astype(np.float)
vars = np.array(vars_list).astype(np.float)
cmvn = np.array([means, vars])
- cmvn = torch.as_tensor(cmvn, dype=torch.float32)
+ cmvn = torch.as_tensor(cmvn, dtype=torch.float32)
return cmvn
--
Gitblit v1.9.1