From 10e37a721fdd2ecfd8e17f7213688927c29343a1 Mon Sep 17 00:00:00 2001
From: 嘉渊 <wangjiaming.wjm@alibaba-inc.com>
Date: Thu, 27 Apr 2023 17:24:47 +0800
Subject: [PATCH] update
---
funasr/models/frontend/wav_frontend_kaldifeat.py | 12 +++++++-----
1 file changed, 7 insertions(+), 5 deletions(-)
diff --git a/funasr/models/frontend/wav_frontend_kaldifeat.py b/funasr/models/frontend/wav_frontend_kaldifeat.py
index d4e775e..85adbb7 100644
--- a/funasr/models/frontend/wav_frontend_kaldifeat.py
+++ b/funasr/models/frontend/wav_frontend_kaldifeat.py
@@ -6,8 +6,11 @@
import numpy as np
import torch
import torchaudio.compliance.kaldi as kaldi
+from funasr.models.frontend.abs_frontend import AbsFrontend
from typeguard import check_argument_types
from torch.nn.utils.rnn import pad_sequence
+
+
# import kaldifeat
def load_cmvn(cmvn_file):
@@ -32,9 +35,9 @@
means = np.array(means_list).astype(np.float)
vars = np.array(vars_list).astype(np.float)
cmvn = np.array([means, vars])
- cmvn = torch.as_tensor(cmvn)
- return cmvn
-
+ cmvn = torch.as_tensor(cmvn)
+ return cmvn
+
def apply_cmvn(inputs, cmvn_file): # noqa
"""
@@ -72,7 +75,6 @@
LFR_inputs.append(frame)
LFR_outputs = torch.vstack(LFR_inputs)
return LFR_outputs.type(torch.float32)
-
# class WavFrontend_kaldifeat(AbsFrontend):
# """Conventional frontend structure for ASR.
@@ -176,4 +178,4 @@
# feats_pad = pad_sequence(feats,
# batch_first=True,
# padding_value=0.0)
-# return feats_pad, feats_lens
+# return feats_pad, feats_lens
\ No newline at end of file
--
Gitblit v1.9.1