speech_asr
2023-03-15 f691014c8a97f2ea27dc72c9d3b374bdd05aa6c9
update
1个文件已修改
4 ■■■■ 已修改文件
funasr/models/frontend/wav_frontend.py 4 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/models/frontend/wav_frontend.py
@@ -493,10 +493,10 @@
         for i in range(batch_size):
             waveform_length = input_lengths[i]
             waveform = input[i][:waveform_length]
-            waveform = waveform.unsqueeze(0).numpy()
+            waveform = waveform.numpy()
             mat = eend_ola_feature.stft(waveform, self.frame_length, self.frame_shift)
             mat = eend_ola_feature.transform(mat)
-            mat = mat.splice(mat, context_size=self.lfr_m)
+            mat = eend_ola_feature.splice(mat, context_size=self.lfr_m)
             mat = mat[::self.lfr_n]
             mat = torch.from_numpy(mat)
             feat_length = mat.size(0)