zhifu gao
2022-12-12 22f0bd826565dcdeba78771deb32d1e92d500e44
Merge pull request #14 from alibaba-damo-academy/dev

wav
1个文件已修改
6 ■■■■ 已修改文件
funasr/bin/asr_inference_paraformer.py 6 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/bin/asr_inference_paraformer.py
@@ -197,9 +197,9 @@
        # data: (Nsamples,) -> (1, Nsamples)
        # lengths: (1,)
-        if len(speech.size()) < 3:
-            speech = speech.unsqueeze(0).to(getattr(torch, self.dtype))
-            speech_lengths = speech.new_full([1], dtype=torch.long, fill_value=speech.size(1))
+        # if len(speech.size()) < 3:
+        #     speech = speech.unsqueeze(0).to(getattr(torch, self.dtype))
+        #     speech_lengths = speech.new_full([1], dtype=torch.long, fill_value=speech.size(1))
        lfr_factor = max(1, (speech.size()[-1]//80)-1)
        
        batch = {"speech": speech, "speech_lengths": speech_lengths}