mengzhe.cmz
2023-07-18 b6b63936c7f4320b30b5f907514f6e8d39ed7239
egs/wenetspeech/conformer/local/process_opus.py
@@ -65,8 +65,8 @@
            start = int(start_time_list[i] * sample_rate)
            end = int(end_time_list[i] * sample_rate)
            target_audio = waveform[:, start:end].transpose(0, 1).contiguous()
            target_audio.export(seg_wav_path, format="wav")
            target_audio = waveform[:, start:end]
            torchaudio.save(seg_wav_path, target_audio, sample_rate)
            fout.write("{} {}\n".format(utt_id, seg_wav_path))
            if i % step == 0: