funasr/datasets/llm_datasets_qwenaudio/datasets.py
@@ -66,8 +66,6 @@ def __getitem__(self, index): item = self.index_ds[index] # import pdb; # pdb.set_trace() source = item["source"] data_src = load_audio_text_image_video(source, fs=self.fs) if self.preprocessor_speech: