游雁
2023-03-13 fc08b62d05723cdc1ce021bb8ba044ca014fb1f7
funasr/datasets/iterable_dataset.py
@@ -244,10 +244,14 @@
                        array = torchaudio.transforms.Resample(orig_freq=audio_fs,
                                                               new_freq=model_fs)(array)
                        array = array.numpy()
                if self.mc:
                    data[name] = array.transpose(0, 1)
                if _type == "sound":
                    if self.mc:
                        data[name] = array.transpose((1, 0))
                    else:
                        data[name] = array[0]
                else:
                    data[name] = array[0]
                    data[name] = array
                if self.preprocess is not None:
                    data = self.preprocess(uid, data)
@@ -350,7 +354,7 @@
                            array = array.numpy()
                    if _type == "sound":
                        if self.mc:
                            data[name] = array.transpose(0, 1)
                            data[name] = array.transpose((1, 0))
                        else:
                            data[name] = array[0]
                    else: