From c6574bf4f4390a9c0dfdd5aa2c4f39eb85e1557e Mon Sep 17 00:00:00 2001
From: Shi Xian <40013335+R1ckShi@users.noreply.github.com>
Date: Tue, 09 Apr 2024 10:41:11 +0800
Subject: [PATCH] Merge pull request #1596 from wanghuii1/main

---
 funasr/datasets/audio_datasets/preprocessor.py |    9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/funasr/datasets/audio_datasets/preprocessor.py b/funasr/datasets/audio_datasets/preprocessor.py
index a3ba3a5..ab75140 100644
--- a/funasr/datasets/audio_datasets/preprocessor.py
+++ b/funasr/datasets/audio_datasets/preprocessor.py
@@ -26,10 +26,11 @@
 			return waveform
 		speed = random.choice(self.speed_perturb)
 		if speed != 1.0:
-			with torch.no_grad():
-				waveform, _ = torchaudio.sox_effects.apply_effects_tensor(
-					torch.tensor(waveform).view(1, -1), fs, [['speed', str(speed)], ['rate', str(fs)]])
-				waveform = waveform.view(-1)
+			if not isinstance(waveform, torch.Tensor):
+				waveform = torch.tensor(waveform)
+			waveform, _ = torchaudio.sox_effects.apply_effects_tensor(
+				waveform.view(1, -1), fs, [['speed', str(speed)], ['rate', str(fs)]])
+			waveform = waveform.view(-1)
 			
 		return waveform
 

--
Gitblit v1.9.1