funasr/frontends/wav_frontend.py
@@ -32,7 +32,6 @@ rescale_line = line_item[3:(len(line_item) - 1)] vars_list = list(rescale_line) continue import pdb;pdb.set_trace() means = np.array(means_list).astype(np.float32) vars = np.array(vars_list).astype(np.float32) cmvn = np.array([means, vars]) @@ -76,6 +75,7 @@ LFR_outputs = torch.vstack(LFR_inputs) return LFR_outputs.type(torch.float32) @tables.register("frontend_classes", "wav_frontend") @tables.register("frontend_classes", "WavFrontend") class WavFrontend(nn.Module): """Conventional frontend structure for ASR.