From eba1fccfa07665ed9cada19cfab6cd342e03112e Mon Sep 17 00:00:00 2001
From: Shi Xian <40013335+R1ckShi@users.noreply.github.com>
Date: Tue, 16 Jan 2024 11:34:04 +0800
Subject: [PATCH] Merge pull request #1250 from alibaba-damo-academy/funasr1.0
---
funasr/models/uniasr/e2e_uni_asr.py | 24 ++++++++++++------------
1 file changed, 12 insertions(+), 12 deletions(-)
diff --git a/funasr/models/uniasr/e2e_uni_asr.py b/funasr/models/uniasr/e2e_uni_asr.py
index de7ed29..390d274 100644
--- a/funasr/models/uniasr/e2e_uni_asr.py
+++ b/funasr/models/uniasr/e2e_uni_asr.py
@@ -541,20 +541,20 @@
speech_lengths: (Batch, )
"""
# with autocast(False):
- # # 1. Extract feats
- # feats, feats_lengths = self._extract_feats(speech, speech_lengths)
+ # # 1. Extract feats
+ # feats, feats_lengths = self._extract_feats(speech, speech_lengths)
#
- # # 2. Data augmentation
- # if self.specaug is not None and self.training:
- # feats, feats_lengths = self.specaug(feats, feats_lengths)
+ # # 2. Data augmentation
+ # if self.specaug is not None and self.training:
+ # feats, feats_lengths = self.specaug(feats, feats_lengths)
#
- # # 3. Normalization for feature: e.g. Global-CMVN, Utterance-CMVN
- # if self.normalize is not None:
- # feats, feats_lengths = self.normalize(feats, feats_lengths)
+ # # 3. Normalization for feature: e.g. Global-CMVN, Utterance-CMVN
+ # if self.normalize is not None:
+ # feats, feats_lengths = self.normalize(feats, feats_lengths)
# Pre-encoder, e.g. used for raw input data
# if self.preencoder is not None:
- # feats, feats_lengths = self.preencoder(feats, feats_lengths)
+ # feats, feats_lengths = self.preencoder(feats, feats_lengths)
encoder_out_rm, encoder_out_lens_rm = self.encoder.overlap_chunk_cls.remove_chunk(
encoder_out,
encoder_out_lens,
@@ -584,9 +584,9 @@
# # Post-encoder, e.g. NLU
# if self.postencoder is not None:
- # encoder_out, encoder_out_lens = self.postencoder(
- # encoder_out, encoder_out_lens
- # )
+ # encoder_out, encoder_out_lens = self.postencoder(
+ # encoder_out, encoder_out_lens
+ # )
assert encoder_out.size(0) == speech.size(0), (
encoder_out.size(),
--
Gitblit v1.9.1