speech_asr
2023-03-10 b3af8b7a1a2a9769e3250554d00feddf9ff16154
funasr/models/encoder/sanm_encoder.py
@@ -293,7 +293,7 @@
            position embedded tensor and mask
        """
        masks = (~make_pad_mask(ilens)[:, None, :]).to(xs_pad.device)
        xs_pad *= self.output_size()**0.5
        xs_pad = xs_pad * self.output_size()**0.5
        if self.embed is None:
            xs_pad = xs_pad
        elif (