游雁
2024-01-13 bdfd27b9e96bd55c449953bb577e1d4deeaf11c9
funasr/models/scama/sanm_encoder.py
@@ -30,7 +30,7 @@
from funasr.models.ctc.ctc import CTC
from funasr.utils.register import register_class, registry_tables
from funasr.register import tables
class EncoderLayerSANM(nn.Module):
    def __init__(
@@ -154,7 +154,7 @@
        return x, cache
@register_class("encoder_classes", "SANMEncoderChunkOpt")
@tables.register("encoder_classes", "SANMEncoderChunkOpt")
class SANMEncoderChunkOpt(nn.Module):
    """
    Author: Speech Lab of DAMO Academy, Alibaba Group
@@ -423,7 +423,9 @@
                      xs_pad: torch.Tensor,
                      ilens: torch.Tensor,
                      cache: dict = None,
                      **kwargs,
                      ):
        is_final = kwargs.get("is_final", False)
        xs_pad *= self.output_size() ** 0.5
        if self.embed is None:
            xs_pad = xs_pad