python/FunASR-XL.git

File was renamed from funasr/punctuation/espnet_model.py
			@@ -1,3 +1,9 @@
			from abc import ABC
			from abc import abstractmethod
			from typing import Tuple

			import torch

			from typing import Dict
			from typing import Optional
			from typing import Tuple
			@@ -7,12 +13,33 @@
			from typeguard import check_argument_types

			from funasr.modules.nets_utils import make_pad_mask
			from funasr.punctuation.abs_model import AbsPunctuation
			from funasr.torch_utils.device_funcs import force_gatherable
			from funasr.train.abs_espnet_model import AbsESPnetModel

			from funasr.modules.scorers.scorer_interface import BatchScorerInterface

			class ESPnetPunctuationModel(AbsESPnetModel):

			class AbsPunctuation(torch.nn.Module, BatchScorerInterface, ABC):
			"""The abstract class

			To share the loss calculation way among different models,
			We uses delegate pattern here:
			The instance of this class should be passed to "LanguageModel"

			This "model" is one of mediator objects for "Task" class.

			"""

			@abstractmethod
			def forward(self, input: torch.Tensor, hidden: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor]:
			raise NotImplementedError

			@abstractmethod
			def with_vad(self) -> bool:
			raise NotImplementedError


			class PunctuationModel(AbsESPnetModel):

			def __init__(self, punc_model: AbsPunctuation, vocab_size: int, ignore_id: int = 0, punc_weight: list = None):
			assert check_argument_types()
			@@ -75,7 +102,8 @@
			return nll, text_lengths
			else:
			self.punc_weight = self.punc_weight.to(punc.device)
			nll = F.cross_entropy(y.view(-1, y.shape[-1]), punc.view(-1), self.punc_weight, reduction="none", ignore_index=self.ignore_id)
			nll = F.cross_entropy(y.view(-1, y.shape[-1]), punc.view(-1), self.punc_weight, reduction="none",
			ignore_index=self.ignore_id)
			# nll: (BxL,) -> (BxL,)
			if max_length is None:
			nll.masked_fill_(make_pad_mask(text_lengths).to(nll.device).view(-1), 0.0)