| | |
| | | self.dropout = torch.nn.Dropout(dropout_rate) |
| | | |
| | | assert whisper_model in whisper.available_models() |
| | | _model = whisper.load_model( |
| | | whisper_model, download_root=download_dir, device="cpu" |
| | | ) |
| | | _model = whisper.load_model(whisper_model, download_root=download_dir, device="cpu") |
| | | self.encoders = copy.deepcopy(_model.encoder) |
| | | self.encoders.train() |
| | | |
| | |
| | | if ilens is not None: |
| | | olens = ( |
| | | 1 |
| | | + ( |
| | | ilens |
| | | - self.encoders.conv2.kernel_size[0] |
| | | + 2 * self.encoders.conv2.padding[0] |
| | | ) |
| | | + (ilens - self.encoders.conv2.kernel_size[0] + 2 * self.encoders.conv2.padding[0]) |
| | | // self.encoders.conv2.stride[0] |
| | | ) |
| | | olens = torch.clamp(olens, max=max_pos) |