runtime/python/onnxruntime/funasr_onnx/sensevoice_bin.py
@@ -183,8 +183,10 @@ # ctc_logits = torch.from_numpy(ctc_logits).float() # support batch_size=1 only currently x = ctc_logits[b, : encoder_out_lens[b].item(), :] yseq = x.argmax(dim=-1) yseq = np.unique(yseq) yseq = np.argmax(x, axis=-1) # Use np.diff and np.where instead of torch.unique_consecutive. mask = np.concatenate(([True], np.diff(yseq) != 0)) yseq = yseq[mask] mask = yseq != self.blank_id token_int = yseq[mask].tolist()