From fce4e1d1b48f23cd8332e60afce3df8d6209a6a7 Mon Sep 17 00:00:00 2001
From: gaochangfeng <54253717+gaochangfeng@users.noreply.github.com>
Date: Thu, 11 Apr 2024 14:59:22 +0800
Subject: [PATCH] SenseVoice对富文本解码的参数 (#1608)
---
funasr/models/campplus/cluster_backend.py | 5 ++---
1 file changed, 2 insertions(+), 3 deletions(-)
diff --git a/funasr/models/campplus/cluster_backend.py b/funasr/models/campplus/cluster_backend.py
index 93d3bce..14fbbe1 100644
--- a/funasr/models/campplus/cluster_backend.py
+++ b/funasr/models/campplus/cluster_backend.py
@@ -10,6 +10,7 @@
import numpy as np
from sklearn.cluster._kmeans import k_means
+from sklearn.cluster import HDBSCAN
class SpectralCluster:
@@ -115,8 +116,6 @@
self.min_samples = min_samples
self.min_cluster_size = min_cluster_size
self.metric = metric
- import hdbscan
- self.hdbscan = hdbscan
def __call__(self, X):
import umap.umap_ as umap
@@ -126,7 +125,7 @@
n_components=min(self.n_components, X.shape[0] - 2),
metric=self.metric,
).fit_transform(X)
- labels = self.hdbscan.HDBSCAN(
+ labels = HDBSCAN(
min_samples=self.min_samples,
min_cluster_size=self.min_cluster_size,
allow_single_cluster=True).fit_predict(umap_X)
--
Gitblit v1.9.1