From ef1d7b3f12535d73bf9046085d14d192c54cf7da Mon Sep 17 00:00:00 2001
From: Yuekai Zhang <zhangyuekai@foxmail.com>
Date: Tue, 12 Nov 2024 17:23:51 +0800
Subject: [PATCH] Merge pull request #2206 from yijinsheng/triton_gpu

---
 runtime/triton_gpu/model_repo_paraformer_large_offline/scoring/1/model.py |    6 +++---
 1 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/runtime/triton_gpu/model_repo_paraformer_large_offline/scoring/1/model.py b/runtime/triton_gpu/model_repo_paraformer_large_offline/scoring/1/model.py
index d582e50..6f7e720 100644
--- a/runtime/triton_gpu/model_repo_paraformer_large_offline/scoring/1/model.py
+++ b/runtime/triton_gpu/model_repo_paraformer_large_offline/scoring/1/model.py
@@ -74,8 +74,8 @@
         load lang_char.txt
         """
         with open(str(vocab_file), "rb") as f:
-            config = yaml.load(f, Loader=yaml.Loader)
-        return config["token_list"]
+            vocab_list = json.load(f, encoding='utf-8')
+        return vocab_list
 
     def execute(self, requests):
         """`execute` must be implemented in every Python model. `execute`
@@ -142,7 +142,7 @@
         ]
         responses = []
         for i in range(total_seq):
-            sents = np.array(hyps[i : i + 1])
+            sents = np.array(hyps[i: i + 1])
             out0 = pb_utils.Tensor("OUTPUT0", sents.astype(self.out0_dtype))
             inference_response = pb_utils.InferenceResponse(output_tensors=[out0])
             responses.append(inference_response)

--
Gitblit v1.9.1