From c1e365fea09aafda387cac12fdff43d28c598979 Mon Sep 17 00:00:00 2001
From: BienBoy <92378515+BienBoy@users.noreply.github.com>
Date: Sat, 01 Feb 2025 23:29:34 +0800
Subject: [PATCH] fix: resolve unexpected 'out of memory' issue in multi-GPU setup (#2373)
---
runtime/onnxruntime/src/punc-model.cpp | 4 +++-
1 file changed, 3 insertions(+), 1 deletion(-)
diff --git a/runtime/onnxruntime/src/punc-model.cpp b/runtime/onnxruntime/src/punc-model.cpp
index 54b8d6a..9af03db 100644
--- a/runtime/onnxruntime/src/punc-model.cpp
+++ b/runtime/onnxruntime/src/punc-model.cpp
@@ -14,14 +14,16 @@
}
string punc_model_path;
string punc_config_path;
+ string token_file;
punc_model_path = PathAppend(model_path.at(MODEL_DIR), MODEL_NAME);
if(model_path.find(QUANTIZE) != model_path.end() && model_path.at(QUANTIZE) == "true"){
punc_model_path = PathAppend(model_path.at(MODEL_DIR), QUANT_MODEL_NAME);
}
punc_config_path = PathAppend(model_path.at(MODEL_DIR), PUNC_CONFIG_NAME);
+ token_file = PathAppend(model_path.at(MODEL_DIR), TOKEN_PATH);
- mm->InitPunc(punc_model_path, punc_config_path, thread_num);
+ mm->InitPunc(punc_model_path, punc_config_path, token_file, thread_num);
return mm;
}
--
Gitblit v1.9.1