🐛[bugfix] Model : Added automatic selection of the compute type based on the GPU device

2025-01-02 08:32:35 +09:00
parent 7616a11a46
commit 567907fc4d
3 changed files with 12 additions and 60 deletions
--- a/src-python/models/translation/translation_translator.py
+++ b/src-python/models/translation/translation_translator.py
@@ -6,7 +6,7 @@ from .translation_utils import ctranslate2_weights

 import ctranslate2
 import transformers
-from utils import errorLogging
+from utils import errorLogging, getBestComputeType

 import warnings
 warnings.filterwarnings("ignore")
@@ -37,7 +37,7 @@ class Translator():
        weight_path = os_path.join(path, "weights", "ctranslate2", directory_name)
        tokenizer_path = os_path.join(path, "weights", "ctranslate2", directory_name, "tokenizer")

-        compute_type = "int8" if device == "cpu" else "float16"
+        compute_type = getBestComputeType(device, device_index)
        self.ctranslate2_translator = ctranslate2.Translator(
            weight_path,
            device=device,