From 4085b2cfe8abadc73eb26e3640f28bd23174c451 Mon Sep 17 00:00:00 2001 From: ZX-ModelCloud Date: Fri, 7 Nov 2025 07:53:48 +0000 Subject: [PATCH 1/2] Fixed version("triton") crash on torch+xpu Signed-off-by: ZX-ModelCloud --- gptqmodel/utils/nogil_patcher.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/gptqmodel/utils/nogil_patcher.py b/gptqmodel/utils/nogil_patcher.py index e2779f603..4e14b7888 100644 --- a/gptqmodel/utils/nogil_patcher.py +++ b/gptqmodel/utils/nogil_patcher.py @@ -7,6 +7,7 @@ import threading import time +import importlib from .safe import ThreadSafe from importlib.metadata import version @@ -42,7 +43,13 @@ def patch_triton_autotuner() -> None: except ImportError: return - triton_version_str = version("triton") + try: + triton_version_str = version("triton") + except importlib.metadata.PackageNotFoundError: + try: + triton_version_str = version("pytorch_triton_xpu") + except Exception: + raise ValueError("Can't get triton version") try: triton_ver = Version(triton_version_str) From 61a1159d2044a6341ee719466358ff21ca004813 Mon Sep 17 00:00:00 2001 From: ZX-ModelCloud Date: Fri, 7 Nov 2025 08:11:18 +0000 Subject: [PATCH 2/2] format Signed-off-by: ZX-ModelCloud --- gptqmodel/utils/nogil_patcher.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/gptqmodel/utils/nogil_patcher.py b/gptqmodel/utils/nogil_patcher.py index b4585053c..fb313e49e 100644 --- a/gptqmodel/utils/nogil_patcher.py +++ b/gptqmodel/utils/nogil_patcher.py @@ -5,9 +5,9 @@ """Straightforward monkey patch helpers for nogil runtimes.""" +import importlib import threading import time -import importlib from importlib.metadata import version from packaging.version import InvalidVersion, Version @@ -250,4 +250,4 @@ def patched_run(self, *args, **kwargs): autotuner_cls.check_disk_cache = patched_check_disk_cache autotuner_cls._get_config_for_key = _get_config_for_key autotuner_cls.run = patched_run - autotuner_cls._gptqmodel_threadsafe = True \ No newline at end of file + autotuner_cls._gptqmodel_threadsafe = True