Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions gptqmodel/utils/nogil_patcher.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,8 @@

"""Straightforward monkey patch helpers for nogil runtimes."""

import time
import threading
import time

from .safe import ThreadSafe

Expand All @@ -33,8 +33,8 @@ def patch_safetensors_save_file() -> None:

def patch_triton_autotuner() -> None:
try:
from triton.runtime import autotuner as module
import triton
from triton.runtime import autotuner as module
except ImportError:
return

Expand Down
3 changes: 2 additions & 1 deletion gptqmodel/utils/stream.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,15 +6,16 @@
from __future__ import annotations

import threading
from concurrent.futures import Future
from dataclasses import dataclass
from typing import Any, Callable, Dict, Iterable, List, Optional, Tuple

import torch
from concurrent.futures import Future

from .logger import setup_logger
from .threadx import DeviceThreadPool


log = setup_logger()


Expand Down
3 changes: 2 additions & 1 deletion gptqmodel/utils/threadx.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,12 +13,13 @@
import threading
import time
import traceback
from datetime import datetime, timezone
from concurrent.futures import Future
from datetime import datetime, timezone
from typing import Any, Callable, Dict, Iterable, List, Optional, Set, Tuple, Union

import torch


try:
from device_smi import Device # type: ignore
except Exception: # pragma: no cover - defensive: optional dependency may be unavailable
Expand Down
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,11 +3,11 @@
# SPDX-License-Identifier: Apache-2.0
# Contact: qubitium@modelcloud.ai, x.com/qubitium
import os
import re
import subprocess
import sys
from pathlib import Path

import pcre as re
from setuptools import find_packages, setup
from setuptools.command.bdist_wheel import bdist_wheel as _bdist_wheel

Expand Down
2 changes: 1 addition & 1 deletion tests/models/model_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,8 @@

# -- end do not touch

from pathlib import Path # noqa: E402
from enum import Enum # noqa: E402
from pathlib import Path # noqa: E402
from typing import Dict, List # noqa: E402

from logbar import LogBar # noqa: E402
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_act_group_aware.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 1 addition & 1 deletion tests/models/test_apertus.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,9 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest
from gptqmodel.utils.eval import EVAL

from gptqmodel import BACKEND
from gptqmodel.utils.eval import EVAL


class TestApertus(ModelTest):
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_cohere.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_cohere2.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_deci.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_dream.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_falcon.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@

import torch # noqa: E402from tests.model_test import ModelTest
from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 2 additions & 0 deletions tests/models/test_glm.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,10 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


# | Metric | MARLIN |
# |--------------------------------|----------|
# | arc_challenge :: acc,none | 0.5154 |
Expand Down
2 changes: 2 additions & 0 deletions tests/models/test_glm4_moe.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,10 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


class TestGlm4Moe(ModelTest):
NATIVE_MODEL_ID = "/monster/data/model/GLM-4.6/"
DELETE_QUANTIZED_MODEL = False
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_gpt_oss.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_granite.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_hymba.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_ling.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_llama3_2.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 1 addition & 1 deletion tests/models/test_llama3_2_awq.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,9 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest
from gptqmodel.utils.eval import EVAL

from gptqmodel.quantization import FORMAT, METHOD
from gptqmodel.utils.eval import EVAL


# a100:0
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_llama4.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_longllama.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_mimo.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_nemotron_ultra.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 2 additions & 0 deletions tests/models/test_qwen2_5.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,10 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


# | Metric | MARLIN |
# |--------------------------------|----------|
# | arc_challenge :: acc,none | 0.2884 |
Expand Down
2 changes: 1 addition & 1 deletion tests/models/test_qwen2_5_omni.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,9 +6,9 @@

import soundfile as sf
from model_test import ModelTest
from gptqmodel.utils.eval import EVAL

from gptqmodel.models.definitions.qwen2_5_omni import Qwen2_5_OmniGPTQ
from gptqmodel.utils.eval import EVAL


class TestQwen2_5_Omni(ModelTest):
Expand Down
2 changes: 1 addition & 1 deletion tests/models/test_qwen2_5_vl.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,9 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest
from gptqmodel.utils.eval import EVAL

from gptqmodel.models.definitions.qwen2_vl import Qwen2VLQModel
from gptqmodel.utils.eval import EVAL


class TestQwen2_VL(ModelTest):
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_qwen2_moe_quant.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 1 addition & 1 deletion tests/models/test_qwen2_vl.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,9 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest
from gptqmodel.utils.eval import EVAL

from gptqmodel.models.definitions.qwen2_vl import Qwen2VLQModel
from gptqmodel.utils.eval import EVAL


class TestQwen2_VL(ModelTest):
Expand Down
2 changes: 2 additions & 0 deletions tests/models/test_qwen3_moe.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,10 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


# | Metric | MARLIN |
# |--------------------------------|----------|
# | arc_challenge :: acc,none | 0.5094 |
Expand Down
2 changes: 2 additions & 0 deletions tests/models/test_qwen3_next.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,10 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


# | Metric | MARLIN |
# |--------------------------------|----------|
# | arc_challenge :: acc,none | 0.6271 |
Expand Down
1 change: 1 addition & 0 deletions tests/models/test_qwen3_omni.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_seed_oss.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_stablelm.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/models/test_xverse.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
1 change: 1 addition & 0 deletions tests/test_gptqv2.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# Contact: qubitium@modelcloud.ai, x.com/qubitium

from models.model_test import ModelTest

from gptqmodel.utils.eval import EVAL


Expand Down
2 changes: 1 addition & 1 deletion tests/test_lm_head.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,10 +13,10 @@
os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
# -- end do not touch
from models.model_test import ModelTest # noqa: E402
from gptqmodel.utils.eval import EVAL # noqa: E402

from gptqmodel import GPTQModel, QuantizeConfig # noqa: E402
from gptqmodel.nn_modules.qlinear import BaseQuantLinear # noqa: E402
from gptqmodel.utils.eval import EVAL # noqa: E402


class TestLmHeadLoad(ModelTest):
Expand Down