Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions .github/workflows/unit_tests.yml
Original file line number Diff line number Diff line change
Expand Up @@ -205,7 +205,7 @@ jobs:
- list-test-files
if: needs.list-test-files.outputs.torch-files != '[]' || needs.list-test-files.outputs.transformers-files != '[]'
container:
- image: ${{ needs.check-vm.outputs.ip }}:5000/nvidia/cuda:${{ needs.check-vm.outputs.cuda_version }}-ubuntu22.04
+ image: ${{ needs.check-vm.outputs.ip }}:5000/nvidia/cuda:${{ needs.check-vm.outputs.cuda_version }}-ubuntu22.04_0822
options: --device /dev/dri --ipc=host --runtime=nvidia --gpus all
volumes:
- /dev/dri/by-path:/dev/dri/by-path
Expand Down Expand Up @@ -327,7 +327,7 @@ jobs:
- check-vm
runs-on: [ self-hosted, xeon5 ]
container:
- image: ${{ needs.check-vm.outputs.ip }}:5000/nvidia/cuda:${{ needs.check-vm.outputs.cuda_version }}-ubuntu22.04
+ image: ${{ needs.check-vm.outputs.ip }}:5000/nvidia/cuda:${{ needs.check-vm.outputs.cuda_version }}-ubuntu22.04_0822
options: --device /dev/dri --ipc=host --runtime=nvidia --gpus all
volumes:
- /dev/dri/by-path:/dev/dri/by-path
Expand Down
4 changes: 3 additions & 1 deletion tests/test_packable.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
from gptqmodel.nn_modules.qlinear.exllama import ExllamaQuantLinear # noqa: E402
from gptqmodel.nn_modules.qlinear.exllama_eora import ExllamaEoraQuantLinear
from gptqmodel.nn_modules.qlinear.exllamav2 import ExllamaV2QuantLinear # noqa: E402
- from gptqmodel.nn_modules.qlinear.ipex import IPEXQuantLinear # noqa: E402
+ from gptqmodel.nn_modules.qlinear.ipex import IPEXQuantLinear, HAS_IPEX # noqa: E402
from gptqmodel.nn_modules.qlinear.marlin import MarlinQuantLinear # noqa: E402
from gptqmodel.nn_modules.qlinear.torch import TorchQuantLinear # noqa: E402
from gptqmodel.nn_modules.qlinear.tritonv2 import TritonV2QuantLinear # noqa: E402
Expand Down Expand Up @@ -59,6 +59,8 @@ def setUpClass(cls):
]
)
def test_post_init(self, backend: BACKEND, equal: Dict[str, bool]):
+ if backend == BACKEND.IPEX and not HAS_IPEX:
+     self.skipTest("IPEX is not available")
model = GPTQModel.load(self.model_id, backend=backend, device_map="auto")
model = convert_gptq_v2_to_v1_format(model, model.quantize_config, self.QLINEAR_DICT[backend])

Expand Down