From c0aac0aa330a82cf491d9bb462b281343ee5c129 Mon Sep 17 00:00:00 2001 From: Qubitium Date: Wed, 15 Oct 2025 17:35:37 +0000 Subject: [PATCH] safety check before cpp call --- gptqmodel/nn_modules/qlinear/__init__.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/gptqmodel/nn_modules/qlinear/__init__.py b/gptqmodel/nn_modules/qlinear/__init__.py index efe667a4d..20b2d6892 100644 --- a/gptqmodel/nn_modules/qlinear/__init__.py +++ b/gptqmodel/nn_modules/qlinear/__init__.py @@ -554,6 +554,10 @@ def pack_block( assert word_bits == 32, "Only 32-bit packing words supported." if (in_features % word_bits) != 0: raise ValueError("in_features must be divisible by 32") + if (out_features % word_bits) != 0: + raise ValueError( + "pack_block extension requires out_features to be divisible by 32" + ) disable_ext = env_flag("GPTQMODEL_DISABLE_PACK_EXT") force_ext = env_flag("GPTQMODEL_FORCE_PACK_EXT")