diff --git a/gptqmodel/nn_modules/qlinear/__init__.py b/gptqmodel/nn_modules/qlinear/__init__.py index efe667a4d..20b2d6892 100644 --- a/gptqmodel/nn_modules/qlinear/__init__.py +++ b/gptqmodel/nn_modules/qlinear/__init__.py @@ -554,6 +554,10 @@ def pack_block( assert word_bits == 32, "Only 32-bit packing words supported." if (in_features % word_bits) != 0: raise ValueError("in_features must be divisible by 32") + if (out_features % word_bits) != 0: + raise ValueError( + "pack_block extension requires out_features to be divisible by 32" + ) disable_ext = env_flag("GPTQMODEL_DISABLE_PACK_EXT") force_ext = env_flag("GPTQMODEL_FORCE_PACK_EXT")