huggingface · younesbelkada · Apr 23, 2024 · Apr 9, 2024 · Apr 9, 2024 · Apr 22, 2024
diff --git a/src/transformers/modeling_utils.py b/src/transformers/modeling_utils.py
@@ -1160,12 +1160,15 @@ def num_parameters(self, only_trainable: bool = False, exclude_embeddings: bool
                 # For 4bit models, we need to multiply the number of parameters by 2 as half of the parameters are
                 # used for the 4bit quantization (uint8 tensors are stored)
                 if is_loaded_in_4bit and isinstance(param, bnb.nn.Params4bit):
-                    quant_storage = self.hf_quantizer.quantization_config.bnb_4bit_quant_storage
-                    # For compatibility with older PT version - see: https://github.com/huggingface/peft/pull/1635
-                    nb_params = (
-                        quant_storage.itemsize if hasattr(quant_storage, "itemsize") else quant_storage.element_size()
+                    if hasattr(param, "element_size"):
+                        num_bytes = param.element_size()
+                    elif not hasattr(param, "quant_storage"):
+                        num_bytes = 1
+                    else:
+                        num_bytes = param.quant_storage.itemsize
+                    total_numel.append(
+                        param.numel() * 2 * num_bytes
                     )
-                    total_numel.append(param.numel() * 2 * nb_params)
                 else:
                     total_numel.append(param.numel())