diff --git a/intel_extension_for_transformers/transformers/modeling/modeling_auto.py b/intel_extension_for_transformers/transformers/modeling/modeling_auto.py index e52154e6b0a..a56f0645376 100644 --- a/intel_extension_for_transformers/transformers/modeling/modeling_auto.py +++ b/intel_extension_for_transformers/transformers/modeling/modeling_auto.py @@ -322,6 +322,7 @@ class _BaseQBitsAutoModelClass: "whisper", "qwen2", "gemma", + "tinyllama", ] model_type_list_for_gptq = [