diff --git a/examples/qualcomm/oss_scripts/llama/llama.py b/examples/qualcomm/oss_scripts/llama/llama.py index 33482090b28..99f346eccbc 100755 --- a/examples/qualcomm/oss_scripts/llama/llama.py +++ b/examples/qualcomm/oss_scripts/llama/llama.py @@ -398,7 +398,7 @@ def quantize(self, quant_dtype, args, tokenizer, custom_annotations=()): self.llama_graph_module, self.inputs, strict=True ).module() - if QuantDtype == QuantDtype.use_16a4w_block: + if quant_dtype == QuantDtype.use_16a4w_block: conv_nodes = [ n for n in fx_graph_module.graph.nodes if "conv" in n.name ]