intel · chensuyue · May 21, 2024 · May 20, 2024 · May 20, 2024 · May 20, 2024
diff --git a/test/3x/torch/quantization/weight_only/test_gptq.py b/test/3x/torch/quantization/weight_only/test_gptq.py
@@ -142,6 +142,30 @@ def test_mse_search(self):
             atol_false > atol_true
         ), "use_mse_search=True doesn't help accuracy, maybe is reasonable, please double check."
 
+    def test_act_order(self):
+        # act_order=False
+        model = copy.deepcopy(self.tiny_gptj)
+        quant_config = GPTQConfig(
+            act_order=False,
+        )
+        model = prepare(model, quant_config)
+        run_fn(model)
+        model = convert(model)
+        out = model(self.example_inputs)[0]
+        atol_false = (out - self.label).amax()
+        # act_order=True
+        model = copy.deepcopy(self.tiny_gptj)
+        quant_config = GPTQConfig(
+            act_order=True,
+        )
+        model = prepare(model, quant_config)
+        run_fn(model)
+        model = convert(model)
+        out = model(self.example_inputs)[0]
+        atol_true = (out - self.label).amax()
+        # compare atol, this case is an ideal case.
+        assert atol_false > atol_true, "act_order=True doesn't help accuracy, maybe is reasonable, please double check."
+
     # def test_layer_wise(self):
     #     model = copy.deepcopy(self.tiny_gptj)
     #     quant_config = GPTQConfig(