diff --git a/neural_compressor/adaptor/pytorch.py b/neural_compressor/adaptor/pytorch.py index 833d011f858..5984e8150ea 100644 --- a/neural_compressor/adaptor/pytorch.py +++ b/neural_compressor/adaptor/pytorch.py @@ -2231,6 +2231,7 @@ def quantize(self, tune_cfg, model, dataloader, q_func=None): q_model = torch.jit.trace(q_model, example_inputs, strict=False) q_model = torch.jit.freeze(q_model.eval()) else: + q_model = ipex.quantization.convert(q_model) with torch.no_grad(): try: q_model = torch.jit.trace(q_model, example_inputs)