[quant] Compute scale and zero point automatically in testing::_quantize #46232

Closed
wants to merge 5 commits into from

Changes from 4 commits
29 changes: 18 additions & 11 deletions test/quantization/test_quantized_op.py
@@ -80,7 +80,9 @@ def qlinear_ref(X_q, X_scale, X_zp, W_q, W_scale, W_zp, b_q, Y_scale, Y_zp):
    )
    if b_q is not None:
        Prod_XqWq_ref += b_q
    Y_q_ref = _quantize(Prod_XqWq_ref, Y_scale / (X_scale * W_scale), Y_zp)
    Y_q_ref, _, _ = _quantize(Prod_XqWq_ref,
                              Y_scale / (X_scale * W_scale),
                              Y_zp)
    return Y_q_ref

"""Computes the output shape given pooling parameters."""
@@ -752,7 +754,7 @@ def test_qadd_relu_same_qparams(self):

        # Add ReLU ground truth
        C = (qA.dequantize() + qB.dequantize()).numpy()
        qC = _quantize(C, scale, zero_point, dtype=np_dtype[dtype])
        qC, _, _ = _quantize(C, scale, zero_point, dtype=np_dtype[dtype])
        qC_hat = add(qA, qB, scale=scale, zero_point=zero_point)
        np.testing.assert_equal(qC, qC_hat.int_repr(),
                                "Quantized addition failed.")
@@ -766,7 +768,8 @@ def test_qadd_relu_same_qparams(self):
        # Add + ReLU ground truth
        Crelu = C.copy()
        Crelu[C < 0] = 0
        qCrelu = _quantize(Crelu, scale, zero_point, dtype=np_dtype[dtype])
        qCrelu, _, _ = _quantize(Crelu, scale, zero_point,
                                 dtype=np_dtype[dtype])
        qCrelu_hat = add_relu(qA, qB, scale=scale, zero_point=zero_point)
        np.testing.assert_equal(qCrelu, qCrelu_hat.int_repr(),
                                "Quantized addition with ReLU failed.")
@@ -807,7 +810,8 @@ def test_qadd_relu_different_qparams(self):

        # Add ground truth
        C = (qA.dequantize() + qB.dequantize()).numpy()
        qC = _quantize(C, scale_C, zero_point_C, dtype=np_dtype[dtype])
        qC, _, _ = _quantize(C, scale_C, zero_point_C,
                             dtype=np_dtype[dtype])
        qC_hat = add(qA, qB, scale=scale_C, zero_point=zero_point_C)
        np.testing.assert_equal(qC, qC_hat.int_repr(),
                                "Quantized addition failed.")
@@ -821,7 +825,8 @@ def test_qadd_relu_different_qparams(self):
        # Add + ReLU ground truth
        Crelu = C.copy()
        Crelu[C < 0] = 0
        qCrelu = _quantize(Crelu, scale_C, zero_point_C, dtype=np_dtype[dtype])
        qCrelu, _, _ = _quantize(Crelu, scale_C, zero_point_C,
                                 dtype=np_dtype[dtype])
        qCrelu_hat = add_relu(qA, qB, scale=scale_C, zero_point=zero_point_C)
        np.testing.assert_equal(qCrelu, qCrelu_hat.int_repr(),
                                "Quantized addition with ReLU failed.")
@@ -852,7 +857,7 @@ def test_qmul_relu_same_qparams(self):

        # mul ReLU ground truth
        C = (qA.dequantize() * qB.dequantize()).numpy()
        qC = _quantize(C, scale, zero_point, dtype=np_dtype[dtype])
        qC, _, _ = _quantize(C, scale, zero_point, dtype=np_dtype[dtype])
        qC_hat = mul(qA, qB, scale=scale, zero_point=zero_point)
        np.testing.assert_equal(qC, qC_hat.int_repr(),
                                "Quantized multiplication failed.")
@@ -866,7 +871,8 @@ def test_qmul_relu_same_qparams(self):
        # mul + ReLU ground truth
        Crelu = C.copy()
        Crelu[C < 0] = 0
        qCrelu = _quantize(Crelu, scale, zero_point, dtype=np_dtype[dtype])
        qCrelu, _, _ = _quantize(Crelu, scale, zero_point,
                                 dtype=np_dtype[dtype])
        qCrelu_hat = mul_relu(qA, qB, scale=scale, zero_point=zero_point)
        np.testing.assert_equal(qCrelu, qCrelu_hat.int_repr(),
                                "Quantized multiplication with ReLU failed.")
@@ -918,7 +924,7 @@ def test_qmul_relu_different_qparams(self):

        # mul ground truth
        C = (qA.dequantize() * qB.dequantize()).numpy()
        qC = _quantize(C, scale_C, zero_point_C, dtype=np_dtype[dtype])
        qC, _, _ = _quantize(C, scale_C, zero_point_C, dtype=np_dtype[dtype])
        qC_hat = mul(qA, qB, scale=scale_C, zero_point=zero_point_C)
        np.testing.assert_equal(qC, qC_hat.int_repr(),
                                "Quantized multiplication failed.")
@@ -932,7 +938,8 @@ def test_qmul_relu_different_qparams(self):
        # mul + ReLU ground truth
        Crelu = C.copy()
        Crelu[C < 0] = 0
        qCrelu = _quantize(Crelu, scale_C, zero_point_C, dtype=np_dtype[dtype])
        qCrelu, _, _ = _quantize(Crelu, scale_C, zero_point_C,
                                 dtype=np_dtype[dtype])
        qCrelu_hat = mul_relu(qA, qB, scale=scale_C, zero_point=zero_point_C)
        np.testing.assert_equal(qCrelu, qCrelu_hat.int_repr(),
                                "Quantized multiplication with ReLU failed.")
@@ -970,7 +977,7 @@ def test_qmul_broadcast(self):

        # mul ground truth
        C = (qA.dequantize() * qB.dequantize()).numpy()
        qC = _quantize(C, scale_C, zero_point_C)
        qC, _, _ = _quantize(C, scale_C, zero_point_C)
        qC_hat = mul(qA, qB, scale=scale_C, zero_point=zero_point_C)
        np.testing.assert_equal(qC, qC_hat.int_repr(),
                                "Quantized multiplication failed.")
@@ -4073,7 +4080,7 @@ def test_qnnpack_add(self, A, zero_point, scale_A, scale_B, scale_C):
        # Add ground truth
        C = (qA.dequantize() + qB.dequantize()).numpy()

        qC = _quantize(C, scale_C, zero_point_C)
        qC, _, _ = _quantize(C, scale_C, zero_point_C)

        qC_qnnp = torch.ops.quantized.add(qA, qB, scale_C, zero_point_C)

15 changes: 13 additions & 2 deletions torch/testing/_internal/common_quantized.py
@@ -21,16 +21,27 @@ def _conv_output_shape(input_size, kernel_size, padding, stride, dilation,
                     * (dilation - 1)) / stride) + 2 * output_padding + 1

# Quantization references
def _quantize(x, scale, zero_point, qmin=None, qmax=None, dtype=np.uint8):
def _quantize(x, scale=None, zero_point=None, qmin=None, qmax=None,
              dtype=np.uint8):
Contributor:
Might be a good idea to update the docstring for this function to reflect the new behavior.

Contributor (Author):
Do you mean the comment here? This is just an internal function for testing -- do we have a docstring?
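For reference, an updated docstring reflecting the new behavior might read roughly as follows; this is only an editorial sketch of possible wording, not text from the PR:

    """Quantizes a numpy array to the given integer dtype.

    If scale and/or zero_point are None, they are inferred from the value
    range of x (always including 0) and the qmin/qmax limits of dtype,
    following a simple min-max scheme.

    Returns a tuple (qx, scale, zero_point) so callers can recover the
    quantization parameters when they were computed internally.
    """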

"""Quantizes a numpy array."""
if qmin is None:
qmin = np.iinfo(dtype).min
if qmax is None:
qmax = np.iinfo(dtype).max
if scale is None:
fmin = min(x.min().item(), 0)
fmax = max(x.max().item(), 0)
if fmin == fmax:
scale = 1.0
else:
scale = (fmax - fmin) / (qmax - qmin)
if zero_point is None:
zero_point = int(round(qmin - fmin / scale))
zero_point = np.clip(zero_point, qmin, qmax)
qx = np.round(x / scale + zero_point).astype(np.int64)
qx = np.clip(qx, qmin, qmax)
qx = qx.astype(dtype)
return qx
return qx, scale, zero_point
Contributor:
Are we actually using the returned scale and zero_point anywhere in this PR?

Contributor (Author):
I only needed it in one case -- this is optional, but because the current function returns only the int_repr of x, it loses the information about the scale and zero_point, especially when they are inferred internally in this function.
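To illustrate the point above, here is a minimal usage sketch (not part of the PR) of why the returned scale and zero_point matter when they are inferred inside _quantize; the input array X below is hypothetical, and the import assumes this PR's three-value return:

import numpy as np
from torch.testing._internal.common_quantized import _quantize, _dequantize

# Hypothetical float input; scale and zero_point are deliberately omitted
# so that _quantize infers them from the data range.
X = np.random.randn(4, 4).astype(np.float32)

# With this change, _quantize returns the inferred parameters alongside qX.
qX, scale, zero_point = _quantize(X)

# The int_repr alone cannot be mapped back to float values; the returned
# scale and zero_point make the round trip possible.
X_hat = _dequantize(qX, scale, zero_point)
assert np.allclose(X, X_hat, atol=scale)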



def _dequantize(qx, scale, zero_point):