Add compression_lr_multiplier for tf part

openvinotoolkit · Jul 22, 2021 · e2a39be · e2a39be
1 parent e4fbd2d
commit e2a39be
Show file tree

Hide file tree

Showing 20 changed files with 817 additions and 511 deletions.
diff --git a/nncf/common/quantization/structs.py b/nncf/common/quantization/structs.py
@@ -136,7 +136,8 @@ def __init__(self, num_bits: int,
                  mode: QuantizationMode,
                  signedness_to_force: bool,
                  narrow_range: bool,
-                 half_range: bool):
+                 half_range: bool,
+                 compression_lr_multiplier: Optional[float] = None):
         """
         :param num_bits: Bitwidth of the quantization.
         :param mode: The mode of quantization (symmetric or asymmetric).
@@ -147,23 +148,28 @@ def __init__(self, num_bits: int,
             naive case, False if all 2^`num_bits` quantizations should be used.
         :param half_range: If ``True`` effectively only a half of an quantizer range are used.
             False - the full range are used.
+        :param compression_lr_multiplier: Multiplier for gradient values.
         """
         self.num_bits = num_bits
         self.mode = mode
         self.signedness_to_force = signedness_to_force
         self.narrow_range = narrow_range
         self.half_range = half_range
+        self.compression_lr_multiplier = compression_lr_multiplier
 
     def __eq__(self, other: 'QuantizerSpec'):
         return self.__dict__ == other.__dict__
 
     @classmethod
-    def from_config(cls, qconfig: QuantizerConfig, narrow_range: bool, half_range: bool) -> 'QuantizerSpec':
+    def from_config(cls, qconfig: QuantizerConfig,
+                    narrow_range: bool, half_range: bool,
+                    compression_lr_multiplier: Optional[float] = None) -> 'QuantizerSpec':
+        """
+        Creates a quantizer specification from a quantizer configuration.
+
+        :param qconfig: Provides `num_bits`, `mode` and `signedness_to_force`.
+        :param narrow_range: Passed to the constructor unchanged.
+        :param half_range: Passed to the constructor unchanged.
+        :param compression_lr_multiplier: Multiplier for gradient values. Defaults to
+            `None`, matching the constructor, so callers that pass only three
+            arguments keep working.
+        :return: A new instance of `cls`.
+        """
         return cls(qconfig.num_bits,
                    qconfig.mode,
                    qconfig.signedness_to_force,
                    narrow_range,
-                   half_range)
+                   half_range,
+                   compression_lr_multiplier)
 
 
 class QuantizationConstraints:

diff --git a/nncf/tensorflow/functions.py b/nncf/tensorflow/functions.py
@@ -12,6 +12,7 @@
 """
 
 import tensorflow as tf
+from typing import Callable, Optional
 
 
 @tf.function
@@ -24,3 +25,13 @@ def st_threshold(input_):
     def grad(upstream):
         return upstream
     return tf.round(input_), grad
+
+
+def get_id_with_multiplied_grad() -> Callable[[tf.Tensor, tf.Tensor], tf.Tensor]:
+    """
+    Creates an identity operation whose gradient is scaled by a multiplier.
+
+    :return: A function `f(x, grad_multiplier)` that returns `x` unchanged on the
+        forward pass and multiplies the incoming gradient by `grad_multiplier`
+        on the backward pass.
+    """
+    @tf.custom_gradient
+    def id_with_multiplied_grad(x, grad_multiplier):
+        def grad(upstream):
+            # The gradient w.r.t. `x` must carry the upstream gradient, scaled by
+            # the multiplier. The second entry is the gradient reported for
+            # `grad_multiplier` itself.
+            return grad_multiplier * upstream, 0
+        return x, grad
+
+    return id_with_multiplied_grad
diff --git a/nncf/tensorflow/quantization/algorithm.py b/nncf/tensorflow/quantization/algorithm.py
@@ -11,10 +11,7 @@
  limitations under the License.
 """
 from copy import deepcopy
-from typing import Any
-from typing import Dict
-from typing import List
-from typing import Tuple
+from typing import Any, Dict, List, Optional, Tuple
 
 import tensorflow as tf
 
@@ -394,9 +391,11 @@ def _get_quantizer_setup(self, model: tf.keras.Model) -> TFQuantizationSetup:
 
                     half_range = self._get_half_range(qconfig)
                     applied_saturation_fix = applied_saturation_fix or half_range
+                    compression_lr_multiplier = self._get_compression_lr_multiplier()
                     quantizer_spec = TFQuantizerSpec.from_config(qconfig,
                                                                  narrow_range=not half_range,
-                                                                 half_range=half_range)
+                                                                 half_range=half_range,
+                                                                 compression_lr_multiplier=compression_lr_multiplier)
                     target_point = TFLayerWeight(layer_info.layer_name, weight_def.weight_attr_name)
                     qpoint = TFQuantizationPoint(op_name, quantizer_spec, target_point)
                     setup.add_quantization_point(qpoint)
@@ -407,7 +406,9 @@ def _get_quantizer_setup(self, model: tf.keras.Model) -> TFQuantizationSetup:
                 target_node_name = ip.target_node_name
                 input_port_id = ip.input_port_id
                 fake_quantize_name = self._get_fake_quantize_name(target_node_name, input_port_id)
-                quantizer_spec = TFQuantizerSpec.from_config(qp.qconfig, narrow_range=False, half_range=False)
+                compression_lr_multiplier = self._get_compression_lr_multiplier()
+                quantizer_spec = TFQuantizerSpec.from_config(qp.qconfig, narrow_range=False, half_range=False,
+                                                             compression_lr_multiplier=compression_lr_multiplier)
                 fake_quantize_layer = FakeQuantize(
                     quantizer_spec,
                     name=fake_quantize_name)
@@ -565,6 +566,10 @@ def _get_fake_quantize_name(self, node_name: NNCFNodeName, input_port_id: int =
     def _get_quantizer_operation_name(self, layer_name, weight_attr_name):
         return f'{layer_name}_{weight_attr_name}_quantizer'
 
+    def _get_compression_lr_multiplier(self) -> Optional[float]:
+        """Looks up the `compression_lr_multiplier` value for this algorithm in the config."""
+        param_name = 'compression_lr_multiplier'
+        return self.config.get_redefinable_global_param_value_for_algo(param_name, self.name)
+
 
 class QuantizationController(BaseCompressionAlgorithmController):
     def __init__(self, target_model, config, op_names: List[str]):

diff --git a/nncf/tensorflow/quantization/layers.py b/nncf/tensorflow/quantization/layers.py
@@ -14,6 +14,7 @@
 import tensorflow as tf
 
 from nncf.common.quantization.structs import QuantizationMode
+from nncf.tensorflow.functions import get_id_with_multiplied_grad
 from nncf.tensorflow.layers.custom_objects import NNCF_CUSTOM_OBJECTS
 from nncf.tensorflow.layers.custom_objects import NNCF_QUANTIZATION_OPERATONS
 from nncf.tensorflow.layers.operation import InputType
@@ -33,7 +34,12 @@ def __init__(self, config: TFQuantizerSpec, data_format: str ='channels_last', *
 
         self._op_name = f'{self.name}_quantizer'
         self._quantizer = self._create_quantizer(config, self._op_name)
-        self._quantizer_weights = {}
+        self._quantizer_weights_dict = {}
+        self.id_with_multiplied_grad = get_id_with_multiplied_grad()
+        if config.compression_lr_multiplier is None:
+            self.compression_lr_multiplier = 1.
+        else:
+            self.compression_lr_multiplier = float(config.compression_lr_multiplier)
 
     @property
     def num_bits(self):
@@ -79,6 +85,24 @@ def enabled(self):
     def enabled(self, v):
         self._quantizer.enabled = v
 
+    @property
+    def _quantizer_weights(self):
+        """
+        Returns the stored quantizer weights, each passed through
+        `id_with_multiplied_grad` together with `compression_lr_multiplier`.
+
+        A new dictionary is built on every access.
+        """
+        scale_grad = self.id_with_multiplied_grad
+        multiplier = self.compression_lr_multiplier
+        return {name: scale_grad(weight, multiplier)
+                for name, weight in self._quantizer_weights_dict.items()}
+
+    @property
+    def _real_quantizer_weights(self):
+        """Returns a new dictionary with the stored quantizer weights as they are, unwrapped."""
+        stored = self._quantizer_weights_dict
+        return {name: stored[name] for name in stored}
+
+    @_quantizer_weights.setter
+    def _quantizer_weights(self, value):
+        # Store the weights as given; the getter applies the gradient
+        # multiplier wrapper each time it is read.
+        self._quantizer_weights_dict = value
+
     def build(self, input_shape):
         self._quantizer_weights = self._quantizer.build(
             input_shape, InputType.INPUTS, self.name, self)
@@ -91,7 +115,7 @@ def register_hook_pre_quantizer(self, hook):
         return self._quantizer.register_hook_pre_call(hook)
 
     def apply_range_initialization(self, min_values, max_values, min_range=0.1, eps=0.01):
-        self._quantizer.apply_range_initialization(self._quantizer_weights, min_values, max_values, min_range, eps)
+        self._quantizer.apply_range_initialization(self._real_quantizer_weights, min_values, max_values, min_range, eps)
 
     def _create_quantizer(self, qspec: TFQuantizerSpec, op_name: str) -> Quantizer:
         quantizer_cls = NNCF_QUANTIZATION_OPERATONS.get(qspec.mode)

diff --git a/nncf/tensorflow/quantization/quantizers.py b/nncf/tensorflow/quantization/quantizers.py
@@ -36,18 +36,21 @@ def __init__(self, num_bits: int,
                  signedness_to_force: Optional[bool],
                  narrow_range: bool,
                  half_range: bool,
-                 per_channel: bool):
-        super().__init__(num_bits, mode, signedness_to_force, narrow_range, half_range)
+                 per_channel: bool,
+                 compression_lr_multiplier: Optional[float] = None):
+        super().__init__(num_bits, mode, signedness_to_force, narrow_range, half_range, compression_lr_multiplier)
         self.per_channel = per_channel
 
     @classmethod
-    def from_config(cls, qconfig: QuantizerConfig, narrow_range: bool, half_range: bool) -> 'TFQuantizerSpec':
+    def from_config(cls, qconfig: QuantizerConfig, narrow_range: bool, half_range: bool,
+                    compression_lr_multiplier: Optional[float] = None) -> 'TFQuantizerSpec':
+        """
+        Creates a TF quantizer specification from a quantizer configuration.
+
+        :param qconfig: Provides `num_bits`, `mode`, `signedness_to_force` and `per_channel`.
+        :param narrow_range: Passed to the constructor unchanged.
+        :param half_range: Passed to the constructor unchanged.
+        :param compression_lr_multiplier: Multiplier for gradient values; `None` by default.
+        :return: A new instance of `cls`.
+        """
         return cls(qconfig.num_bits,
                    qconfig.mode,
                    qconfig.signedness_to_force,
                    narrow_range,
                    half_range,
-                   qconfig.per_channel)
+                   qconfig.per_channel,
+                   compression_lr_multiplier)
 
     def get_state(self) -> Dict[str, Any]:
         """
@@ -62,7 +65,8 @@ def get_state(self) -> Dict[str, Any]:
             'signedness_to_force': self.signedness_to_force,
             'narrow_range': self.narrow_range,
             'half_range': self.half_range,
-            'per_channel': self.per_channel
+            'per_channel': self.per_channel,
+            'compression_lr_multiplier': self.compression_lr_multiplier
         }
 
     @classmethod
@@ -285,6 +289,7 @@ def __init__(self, name: str, qspec: TFQuantizerSpec):
         self.narrow_range = qspec.narrow_range
         self.signedness_to_force = qspec.signedness_to_force
         self._half_range = qspec.half_range
+        self.compression_lr_multiplier = qspec.compression_lr_multiplier
 
     @property
     def half_range(self):
@@ -389,6 +394,7 @@ def get_config(self):
             'narrow_range': self.narrow_range,
             'half_range': self._half_range,
             'per_channel': self.per_channel,
+            'compression_lr_multiplier': self.compression_lr_multiplier,
         }
         config = {
             'quantizer_spec': qspec_dict,
@@ -404,7 +410,8 @@ def from_config(cls, config):
                                 signedness_to_force=qspec_dict['signedness_to_force'],
                                 narrow_range=qspec_dict['narrow_range'],
                                 half_range=qspec_dict['half_range'],
-                                per_channel=qspec_dict['per_channel'])
+                                per_channel=qspec_dict['per_channel'],
+                                compression_lr_multiplier=qspec_dict['compression_lr_multiplier'])
         name = config['name']
         return cls(name, qspec)
 
@@ -419,6 +426,7 @@ def __init__(self, name: str, qspec: TFQuantizerSpec):
         self.narrow_range = qspec.narrow_range
         self.per_channel = qspec.per_channel
         self._half_range = qspec.half_range
+        self.compression_lr_multiplier = qspec.compression_lr_multiplier
 
     @property
     def half_range(self):
@@ -519,6 +527,7 @@ def get_config(self):
             'narrow_range': self.narrow_range,
             'half_range': self._half_range,
             'per_channel': self.per_channel,
+            'compression_lr_multiplier': self.compression_lr_multiplier,
         }
         config = {
             'quantizer_spec': qspec_dict,
@@ -534,6 +543,7 @@ def from_config(cls, config):
                                 signedness_to_force=None,
                                 narrow_range=qspec_dict['narrow_range'],
                                 half_range=qspec_dict['half_range'],
-                                per_channel=qspec_dict['per_channel'])
+                                per_channel=qspec_dict['per_channel'],
+                                compression_lr_multiplier=qspec_dict['compression_lr_multiplier'])
         name = config['name']
         return cls(name, qspec)
diff --git a/nncf/torch/quantization/layers.py b/nncf/torch/quantization/layers.py
@@ -59,17 +59,15 @@ def __init__(self, num_bits: int,
                  half_range: bool,
                  scale_shape: Tuple[int, ...],
                  logarithm_scale: bool,
-                 compression_lr_multiplier: float = None):
-        super().__init__(num_bits, mode, signedness_to_force, narrow_range, half_range)
+                 compression_lr_multiplier: Optional[float] = None):
+        super().__init__(num_bits, mode, signedness_to_force, narrow_range, half_range, compression_lr_multiplier)
         self.scale_shape = scale_shape
         self.logarithm_scale = logarithm_scale
-        self.compression_lr_multiplier = compression_lr_multiplier
-
 
     @classmethod
     def from_config(cls, qconfig: QuantizerConfig, narrow_range: bool,
                     half_range: bool, scale_shape: Tuple[int],
-                    logarithm_scale: bool, compression_lr_multiplier: float) -> 'PTQuantizerSpec':
+                    logarithm_scale: bool, compression_lr_multiplier: Optional[float] = None) -> 'PTQuantizerSpec':
         return cls(qconfig.num_bits,
                    qconfig.mode,
                    qconfig.signedness_to_force,

diff --git a/tests/common/helpers.py b/tests/common/helpers.py
@@ -10,13 +10,19 @@
  See the License for the specific language governing permissions and
  limitations under the License.
 """
-
-from pathlib import Path
+import numpy as np
 import os
 import shutil
 import subprocess
 import sys
 
+from abc import ABC
+from abc import abstractmethod
+from pathlib import Path
+from typing import Callable, List, TypeVar
+
+TensorType = TypeVar('TensorType')
+
 TEST_ROOT = Path(__file__).absolute().parents[1]
 PROJECT_ROOT = TEST_ROOT.parent.absolute()
 EXAMPLES_DIR = PROJECT_ROOT / 'examples'
@@ -113,3 +119,43 @@ def run_install_checks(venv_path, tmp_path, package_type, test_dir, install_type
                                                install_mode,
                                                package_type),
         check=True, shell=True, cwd=run_path)
+
+
+class BaseTensorListComparator(ABC):
+    """
+    Base class for pairwise comparison of two lists of tensors in tests.
+
+    Subclasses implement `_to_numpy`; every check converts both tensors of a
+    pair with it and delegates the comparison to `numpy.testing`.
+    """
+
+    @classmethod
+    @abstractmethod
+    def _to_numpy(cls, tensor: TensorType) -> np.ndarray:
+        """Converts a single tensor to a numpy array."""
+
+    @classmethod
+    def _compare_tensor_lists(cls, test: List[TensorType], reference: List[TensorType],
+                              assert_fn: Callable[[np.ndarray, np.ndarray], bool]):
+        """
+        Applies `assert_fn` to every (test, reference) pair after numpy conversion.
+
+        :param test: Tensors under test.
+        :param reference: Reference tensors; must have the same length as `test`.
+        :param assert_fn: Called as `assert_fn(test_array, reference_array)`; its
+            return value is ignored, it is expected to raise on failure.
+        """
+        assert len(test) == len(reference)
+
+        for test_tensor, reference_tensor in zip(test, reference):
+            assert_fn(cls._to_numpy(test_tensor), cls._to_numpy(reference_tensor))
+
+    @classmethod
+    def check_equal(cls, test: List[TensorType], reference: List[TensorType], rtol: float = 1e-1):
+        """
+        Asserts that every pair is close within `rtol`.
+
+        Note that the default tolerance here (1e-1) is looser than the 1e-4
+        default of the other checks.
+        """
+        def assert_close(actual, expected):
+            np.testing.assert_allclose(actual, expected, rtol=rtol)
+
+        cls._compare_tensor_lists(test, reference, assert_close)
+
+    @classmethod
+    def check_not_equal(cls, test: List[TensorType], reference: List[TensorType], rtol: float = 1e-4):
+        """Asserts that, for every pair, the closeness check within `rtol` fails."""
+        def assert_not_close(actual, expected):
+            with np.testing.assert_raises(AssertionError):
+                np.testing.assert_allclose(actual, expected, rtol=rtol)
+
+        cls._compare_tensor_lists(test, reference, assert_not_close)
+
+    @classmethod
+    def check_less(cls, test: List[TensorType], reference: List[TensorType], rtol=1e-4):
+        """Asserts that every pair differs and that `test` is element-wise less than `reference`."""
+        cls.check_not_equal(test, reference, rtol=rtol)
+        cls._compare_tensor_lists(test, reference, np.testing.assert_array_less)
+
+    @classmethod
+    def check_greater(cls, test: List[TensorType], reference: List[TensorType], rtol=1e-4):
+        """
+        Asserts that every pair differs and that the element-wise
+        "`test` less than `reference`" check fails for it.
+        """
+        def assert_not_less(actual, expected):
+            with np.testing.assert_raises(AssertionError):
+                np.testing.assert_array_less(actual, expected)
+
+        cls.check_not_equal(test, reference, rtol=rtol)
+        cls._compare_tensor_lists(test, reference, assert_not_less)