
Add Docstring for TF 3x API and Torch 3x Mixed Precision #1944


Merged 9 commits on Jul 25, 2024
4 changes: 3 additions & 1 deletion .azure-pipelines/scripts/codeScan/pydocstyle/scan_path.txt
@@ -22,4 +22,6 @@
/neural_compressor/torch/export
/neural_compressor/common
/neural_compressor/torch/algorithms/weight_only
/neural_compressor/torch/algorithms/layer_wise
/neural_compressor/torch/algorithms/layer_wise
/neural_compressor/torch/algorithms/mixed_precision
/neural_compressor/tensorflow
33 changes: 24 additions & 9 deletions docs/source/3x/TensorFlow.md
@@ -2,12 +2,16 @@ TensorFlow
===============


1. [Introduction](#introduction)
2. [API for TensorFlow](#api-for-tensorflow)
3. [Support Matrix](#support-matrix)
3.1 [Quantization Scheme](#quantization-scheme)
3.2 [Quantization Approaches](#quantization-approaches)
3.3 [Backend and Device](#backend-and-device)
- [TensorFlow](#tensorflow)
- [Introduction](#introduction)
- [API for TensorFlow](#api-for-tensorflow)
- [Support Matrix](#support-matrix)
- [Quantization Scheme](#quantization-scheme)
- [Quantization Approaches](#quantization-approaches)
- [Post Training Static Quantization](#post-training-static-quantization)
- [Smooth Quantization](#smooth-quantization)
- [Mixed Precision](#mixed-precision)
- [Backend and Device](#backend-and-device)

## Introduction

@@ -152,9 +156,16 @@ The supported Quantization methods for TensorFlow and Keras are listed below:
<td align="center"><a href="https://github.com/tensorflow/tensorflow">TensorFlow</a>/<a href="https://github.com/Intel-tensorflow/tensorflow">Intel TensorFlow</a></td>
</tr>
<tr>
<td rowspan="2" align="center">Smooth Quantization(SQ)</td>
<td rowspan="2" align="center">weights</td>
<td rowspan="2" align="center">calibration</td>
<td rowspan="1" align="center">Smooth Quantization(SQ)</td>
<td rowspan="1" align="center">weights</td>
<td rowspan="1" align="center">calibration</td>
<td align="center">Tensorflow</td>
<td align="center"><a href="https://github.com/tensorflow/tensorflow">TensorFlow</a>/<a href="https://github.com/Intel-tensorflow/tensorflow">Intel TensorFlow</a></td>
</tr>
<tr>
<td rowspan="1" align="center">Mixed Precision(MP)</td>
<td rowspan="1" align="center">weights and activations</td>
<td rowspan="1" align="center">NA</td>
<td align="center">Tensorflow</td>
<td align="center"><a href="https://github.com/tensorflow/tensorflow">TensorFlow</a>/<a href="https://github.com/Intel-tensorflow/tensorflow">Intel TensorFlow</a></td>
</tr>
@@ -175,6 +186,10 @@ Smooth Quantization (SQ) is an advanced quantization technique designed to optim

Refer to the [SQ Guide](./TF_SQ.md) for detailed information.

##### Mixed Precision
Mixed Precision (MP) is enabled together with Post Training Static Quantization. When `BF16` is supported on the machine, the matched operators are automatically converted to `BF16`.
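A minimal usage sketch is shown below, assuming the 3.x `StaticQuantConfig`/`quantize_model` entry points of `neural_compressor.tensorflow` and a plain iterable as the calibration dataloader (the exact dataloader contract and the toy model here are illustrative assumptions, not part of this diff):

```python
# Illustrative sketch only, not the documented reference example.
# Post Training Static Quantization with the 3.x TensorFlow API; on
# BF16-capable hardware, matched operators may additionally be converted
# to BF16 by the mixed-precision pass without any extra flag.
import tensorflow as tf
from neural_compressor.tensorflow import StaticQuantConfig, quantize_model

model = tf.keras.Sequential(
    [tf.keras.layers.Dense(10, activation="relu", input_shape=(28,)), tf.keras.layers.Dense(2)]
)
# Toy calibration batches; the real dataloader contract is assumed here.
calib_dataloader = [(tf.random.normal((8, 28)), tf.zeros(8))]

quant_config = StaticQuantConfig()  # default INT8 post-training static quantization
q_model = quantize_model(model, quant_config, calib_dataloader)
```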


#### Backend and Device
Intel(R) Neural Compressor supports TF GPU with [ITEX-XPU](https://github.com/intel/intel-extension-for-tensorflow). The model runs on the GPU automatically when ITEX-XPU is detected as installed.
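As an illustration only (not necessarily the library's actual detection logic), such an installation check could look like:

```python
# Hypothetical sketch: detect whether ITEX (intel_extension_for_tensorflow)
# is installed and pick the device accordingly; Intel(R) Neural Compressor's
# internal check may differ.
import importlib.util

itex_installed = importlib.util.find_spec("intel_extension_for_tensorflow") is not None
device = "gpu" if itex_installed else "cpu"
print(f"Model will run on: {device}")
```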

2 changes: 1 addition & 1 deletion neural_compressor/tensorflow/algorithms/__init__.py
@@ -11,7 +11,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Initialize all algorithms."""

from neural_compressor.tensorflow.algorithms.smoother import SmoothQuant
from neural_compressor.tensorflow.algorithms.static_quant import KerasAdaptor, TensorFlowAdaptor, Tensorflow_ITEXAdaptor
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize classes of smooth quant algorithm."""

from neural_compressor.tensorflow.algorithms.smoother.core import SmoothQuant
from neural_compressor.tensorflow.algorithms.smoother.scaler import (
1 change: 1 addition & 0 deletions neural_compressor/tensorflow/algorithms/smoother/core.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""The core components of sq."""

from typing import Callable, Dict

@@ -11,6 +11,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize classes of static quant algorithm."""

from neural_compressor.tensorflow.algorithms.static_quant.keras import KerasAdaptor
from neural_compressor.tensorflow.algorithms.static_quant.tensorflow import TensorFlowAdaptor, Tensorflow_ITEXAdaptor
7 changes: 4 additions & 3 deletions neural_compressor/tensorflow/algorithms/static_quant/keras.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""The quantization classes for Keras."""

import copy
import json
@@ -373,9 +374,9 @@ def _calibrate(self, model, dataloader=None, calib_interation=None):
"""Apply calibration.

Args:
model (tf.keras.Model): The model inserted with FakeQuant layers for calibration.
model(tf.keras.Model): The model inserted with FakeQuant layers for calibration.
dataloader(object): The calibration dataloader used to load quantization dataset.
iteration(int): The iteration of calibration.
calib_interation(int): The iteration of calibration.
"""
# run eagerly to fetch the numpy min/max
results = {}
@@ -580,9 +581,9 @@ def _one_shot_query(self):

def _get_specified_version_cfg(self, data):
"""Get the configuration for the current runtime.

If there's no matched configuration in the input yaml, we'll
use the `default` field of yaml.

Args:
data (Yaml content): input yaml file.

1 change: 1 addition & 0 deletions neural_compressor/tensorflow/keras/__init__.py
@@ -11,6 +11,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize classes for Keras quantization."""

from neural_compressor.tensorflow.keras.quantization import (
StaticQuantConfig,
1 change: 1 addition & 0 deletions neural_compressor/tensorflow/keras/layers/__init__.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize custom layers for Keras quantization."""

from neural_compressor.tensorflow.keras.layers.conv2d import QConv2D
from neural_compressor.tensorflow.keras.layers.dense import QDense
14 changes: 14 additions & 0 deletions neural_compressor/tensorflow/keras/layers/conv2d.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize custom conv2d layers for Keras quantization."""

import json

@@ -33,6 +34,8 @@
if version1_gte_version2(tf.__version__, "2.16.1"): # pragma: no cover

class QConv2D(BaseConv):
"""The custom quantized Conv2D layer."""

def __init__(
self,
name,
@@ -65,6 +68,7 @@ def __init__(
quant_axis=None,
**kwargs
):
"""Initialize custom quantized Conv2D layer."""
super(QConv2D, self).__init__(
name=name,
rank=2,
@@ -100,6 +104,7 @@ def __init__(
self.quant_axis = quant_axis

def call(self, inputs):
"""The __call__ function of custom quantized Conv2D layer."""
if self.quant_status == "calib" and not isinstance(inputs, tf.keras.KerasTensor):
if self.granularity == "per_tensor":
self.act_min_value = tf.math.reduce_min(inputs)
@@ -168,9 +173,11 @@ def call(self, inputs):

@classmethod
def from_config(cls, config):
"""Deserialize this class from a config dict."""
return cls(**config)

def get_config(self):
"""Serialize this class to a config dict."""
config = super(QConv2D, self).get_config()
config.update(
{
@@ -193,6 +200,8 @@ def get_config(self):
else:

class QConv2D(Conv):
"""The custom quantized Conv2D layer."""

def __init__(
self,
name,
@@ -225,6 +234,7 @@ def __init__(
quant_axis=None,
**kwargs
):
"""Initialize custom quantized Conv2D layer."""
super(QConv2D, self).__init__(
name=name,
rank=2,
@@ -260,6 +270,7 @@ def __init__(
self.quant_axis = quant_axis

def call(self, inputs):
"""The __call__ function of custom quantized Conv2D layer."""
if self.quant_status == "calib":
if self.granularity == "per_tensor":
self.act_min_value = tf.math.reduce_min(inputs)
@@ -328,9 +339,11 @@ def call(self, inputs):

@classmethod
def from_config(cls, config):
"""Deserialize this class from a config dict."""
return cls(**config)

def get_config(self):
"""Serialize this class to a config dict."""
config = super(QConv2D, self).get_config()
config.update(
{
@@ -352,6 +365,7 @@ def get_config(self):


def initialize_int8_conv2d(fp32_layer, q_config):
"""Initialize int8 conv2d."""
kwargs = fp32_layer.get_config()

param_list = [
8 changes: 8 additions & 0 deletions neural_compressor/tensorflow/keras/layers/dense.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize custom dense layers for Keras quantization."""

import json

@@ -25,6 +26,8 @@


class QDense(Dense):
"""The custom quantized Dense layer."""

def __init__(
self,
name,
@@ -51,6 +54,7 @@ def __init__(
quant_axis=None,
**kwargs
):
"""Initialize custom quantized Dense layer."""
super(QDense, self).__init__(
name=name,
units=units,
@@ -79,6 +83,7 @@ def __init__(
self.quant_axis = quant_axis

def call(self, inputs):
"""The __call__ function of custom quantized Dense layer."""
if self.quant_status == "calib" and not (
version1_gte_version2(tf.__version__, "2.16.1") and isinstance(inputs, tf.keras.KerasTensor)
):
@@ -144,9 +149,11 @@ def call(self, inputs):

@classmethod
def from_config(cls, config):
"""Deserialize this class from a config dict."""
return cls(**config)

def get_config(self):
"""Serialize this class to a config dict."""
config = super(QDense, self).get_config()
config.update(
{
@@ -168,6 +175,7 @@ def get_config(self):


def initialize_int8_dense(fp32_layer, q_config):
"""Initialize int8 dense."""
kwargs = fp32_layer.get_config()

param_list = [
15 changes: 15 additions & 0 deletions neural_compressor/tensorflow/keras/layers/depthwise_conv2d.py
@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize custom depthwise conv2d layers for Keras quantization."""

import json

@@ -35,6 +36,8 @@
if version1_gte_version2(tf.__version__, "2.16.1"):

class QDepthwiseConv2D(BaseDepthwiseConv): # pragma: no cover
"""The custom quantized DepthwiseConv2D layer."""

def __init__(
self,
kernel_size,
@@ -65,6 +68,7 @@ def __init__(
quant_axis=None,
**kwargs
):
"""Initialize custom quantized DepthwiseConv2D layer."""
super().__init__(
2,
kernel_size=kernel_size,
@@ -98,6 +102,7 @@ def __init__(
self.quant_axis = quant_axis

def call(self, inputs):
"""The __call__ function of custom quantized DepthwiseConv2D layer."""
if self.quant_status == "calib" and not isinstance(inputs, tf.keras.KerasTensor):
if self.granularity == "per_tensor":
self.act_min_value = tf.math.reduce_min(inputs)
@@ -165,9 +170,11 @@ def call(self, inputs):

@classmethod
def from_config(cls, config):
"""Deserialize this class from a config dict."""
return cls(**config)

def get_config(self):
"""Serialize this class to a config dict."""
config = super(QDepthwiseConv2D, self).get_config()
config.update(
{
@@ -190,6 +197,8 @@ def get_config(self):
else:

class QDepthwiseConv2D(DepthwiseConv):
"""The custom quantized DepthwiseConv2D layer."""

def __init__(
self,
kernel_size,
@@ -220,6 +229,7 @@ def __init__(
quant_axis=None,
**kwargs
):
"""Initialize custom quantized DepthwiseConv2D layer."""
super().__init__(
2,
kernel_size=kernel_size,
@@ -253,6 +263,7 @@ def __init__(
self.quant_axis = quant_axis

def call(self, inputs):
"""The __call__ function of custom quantized DepthwiseConv2D layer."""
if self.quant_status == "calib":
if self.granularity == "per_tensor":
self.act_min_value = tf.math.reduce_min(inputs)
@@ -315,9 +326,11 @@ def call(self, inputs):

@classmethod
def from_config(cls, config):
"""Deserialize this class from a config dict."""
return cls(**config)

def get_config(self):
"""Serialize this class to a config dict."""
config = super(QDepthwiseConv2D, self).get_config()
config.update(
{
@@ -339,6 +352,7 @@ def get_config(self):

@tf_utils.shape_type_conversion
def compute_output_shape(self, input_shape):
"""Compute_output_shape."""
if self.data_format == "channels_first":
rows = input_shape[2]
cols = input_shape[3]
@@ -369,6 +383,7 @@ def compute_output_shape(self, input_shape):


def initialize_int8_depthwise_conv2d(fp32_layer, q_config):
"""Initialize int8 depthwise conv2d."""
kwargs = fp32_layer.get_config()
q_name = fp32_layer.name

@@ -14,6 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Initialize layer initializer functions."""

from neural_compressor.tensorflow.keras.layers.conv2d import initialize_int8_conv2d
from neural_compressor.tensorflow.keras.layers.dense import initialize_int8_dense