
[PTQ] Add support of arbitrary batch size for PTQ #2197

Merged · 131 commits · Mar 22, 2024
1ce23c5
draft
kshpv Oct 13, 2023
8184df6
check on Nones
kshpv Oct 13, 2023
2e3f507
update aggregator with keep_dims=True
kshpv Oct 18, 2023
b5d15cd
typhints
kshpv Oct 18, 2023
8cb2391
Merge remote-tracking branch 'remote/develop' into torch_batch_size
kshpv Oct 18, 2023
1034acd
fix OV tests; update collectors
kshpv Oct 19, 2023
8b526c5
fix tests
kshpv Oct 20, 2023
e51bdb8
Merge remote-tracking branch 'remote/develop' into torch_batch_size
kshpv Nov 6, 2023
37684bd
add aggregation axes for OV; comment input check
kshpv Nov 7, 2023
18d931d
add test for OV and Torch
kshpv Nov 8, 2023
605a325
add batch_size param to conformance test
kshpv Nov 9, 2023
fb16b99
hardcode for CI run
kshpv Nov 9, 2023
cd60fa3
hardcode batch size = 10 for calibrate.py
kshpv Nov 10, 2023
f3bda28
Merge remote-tracking branch 'remote/develop' into torch_batch_size
kshpv Dec 18, 2023
cc621ab
merge
kshpv Dec 18, 2023
d2a9b00
update aggregator
kshpv Dec 20, 2023
5ffdf10
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Dec 20, 2023
d95be5d
revert unneseccary changes
kshpv Dec 20, 2023
cd68684
add logging; add torch data for OVEngine
kshpv Dec 20, 2023
4a009f3
refactor method get axes
kshpv Dec 21, 2023
c2659b3
fix OV tests
kshpv Dec 21, 2023
3a13f00
fix Torch tests
kshpv Jan 4, 2024
2347170
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 15, 2024
880073b
logic of warning message inside StatisticsAggregator
kshpv Jan 15, 2024
e9062a5
remove _check_input_data_format in OVEngine
kshpv Jan 15, 2024
8770ca4
get_channel_agnostic_reduction_axes to common
kshpv Jan 15, 2024
9556c49
use get_channel_agnostic_reduction_axes for Torch
kshpv Jan 15, 2024
cb90e77
use get_channel_agnostic_reduction_axes for ONNX
kshpv Jan 15, 2024
d9167e5
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 17, 2024
cd10c57
draft
kshpv Jan 17, 2024
16cc9db
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 17, 2024
11b538a
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 17, 2024
426ec04
fix test
kshpv Jan 18, 2024
21b0963
align reduction shape and aggregation shape
kshpv Jan 18, 2024
e90ca32
get_channel_agnostic_reduction_axes -> get_reduction_axes
kshpv Jan 18, 2024
f078a78
upd get_reduction_aggregation_axes
kshpv Jan 18, 2024
e4c57cd
upd aggregator
kshpv Jan 18, 2024
d226074
fix OV test
kshpv Jan 18, 2024
7d8ecd4
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 18, 2024
f502de5
fix ONNX test
kshpv Jan 18, 2024
83d03cb
tests
kshpv Jan 18, 2024
fbfe587
fix torch tests
kshpv Jan 18, 2024
0ae6ac4
fix tests
kshpv Jan 18, 2024
496339f
common tests
kshpv Jan 18, 2024
bcce584
add docs
kshpv Jan 18, 2024
e5950e0
comment
kshpv Jan 18, 2024
1d9ac7a
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 19, 2024
41f27b5
rollback changes for torch possible impact qat
kshpv Jan 19, 2024
51f3dd9
upd conformance
kshpv Jan 19, 2024
3a8de2f
upd calibrate.py
kshpv Jan 19, 2024
946523d
add get_reduction_aggregation_axes for PTRangeInitCollectorParams
kshpv Jan 19, 2024
1732d70
non returning None for get_reduction_aggregation_axes
kshpv Jan 19, 2024
1e96318
comments
kshpv Jan 19, 2024
03afe91
comments
kshpv Jan 19, 2024
bf792fb
describe comment
kshpv Jan 19, 2024
f98aea2
description x2
kshpv Jan 19, 2024
fbd05f9
description x3
kshpv Jan 19, 2024
e80bab1
apply suggestion
kshpv Jan 23, 2024
9c1648d
comments
kshpv Jan 24, 2024
df8ad03
add default scenario when batch_size=1 or None
kshpv Jan 25, 2024
f4db2bb
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 25, 2024
f4dfd1c
rollback scales changes
kshpv Jan 26, 2024
4a44a1c
fix tests
kshpv Jan 26, 2024
d4bfaca
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 26, 2024
f77f59b
fix OV test
kshpv Jan 26, 2024
43fd729
add warning for model_type=transformer
kshpv Jan 29, 2024
c20f7d3
fix torch test
kshpv Jan 29, 2024
52203f0
fix torch tests
kshpv Jan 29, 2024
9dd02b9
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 29, 2024
48c8426
final fix torch test
kshpv Jan 30, 2024
3fe8a37
comments
kshpv Jan 30, 2024
d228589
comments x2
kshpv Jan 30, 2024
b7de564
comments x3
kshpv Jan 30, 2024
67e4c7d
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 30, 2024
489d603
fix tests after merge
kshpv Jan 30, 2024
3b9fb6f
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 30, 2024
120ee1a
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Jan 31, 2024
1f0cb94
improve test
kshpv Jan 31, 2024
532e8eb
fix test
kshpv Feb 6, 2024
38d71b8
upd fbs method calculations
kshpv Feb 6, 2024
c490362
revert changes with statistics collection
kshpv Feb 7, 2024
b778c0c
updates aggregators, reducers for BC and FBC
kshpv Feb 13, 2024
1a96012
upd torch mean_per_channel
kshpv Feb 14, 2024
2f89913
fix BC
kshpv Feb 14, 2024
f69acbd
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Feb 14, 2024
74594c7
fixes after merge
kshpv Feb 14, 2024
d760caf
Fix BC calculations
kshpv Feb 15, 2024
50ac6b4
revert FBC and BC changes
kshpv Feb 20, 2024
00f7979
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Feb 20, 2024
532ca55
fix merge
kshpv Feb 20, 2024
54f8ca3
fix revert typo
kshpv Feb 20, 2024
7637d4b
fix export of torch model
kshpv Feb 21, 2024
976255f
comments
kshpv Feb 23, 2024
8951e3c
more comments
kshpv Feb 26, 2024
0d72557
make bs=128 for Torch sample
kshpv Feb 26, 2024
0f8a438
fix channel alighnment + comments
kshpv Feb 27, 2024
78d4d6c
comments
kshpv Feb 28, 2024
34c9960
update typehints; revert changes in OV sample and apply to Torch
kshpv Feb 28, 2024
354505a
typo
kshpv Feb 28, 2024
97cb07f
some code improvements
kshpv Feb 28, 2024
2cc8b81
logging
kshpv Feb 28, 2024
e3a3291
remove iterations_number calculation in Aggregator
kshpv Mar 1, 2024
8cb7c60
update tests
kshpv Mar 1, 2024
ae772aa
reaname parameter
kshpv Mar 1, 2024
41c76fe
apply comments
kshpv Mar 1, 2024
321c65a
polishing
kshpv Mar 1, 2024
f19fd71
add test
kshpv Mar 4, 2024
4996333
small fixes
kshpv Mar 4, 2024
5e8bce7
polishing
kshpv Mar 5, 2024
9ba5700
conformance adoption for any batch_size; better logging
kshpv Mar 6, 2024
a0f5fe9
add dynamic_batch_shape option to conformance
kshpv Mar 6, 2024
7562d19
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Mar 6, 2024
ee6c14b
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Mar 7, 2024
deb0b51
polishing test
kshpv Mar 7, 2024
64cbd99
fix calibrate.py
kshpv Mar 7, 2024
6119511
new polishing
kshpv Mar 7, 2024
e010087
remove warnings about bathc_size>1 in aggregator
kshpv Mar 8, 2024
54319cb
add baatch_size logging in quantize_impl()
kshpv Mar 8, 2024
4e90c65
add IF op to batch_size warning metatypes list
kshpv Mar 8, 2024
d04ba75
put logs from minmax to quantize_impl
kshpv Mar 8, 2024
6e54d07
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Mar 8, 2024
6048155
rm typos
kshpv Mar 8, 2024
09783c4
typehints
kshpv Mar 8, 2024
da05b93
revert debug message minmax
kshpv Mar 8, 2024
291110e
typo
kshpv Mar 8, 2024
2676fbd
add model_param is_batch_size_supported to conformance; make all mode…
kshpv Mar 18, 2024
3ae9d28
add example in Readme
kshpv Mar 18, 2024
5efcdb5
comments
kshpv Mar 20, 2024
d8ea324
iterations_number -> stat_subset_size
kshpv Mar 20, 2024
7288924
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Mar 21, 2024
88653aa
Merge remote-tracking branch 'remote/develop' into HEAD
kshpv Mar 21, 2024
31 changes: 22 additions & 9 deletions nncf/common/tensor_statistics/aggregator.py
@@ -45,28 +45,36 @@ def collect_statistics(self, model: TModel, graph: NNCFGraph) -> None:
"""
if not self.statistic_points:
return

collected_statistics_num = 0
model_transformer = factory.ModelTransformerFactory.create(model)

merged_statistics = self._get_merged_statistic_points(self.statistic_points, model, graph)
transformation_layout = self._get_transformation_layout_extra_outputs(merged_statistics)
model_with_outputs = model_transformer.transform(transformation_layout)
engine = factory.EngineFactory.create(model_with_outputs)

batch_size = self.dataset.get_batch_size()
batch_size = 1 if batch_size is None else batch_size
dataset_length = self.dataset.get_length()
dataset_length = dataset_length * batch_size if dataset_length is not None else dataset_length
total = (
min(dataset_length or self.stat_subset_size, self.stat_subset_size)
if self.stat_subset_size is not None
else None
)
for input_data in track(
islice(self.dataset.get_inference_data(), self.stat_subset_size),
total=total,
description="Statistics collection",
):
outputs = engine.infer(input_data)
processed_outputs = self._process_outputs(outputs)
self._register_statistics(processed_outputs, merged_statistics)
with track(total=total, description="Statistics collection") as pbar:
for input_data in islice(self.dataset.get_inference_data(), self.stat_subset_size):
batch_size_to_collect = (
min(total - collected_statistics_num, batch_size) if total is not None else batch_size
)
sliced_input = self._get_sliced_data(input_data, batch_size_to_collect)
outputs = engine.infer(sliced_input)
processed_outputs = self._process_outputs(outputs)
self._register_statistics(processed_outputs, merged_statistics)
collected_statistics_num += batch_size_to_collect
pbar.progress.update(pbar.task, advance=batch_size_to_collect)
if total and collected_statistics_num == total:
break
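The sample-budget arithmetic above can be traced with plain numbers. A minimal standalone sketch (the dataset and engine are stubbed out; all sizes are hypothetical values, not taken from the PR):

```python
from itertools import islice

batch_size = 4            # from dataset.get_batch_size()
dataset_length = 10       # number of batches reported by dataset.get_length()
stat_subset_size = 30     # user-requested number of samples

# Convert batches to samples, then cap by the requested subset size.
total_samples = dataset_length * batch_size                       # 40
total = min(total_samples or stat_subset_size, stat_subset_size)  # 30

collected = 0
for _ in islice(range(dataset_length), stat_subset_size):
    # The last batch is sliced down so that exactly `total` samples are used.
    to_collect = min(total - collected, batch_size)
    collected += to_collect
    if collected == total:
        break

print(collected)  # 30 -- the final batch contributes only 2 of its 4 samples
```

This mirrors why `_get_sliced_data` receives `batch_size_to_collect` rather than the raw batch: without slicing, the loop would overshoot the requested subset size by up to `batch_size - 1` samples.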

def register_statistic_points(self, statistic_points: StatisticPointsContainer) -> None:
"""
@@ -134,3 +142,8 @@ def _process_outputs(outputs: Any) -> Dict[str, NNCFTensor]:
:param outputs: raw model outputs
:return: processed model outputs in Dict[str, NNCFTensor] format
"""

@staticmethod
@abstractmethod
def _get_sliced_data(inputs: Any, end: int) -> Any:
""" """
6 changes: 6 additions & 0 deletions nncf/data/dataset.py
@@ -81,6 +81,12 @@ def get_length(self) -> Optional[int]:
return self._data_source.__len__()
return None

def get_batch_size(self) -> Optional[int]:
""" """
alexsu52 marked this conversation as resolved.
Show resolved Hide resolved
if hasattr(self._data_source, "batch_size"):
return self._data_source.batch_size
return None


class DataProvider(Generic[DataItem, ModelInput]):
def __init__(
61 changes: 14 additions & 47 deletions nncf/experimental/common/tensor_statistics/collectors.py
@@ -12,7 +12,6 @@
from abc import ABC
from abc import abstractmethod
from collections import defaultdict
from collections import deque
from typing import Any, Dict, List, Optional, Set, Tuple, Type, TypeVar, Union

from nncf.common.tensor import TensorType
@@ -129,16 +128,14 @@ def __init__(
"""
:param tensor_processor: Backend-specific tensor processor.
:param aggregation_axes: Axes along which to operate.
Registered statistics are stacked along zero axis,
axes >=1 correspond to received statistic axes shifted left by 1.
:param num_samples: Maximum number of samples to collect. Aggregator
skips tensor registration if tensor registration was called num_samples times before.
Aggregator never skips registration if num_samples is None.
"""

self._tensor_processor = tensor_processor
self._aggregation_axes = (0,) if aggregation_axes is None else aggregation_axes
self._keepdims = False
self._aggregation_axes = (0,) if aggregation_axes is None else (0, *map(lambda x: x + 1, aggregation_axes))
self._keepdims = True
self._num_samples = num_samples
self._collected_samples = 0
self._container = []
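The changed constructor line encodes the new axis convention: registered statistics are stacked along a fresh zeroth (sample) axis, so user-facing aggregation axes are shifted right by one, and axis 0 is always aggregated. A sketch of just that transformation, with concrete tuples:

```python
from typing import Optional, Tuple


def shift_aggregation_axes(aggregation_axes: Optional[Tuple[int, ...]]) -> Tuple[int, ...]:
    # Mirrors the constructor logic: always aggregate over the stacked
    # sample axis (0), and shift every user-supplied axis by one to
    # account for it.
    if aggregation_axes is None:
        return (0,)
    return (0, *map(lambda x: x + 1, aggregation_axes))


print(shift_aggregation_axes(None))    # (0,)
print(shift_aggregation_axes((0, 2)))  # (0, 1, 3)
```

With `keepdims=True` now the default, the aggregated sample axis survives as a singleton dimension until the final squeeze in `_aggregate_impl`.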
@@ -594,20 +591,7 @@ def _aggregate_impl(self):
return self._container.shape


class TensorAggregatorBase(AggregatorBase, ABC):
def __init__(
self,
tensor_processor: NNCFCollectorTensorProcessor,
aggregation_axes: Optional[AggregationAxes] = None,
num_samples: Optional[int] = None,
window_size=None,
):
super().__init__(tensor_processor, aggregation_axes=aggregation_axes, num_samples=num_samples)
self._window_size = window_size
self._container = deque(maxlen=window_size)


class OnlineAggregatorBase(TensorAggregatorBase, ABC):
class OnlineAggregatorBase(AggregatorBase, ABC):
"""
Base class for aggregators which are using aggregation function fn with following property:
fn([x1, x2, x3]) == fn([fn([x1, x2]), x3]) where x1, x2, x3 are samples to aggregate.
@@ -616,26 +600,14 @@ class OnlineAggregatorBase(TensorAggregatorBase, ABC):
"""

def _register_reduced_input_impl(self, x: NNCFTensor) -> None:
online_aggregation_axes = tuple(dim - 1 for dim in self._aggregation_axes if dim != 0)
if online_aggregation_axes:
reduced = self._aggregation_fn(x, axis=online_aggregation_axes, keepdims=self._keepdims)
else:
reduced = x
if 0 in self._aggregation_axes:
if self._container:
reduced = self._aggregation_fn(
self._tensor_processor.stack([reduced, self._container]), axis=0, keepdims=False
)
self._container = reduced
else:
self._container.append(reduced)
stacked_tensors = self._tensor_processor.stack([x, *self._container])
aggregated = self._aggregation_fn(stacked_tensors, axis=self._aggregation_axes, keepdims=self._keepdims)
squeezed = self._tensor_processor.squeeze(aggregated, 0)
self._container = [squeezed]

def _aggregate_impl(self) -> NNCFTensor:
if 0 in self._aggregation_axes:
if self._keepdims:
return self._tensor_processor.stack([self._container]).tensor
return self._container.tensor
return self._tensor_processor.stack(self._container).tensor
assert len(self._container) == 1
return self._container[0].tensor
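The online rewrite works only because the aggregation function satisfies `fn([x1, x2, x3]) == fn([fn([x1, x2]), x3])`, so the running result can be folded back into a one-element container after every sample. A NumPy demonstration of the stack–aggregate–squeeze loop with `max` (shapes chosen arbitrarily for the sketch):

```python
import numpy as np

# max satisfies fn([x1, x2, x3]) == fn([fn([x1, x2]), x3]), so folding the
# running result into the container sample-by-sample matches one-shot
# aggregation over all samples.
samples = [np.array([1.0, 5.0]), np.array([4.0, 2.0]), np.array([3.0, 6.0])]

container = []
for x in samples:
    stacked = np.stack([x, *container])                  # shape (len+1, 2)
    aggregated = np.max(stacked, axis=0, keepdims=True)  # shape (1, 2)
    container = [np.squeeze(aggregated, 0)]              # back to shape (2,)

one_shot = np.max(np.stack(samples), axis=0)
print(container[0])                            # [4. 6.]
print(np.array_equal(container[0], one_shot))  # True
```

Mean, by contrast, does not satisfy this property, which is why `MeanAggregator` descends from the offline base class below.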

@abstractmethod
def _aggregation_fn(self, stacked_value: NNCFTensor, axis: AggregationAxes, keepdims: bool) -> NNCFTensor:
@@ -652,7 +624,7 @@ def _aggregation_fn(self, stacked_value: NNCFTensor, axis: AggregationAxes, keepdims: bool) -> NNCFTensor:
return self._tensor_processor.reduce_max(stacked_value, axis=axis, keepdims=keepdims)


class OfflineAggregatorBase(TensorAggregatorBase, ABC):
class OfflineAggregatorBase(AggregatorBase, ABC):
"""
Base class for aggregators which are using aggregation function fn which
does not fulfill property fn([x1, x2, x3]) == fn([fn([x1, x2]), x3])
@@ -665,7 +637,8 @@ def _register_reduced_input_impl(self, x: TensorType) -> None:

def _aggregate_impl(self) -> NNCFTensor:
stacked_val = self._tensor_processor.stack(self._container)
return self._aggregation_fn(stacked_val, axis=self._aggregation_axes, keepdims=self._keepdims).tensor
aggregated = self._aggregation_fn(stacked_val, axis=self._aggregation_axes, keepdims=self._keepdims)
return self._tensor_processor.squeeze(aggregated, 0).tensor
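Offline aggregators must keep every registered sample and aggregate once at the end; with `keepdims=True` the stacked sample axis survives as a singleton dimension, hence the new final `squeeze(aggregated, 0)`. A NumPy sketch of that path with `mean` (values are illustrative):

```python
import numpy as np

# Offline aggregation (e.g. mean) stacks every registered sample first;
# keepdims=True keeps the stacked sample axis as a singleton, so the
# result is squeezed back to the per-sample shape at the end.
container = [np.array([1.0, 3.0]), np.array([3.0, 5.0])]

stacked = np.stack(container)                         # shape (2, 2)
aggregated = np.mean(stacked, axis=0, keepdims=True)  # shape (1, 2)
result = np.squeeze(aggregated, 0)                    # shape (2,)
print(result)  # [2. 4.]
```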

@abstractmethod
def _aggregation_fn(self, stacked_value: NNCFTensor, axis: AggregationAxes, keepdims: bool) -> NNCFTensor:
@@ -688,12 +661,9 @@ def __init__(
tensor_processor: NNCFCollectorTensorProcessor,
aggregation_axes: Optional[AggregationAxes] = None,
num_samples: Optional[int] = None,
window_size=None,
quantile: float = 0.01,
):
super().__init__(tensor_processor, aggregation_axes=aggregation_axes, num_samples=num_samples)
self._window_size = window_size
self._container = deque(maxlen=window_size)
self._quantile = quantile

def _aggregate_impl(self) -> NNCFTensor:
@@ -734,7 +704,7 @@ def _aggregation_fn(
return self._tensor_processor.masked_median(stacked_samples, axis=axis, mask=mask, keepdims=keepdims)


class MedianAbsoluteDeviationAggregator(TensorAggregatorBase):
class MedianAbsoluteDeviationAggregator(AggregatorBase):
def _register_reduced_input_impl(self, x: TensorType) -> None:
return self._container.append(x)

@@ -759,19 +729,16 @@ def _aggregate_impl(self) -> Dict[str, NNCFTensor]:
}


class PercentileAggregator(TensorAggregatorBase):
class PercentileAggregator(AggregatorBase):
def __init__(
self,
tensor_processor: NNCFCollectorTensorProcessor,
percentiles_to_collect: List[float],
aggregation_axes: Optional[AggregationAxes] = None,
num_samples: Optional[int] = None,
window_size=None,
):
super().__init__(tensor_processor, aggregation_axes=aggregation_axes, num_samples=num_samples)
self._percentiles_to_collect = percentiles_to_collect
self._window_size = window_size
self._container = deque(maxlen=window_size)

def _register_reduced_input_impl(self, x: TensorType) -> None:
return self._container.append(x)
4 changes: 4 additions & 0 deletions nncf/onnx/statistics/aggregator.py
@@ -80,3 +80,7 @@ def _get_merged_statistic_points(
@staticmethod
def _process_outputs(outputs: Dict[str, np.ndarray]) -> Dict[str, ONNXNNCFTensor]:
return {n: ONNXNNCFTensor(v) for n, v in outputs.items()}

@staticmethod
def _get_sliced_data(inputs: Dict[str, np.ndarray], end: int) -> Dict[str, ONNXNNCFTensor]:
return inputs
4 changes: 4 additions & 0 deletions nncf/openvino/statistics/aggregator.py
@@ -111,3 +111,7 @@ def _get_merged_statistic_points(
@staticmethod
def _process_outputs(outputs: Dict[str, np.ndarray]) -> Dict[str, OVNNCFTensor]:
return {n: OVNNCFTensor(v) for n, v in outputs.items()}

@staticmethod
def _get_sliced_data(inputs: Dict[str, np.ndarray], end: int) -> Dict[str, OVNNCFTensor]:
return inputs
7 changes: 1 addition & 6 deletions nncf/openvino/statistics/collectors.py
@@ -271,16 +271,12 @@ def get_output_names(self, target_node_name: str, port_id: int) -> List[str]:
return get_reducer_output_node_names(self.name, target_node_name, port_id, self.output_port_id, self.inplace)


def get_mean_statistic_collector(
num_samples: int, channel_axis: int, window_size: Optional[int] = None, inplace: bool = True
) -> TensorCollector:
def get_mean_statistic_collector(num_samples: int, channel_axis: int, inplace: bool = True) -> TensorCollector:
"""
Mean statistic collector builder.

:param num_samples: Maximum number of samples to collect.
:param channel_axis: Channel axis to use during reduction phase.
:param window_size: Number of samples from the end of the list of collected samples to aggregate.
Aggregates all available collected statistics in case parameter is None.
:param inplace: Whether the mean reducer should be calculated inplace or out of place.
:return: Mean statistic collector.
"""
@@ -296,7 +292,6 @@ def get_mean_statistic_collector(
kwargs = {
"tensor_processor": OVNNCFCollectorTensorProcessor,
"num_samples": num_samples,
"window_size": window_size,
}
aggregate_mean = MeanAggregator(**kwargs)
aggregate_shape = ShapeAggregator()
@@ -67,9 +67,8 @@ def mean_statistic_collector(
channel_axis: int,
inplace: bool,
num_samples: Optional[int] = None,
window_size: Optional[int] = None,
) -> TensorCollector:
return get_mean_statistic_collector(num_samples, channel_axis, window_size, inplace)
return get_mean_statistic_collector(num_samples, channel_axis, inplace)

@staticmethod
def raw_statistic_collector(inplace: bool, num_samples: int = None) -> TensorCollector:
@@ -53,9 +53,8 @@ def mean_statistic_collector(
channel_axis: int,
inplace: bool,
num_samples: Optional[int] = None,
window_size: Optional[int] = None,
) -> TensorCollector:
return get_mean_statistic_collector(num_samples, channel_axis, window_size, inplace)
return get_mean_statistic_collector(num_samples, channel_axis, inplace)

@staticmethod
def get_sub_input_output_names(subgraph: ov.Model) -> Tuple[str, str]:
@@ -65,9 +65,8 @@ def mean_statistic_collector(
channel_axis: int,
inplace: bool,
num_samples: Optional[int] = None,
window_size: Optional[int] = None,
) -> TensorCollector:
return get_mean_statistic_collector(num_samples, channel_axis, window_size)
return get_mean_statistic_collector(num_samples, channel_axis)

@staticmethod
def get_sub_input_output_names(subgraph: NNCFNetwork) -> Tuple[str, str]: