Source code for aimet_onnx.cross_layer_equalization

# /usr/bin/env python3.5
# -*- mode: python -*-
# =============================================================================
#  @@-COPYRIGHT-START-@@
#
#  Copyright (c) 2022-2023, Qualcomm Innovation Center, Inc. All rights reserved.
#
#  Redistribution and use in source and binary forms, with or without
#  modification, are permitted provided that the following conditions are met:
#
#  1. Redistributions of source code must retain the above copyright notice,
#     this list of conditions and the following disclaimer.
#
#  2. Redistributions in binary form must reproduce the above copyright notice,
#     this list of conditions and the following disclaimer in the documentation
#     and/or other materials provided with the distribution.
#
#  3. Neither the name of the copyright holder nor the names of its contributors
#     may be used to endorse or promote products derived from this software
#     without specific prior written permission.
#
#  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
#  AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
#  IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
#  ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
#  LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
#  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
#  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
#  INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
#  CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
#  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
#  POSSIBILITY OF SUCH DAMAGE.
#
#  SPDX-License-Identifier: BSD-3-Clause
#
#  @@-COPYRIGHT-END-@@
# =============================================================================

""" Cross Layer Equalization

Some terminology for this code.
CLS set: Set of layers (2 or 3) that can be used for cross-layer scaling
Layer groups: Groups of layers that are immediately connected and can be decomposed further into CLS sets
"""

from typing import Tuple, List, Union
import numpy as np
from onnx import onnx_pb, numpy_helper
from onnxruntime.quantization.onnx_quantizer import ONNXModel

from aimet_common.utils import AimetLogger
from aimet_common.connected_graph.connectedgraph import get_ordered_ops
from aimet_common.cross_layer_equalization import GraphSearchUtils, CrossLayerScaling as CLS, ClsSetInfo, \
    HighBiasFold as HBF
import aimet_common.libpymo as libpymo      # pylint: disable=import-error

from aimet_onnx.meta.connectedgraph import ConnectedGraph, WEIGHT_INDEX, BIAS_INDEX
from aimet_onnx.meta.operations import Op
from aimet_onnx.utils import transpose_tensor, ParamUtils, get_node_attribute, replace_relu6_with_relu
from aimet_onnx.batch_norm_fold import BNLayer, fold_all_batch_norms_to_weight

logger = AimetLogger.get_area_logger(AimetLogger.LogAreas.Quant)

ClsSet = Union[Tuple['Conv', 'Conv'],
               Tuple['Conv', 'Conv', 'Conv']]
ScaleFactor = Union[np.ndarray, Tuple[np.ndarray]]
cls_supported_layer_types = ['Conv', 'ConvTranspose']
cls_supported_activation_types = ['Relu', 'PRelu']


def get_ordered_list_of_conv_modules(list_of_starting_ops: List) -> List:
    """
    Finds order of nodes in graph
    :param list_of_starting_ops: list of starting ops for the model
    :return: List of names in graph in order
    """
    module_list = get_ordered_ops(list_of_starting_ops)
    module_list = [[module.dotted_name, module] for module in module_list if module.type in cls_supported_layer_types]
    return module_list


class CrossLayerScaling(CLS):
    """
    Scales a model's layers to equalize the weights between consecutive layers
    """
    def __init__(self, model: onnx_pb.ModelProto):
        """
        :param model: ONNX model
        """
        super().__init__()
        self._model = model

    def scale_model(self) -> List[ClsSetInfo]:
        """
        Uses cross-layer scaling to scale all applicable layers in the given model

        :param model: Model to scale
        :return: CLS information for each CLS set
        """
        # Find layer groups
        connected_graph = ConnectedGraph(self._model)
        ordered_module_list = get_ordered_list_of_conv_modules(connected_graph.starting_ops)
        graph_search = GraphSearchUtils(connected_graph, ordered_module_list, cls_supported_layer_types,
                                        cls_supported_activation_types)
        layer_groups = graph_search.find_layer_groups_to_scale()

        # Find cls sets from the layer groups
        cls_sets = []
        for layer_group in layer_groups:
            cls_set = GraphSearchUtils.convert_layer_group_to_cls_sets(layer_group)
            cls_sets += cls_set

        # Scale the CLS sets
        scale_factors = self.scale_cls_sets(cls_sets)

        # Find if there were relu activations between layers of each cls set
        is_relu_activation_in_cls_sets = graph_search.is_relu_activation_present_in_cls_sets(cls_sets)

        # Convert to a list of cls-set-info elements
        cls_set_info_list = CrossLayerScaling.create_cls_set_info_list(cls_sets, scale_factors,
                                                                       is_relu_activation_in_cls_sets)

        return cls_set_info_list

    def _populate_libpymo_params(self, module: onnx_pb.NodeProto,
                                 layer_param: libpymo.EqualizationParams):
        """
        Populates libpymo weight parameter
        """
        weight = ParamUtils.get_param(self._model.model, module, WEIGHT_INDEX)
        groups = get_node_attribute(module, "group")

        # Transpose weights to C, N, H, W from N, C, H, W since axis are flipped for transposed conv
        if module.op_type == "ConvTranspose" and groups == 1:
            weight = transpose_tensor(weight, (1, 0, 2, 3))

        layer_param.weight = numpy_helper.to_array(weight).reshape(-1)
        weight_shape = get_weight_dimensions(np.array(weight.dims))
        layer_param.weightShape = weight_shape

    def _pack_params_for_conv(self,
                              cls_set,
                              prev_layer_params: libpymo.EqualizationParams,
                              curr_layer_params: libpymo.EqualizationParams):
        """
        Prepare and pack data structure for previous and current layer in given cls set.

        :param cls_set: Consecutive Conv layers Tuple whose weights and biases need to be equalized.
        :param prev_layer_params: Data structure holding weight and bias for previous layer in cls set.
        :param curr_layer_params: Data structure holding weight and bias for current layer in cls set.
        """
        self._populate_libpymo_params(cls_set[0].get_module(), prev_layer_params)
        self._populate_libpymo_params(cls_set[1].get_module(), curr_layer_params)

        cls_set_0_bias = ParamUtils.get_param(self._model.model, cls_set[0].get_module(), BIAS_INDEX)
        if cls_set_0_bias is not None:
            prev_layer_params.bias = numpy_helper.to_array(cls_set_0_bias).reshape(-1)
        else:
            prev_layer_params.isBiasNone = True

    def _update_weight_for_layer_from_libpymo_obj(self, layer_param: libpymo.EqualizationParams,
                                                  module: onnx_pb.NodeProto):
        """
        Update weight parameter from libpymo object
        """
        weight = ParamUtils.get_param(self._model.model, module, WEIGHT_INDEX)
        weight.raw_data = np.asarray(layer_param.weight, dtype=np.float32).tobytes()
        groups = get_node_attribute(module, "group")
        # Transpose weight back to original configuration
        if module.op_type == "ConvTranspose" and groups == 1:
            weight = transpose_tensor(weight, (1, 0, 2, 3))

        weight_param = ParamUtils.get_param(self._model.model, module, WEIGHT_INDEX)
        weight_param.raw_data = weight.raw_data

    def _update_params_for_conv(self,
                                cls_set,
                                prev_layer_params: libpymo.EqualizationParams,
                                curr_layer_params: libpymo.EqualizationParams):
        """
        Update weight and biases for cls set using updated data structures.

        :param cls_set: Consecutive Conv layers Tuple whose weights and biases need to be equalized.
        :param prev_layer_params: Data structure holding weight and bias for previous layer in cls set.
        :param curr_layer_params: Data structure holding weight and bias for current layer in cls set.
        """
        self._update_weight_for_layer_from_libpymo_obj(prev_layer_params, cls_set[0].get_module())
        self._update_weight_for_layer_from_libpymo_obj(curr_layer_params, cls_set[1].get_module())

        if not prev_layer_params.isBiasNone:
            bias_param = ParamUtils.get_param(self._model.model, cls_set[0].get_module(),
                                              BIAS_INDEX)
            bias_param.raw_data = np.asarray(prev_layer_params.bias, dtype=np.float32).tobytes()

    def _pack_params_for_depthwise_conv(self, cls_set,
                                        prev_layer_params: libpymo.EqualizationParams,
                                        curr_layer_params: libpymo.EqualizationParams,
                                        next_layer_params: libpymo.EqualizationParams):
        """
        Prepare and pack data structure for previous, current and next layer in given cls set.

        :param cls_set: Consecutive Conv layers Tuple whose weights and biases need to be equalized.
        :param prev_layer_params: Data structure holding weight and bias for previous layer in cls set.
        :param curr_layer_params: Data structure holding weight and bias for current layer in cls set.
        :param next_layer_params: Data structure holding weight and bias for next layer in cls set.
        """

        self._populate_libpymo_params(cls_set[0].get_module(), prev_layer_params)

        assert cls_set[1].groups > 1

        weight = ParamUtils.get_param(self._model.model, cls_set[1].get_module(), WEIGHT_INDEX)
        curr_layer_params.weight = numpy_helper.to_array(weight).reshape(-1)
        curr_layer_params.weightShape = np.array(weight.dims)

        self._populate_libpymo_params(cls_set[2].get_module(), next_layer_params)

        cls_set_0_bias = ParamUtils.get_param(self._model.model, cls_set[0].get_module(), BIAS_INDEX)
        if cls_set_0_bias is not None:
            prev_layer_params.bias = numpy_helper.to_array(cls_set_0_bias).reshape(-1)
        else:
            prev_layer_params.isBiasNone = True

        cls_set_1_bias = ParamUtils.get_param(self._model.model, cls_set[1].get_module(), BIAS_INDEX)
        if cls_set_1_bias is not None:
            curr_layer_params.bias = numpy_helper.to_array(cls_set_1_bias).reshape(-1)
        else:
            curr_layer_params.isBiasNone = True

    def _update_params_for_depthwise_conv(self, cls_set,
                                          prev_layer_params: libpymo.EqualizationParams,
                                          curr_layer_params: libpymo.EqualizationParams,
                                          next_layer_params: libpymo.EqualizationParams):
        """
        Update weight and biases for cls set using updated data structures.

        :param cls_set: Consecutive Conv layers Tuple whose weights and biases need to be equalized.
        :param prev_layer_params: Data structure holding weight and bias for previous layer in cls set.
        :param curr_layer_params: Data structure holding weight and bias for current layer in cls set.
        :param next_layer_params: Data structure holding weight and bias for next layer in cls set.
        """
        self._update_weight_for_layer_from_libpymo_obj(prev_layer_params, cls_set[0].get_module())
        self._update_weight_for_layer_from_libpymo_obj(curr_layer_params, cls_set[1].get_module())
        self._update_weight_for_layer_from_libpymo_obj(next_layer_params, cls_set[2].get_module())

        if not prev_layer_params.isBiasNone:
            bias_param = ParamUtils.get_param(self._model.model, cls_set[0].get_module(),
                                              BIAS_INDEX)
            bias_param.raw_data = np.asarray(prev_layer_params.bias, dtype=np.float32).tobytes()

        if not curr_layer_params.isBiasNone:
            bias_param = ParamUtils.get_param(self._model.model, cls_set[1].get_module(),
                                              BIAS_INDEX)
            bias_param.raw_data = np.asarray(curr_layer_params.bias, dtype=np.float32).tobytes()


class HighBiasFold(HBF):
    """
    Code to apply the high-bias-fold technique to a model
    """
    def __init__(self, model: onnx_pb.ModelProto):
        self._model = model

    def _check_if_bias_is_none(self, layer: Op) -> bool:
        """ Returns if bias is a None for a layer. True if bias is None"""
        bias = ParamUtils.get_param(self._model.model, layer.get_module(), BIAS_INDEX)
        return not bias

    def _populate_bn_params_in_libpymo_obj(self, prev_layer_bn_params: libpymo.BNParamsHighBiasFold,
                                           bn_layer: BNLayer):
        """
        Populates BatchNorm params in the libpymo object
        :param prev_layer_bn_params: Data structure to pack batch norm parameter
        :param bn_layer: BatchNorm layer
        """
        prev_layer_bn_params.gamma = bn_layer.gamma
        prev_layer_bn_params.beta = bn_layer.beta

    def _pack_previous_and_current_layer_params(self, cls_pair_info: ClsSetInfo.ClsSetLayerPairInfo,
                                                prev_layer_params: libpymo.LayerParams,
                                                curr_layer_params: libpymo.LayerParams):
        """
        Helper method to pack information of previous and current layer.

        :param cls_pair_info: Layer pairs that were scaled using CLS and related information.
        :param prev_layer_params: Data structure to pack previous layer parameters.
        :param curr_layer_params: Data structure to pack current layer parameters.
        """
        prev_layer_params.activationIsRelu = cls_pair_info.relu_activation_between_layers

        bias = ParamUtils.get_param(self._model.model, cls_pair_info.layer1.get_module(),
                                    BIAS_INDEX)

        prev_layer_params.bias = numpy_helper.to_array(bias).reshape(-1)

        module = cls_pair_info.layer2.get_module()
        weight = ParamUtils.get_param(self._model.model, module, WEIGHT_INDEX)
        bias = ParamUtils.get_param(self._model.model, module, BIAS_INDEX)

        groups = get_node_attribute(module, "group")

        # Transpose weights to C, N, H, W from N, C, H, W since axis are flipped for transposed conv
        if module.op_type == "ConvTranspose" and groups == 1:
            weight = transpose_tensor(weight, (1, 0, 2, 3))

        curr_layer_params.bias = numpy_helper.to_array(bias).reshape(-1)
        curr_layer_params.weight = numpy_helper.to_array(weight).reshape(-1)
        curr_layer_params.weightShape = get_weight_dimensions(np.array(weight.dims))

    def _update_bias_for_layer_from_libpymo_obj(self, layer_param: libpymo.LayerParams,
                                                module: onnx_pb.NodeProto):
        """
        Update bias parameter from libpymo object
        """
        bias = ParamUtils.get_param(self._model.model, module, BIAS_INDEX)

        bias.raw_data = np.asarray(layer_param.bias, dtype=np.float32).tobytes()

    def _update_previous_and_current_layer_bias(self, cls_pair_info: ClsSetInfo.ClsSetLayerPairInfo,
                                                prev_layer_params: libpymo.LayerParams,
                                                curr_layer_params: libpymo.LayerParams):
        """
        Update biases for previous and current layer.

        :param cls_pair_info: Layer pairs that were scaled using CLS and related information.
        :param prev_layer_params: Data structure holding weight and bias for previous layer in cls set.
        :param curr_layer_params: Data structure holding weight and bias for current layer in cls set.
        """
        self._update_bias_for_layer_from_libpymo_obj(prev_layer_params, cls_pair_info.layer1.get_module())
        self._update_bias_for_layer_from_libpymo_obj(curr_layer_params, cls_pair_info.layer2.get_module())


def get_weight_dimensions(weight_shape: np.array) -> np.array:
    """
    Returns a length 4 weight shape
    :param weight_shape: shape of the weight tensor
    """
    dims = len(weight_shape)
    if dims == 4:
        return weight_shape
    return np.append(weight_shape, [1 for _ in range(4 - dims)]).astype(int)


[docs]def equalize_model(model: onnx_pb.ModelProto): """ High-level API to perform Cross-Layer Equalization (CLE) on the given model. The model is equalized in place. :param model: Model to equalize """ if not isinstance(model, ONNXModel): model = ONNXModel(model) conv_bn_pairs, bn_conv_pairs = fold_all_batch_norms_to_weight(model) replace_relu6_with_relu(model) bn_dict = {} for conv_bn in conv_bn_pairs: bn_dict[conv_bn[0].name] = conv_bn[1] for bn_conv in bn_conv_pairs: bn_dict[bn_conv[1].name] = bn_conv[0] # perform cross-layer scaling on applicable layer sets cls = CrossLayerScaling(model) cls_set_info = cls.scale_model() # high-bias fold hbf = HighBiasFold(model) hbf.bias_fold(cls_set_info, bn_dict)