# Copyright 2022 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""SlbQuantAwareTraining."""
import os
from mindspore.dataset import Dataset
from mindspore import Model
from mindspore.nn import Cell
from mindspore.train.callback import Callback
from mindspore.train.serialization import load_checkpoint, load_param_into_net
from mindspore.common.dtype import QuantDtype
from mindspore_gs.quantization.quant_utils import get_quant_dtype_num_bits
from mindspore_gs.common.validator import Validator, Rel
from mindspore_gs.quantization.quantization_aware_training import QuantizationAwareTraining
from .slb_net_policy import SlbNetPolicy
from .slb_quant_config import SlbQuantConfig
from .slb_quant_convert import ConvertToQuantInferNetwork
class SlbQuantAwareTraining(QuantizationAwareTraining):
"""
    Implementation of the SLB quantization algorithm. This algorithm regards the discrete weights
    in an arbitrary quantized neural network as searchable variables, and utilizes a differentiable method
    to search them accurately. In particular, each weight is represented as a probability distribution
    over the discrete value set. The probabilities are optimized during training and the values
    with the highest probability are selected to establish the desired quantized network.
    See more details in `Searching for Low-Bit Weights in Quantized Neural
    Networks <https://arxiv.org/pdf/2009.08695.pdf>`_.
    Note:
        This method will call other set functions to set special values; for the possible errors,
        please refer to those set functions. For example, `quant_dtype` refers to
        `set_weight_quant_dtype` and `set_act_quant_dtype`.
Args:
        config (dict): store attributes for quantization aware training, keys are attribute names,
            values are attribute values. Default: ``None``. Supported attributes are listed below:
            - quant_dtype (Union[QuantDtype, list(QuantDtype), tuple(QuantDtype)]): Datatype used to
              quantize weights and activations. The type is a QuantDtype, a list of two QuantDtype or
              a tuple of two QuantDtype. If quant_dtype is a QuantDtype, it will be duplicated to a list
              of two QuantDtype. The first element represents the type of activations and the second
              element represents the type of weights. It is necessary to consider the precision support of
              hardware devices in practical quantization inference scenarios. Weight quantization supports
              int4|int2|int1, and activation quantization supports int8 now.
              Default: ``(QuantDtype.INT8, QuantDtype.INT1)``.
            - enable_act_quant (bool): Whether to apply activation quantization while training.
              Default: ``False``.
            - enable_bn_calibration (bool): Whether to apply batchnorm calibration while training.
              Default: ``False``.
- epoch_size (int): Total training epochs.
- has_trained_epoch (int): The trained epochs.
- t_start_val (float): Initial value of temperature hyperparameters. Default: ``1``.
            - t_start_time (float): Fraction of epochs after which temperature hyperparameters start changing.
              Default: ``0.2``.
            - t_end_time (float): Fraction of epochs after which temperature hyperparameters stop changing.
              Default: ``0.6``.
            - t_factor (float): Multiplicative factor by which temperature hyperparameters change.
              Default: ``1.2``.
Raises:
TypeError: If `quant_dtype` is not `QuantDtype`, or every element of `quant_dtype` is not `QuantDtype`.
TypeError: If `enable_act_quant` or `enable_bn_calibration` is not bool.
ValueError: If the length of `quant_dtype` is greater than 2.
TypeError: If `epoch_size` or `has_trained_epoch` is not an int.
TypeError: If `t_start_val`, `t_start_time`, `t_end_time` or `t_factor` is not float.
ValueError: If `epoch_size` is not greater than 0.
ValueError: If `has_trained_epoch` is less than 0.
ValueError: If `t_start_val` or `t_factor` is not greater than 0.
ValueError: If `t_start_time` or `t_end_time` is less than 0.
ValueError: If `t_start_time` or `t_end_time` is greater than 1.
Supported Platforms:
``GPU``
Examples:
>>> import mindspore
>>> import numpy as np
>>> from mindspore import nn
>>> from mindspore_gs.quantization import SlbQuantAwareTraining
>>> from mindspore.common.dtype import QuantDtype
>>> class NetToQuant(nn.Cell):
... def __init__(self, num_channel=1):
... super(NetToQuant, self).__init__()
... self.conv = nn.Conv2d(num_channel, 6, 5, pad_mode='valid')
... self.bn = nn.BatchNorm2d(6)
...
... def construct(self, x):
... x = self.conv(x)
... x = self.bn(x)
... return x
...
>>> ## 1) Define network to be quantized
>>> net = NetToQuant()
>>> ## 2) Define SLB QAT-Algorithm
>>> slb_quantization = SlbQuantAwareTraining()
>>> ## 3) Use set functions to change config
        >>> ## 3.1) set_weight_quant_dtype is used to set the weight quantization bit,
        >>> ## and supports QuantDtype.INT4, QuantDtype.INT2, QuantDtype.INT1 now.
>>> slb_quantization.set_weight_quant_dtype(QuantDtype.INT1)
>>> ## 3.2) set_act_quant_dtype is used to set the activation quantization bit,
>>> ## and support QuantDtype.INT8 now.
>>> slb_quantization.set_act_quant_dtype(QuantDtype.INT8)
>>> ## 3.3) set_enable_act_quant is used to set whether apply activation quantization.
>>> slb_quantization.set_enable_act_quant(True)
>>> ## 3.4) set_enable_bn_calibration is used to set whether apply batchnorm calibration.
>>> slb_quantization.set_enable_bn_calibration(True)
>>> ## 3.5) set_epoch_size is used to set the epoch size of training.
>>> slb_quantization.set_epoch_size(100)
>>> ## 3.6) set_has_trained_epoch is used to set the trained epoch size of training.
>>> slb_quantization.set_has_trained_epoch(0)
>>> ## 3.7) set_t_start_val is used to set the initial value of temperature hyperparameters.
>>> slb_quantization.set_t_start_val(1.0)
        >>> ## 3.8) set_t_start_time is used to set the fraction of epochs after which temperature
        >>> ## hyperparameters start changing.
>>> slb_quantization.set_t_start_time(0.2)
        >>> ## 3.9) set_t_end_time is used to set the fraction of epochs after which temperature
        >>> ## hyperparameters stop changing.
>>> slb_quantization.set_t_end_time(0.6)
>>> ## 3.10) set_t_factor is used to set the multiplicative factor of temperature hyperparameters changing.
>>> slb_quantization.set_t_factor(1.2)
>>> ## 4) Print SLB QAT-Algorithm object and check the config setting result
        >>> ## Since we set weight_quant_dtype to be QuantDtype.INT1, the value of the attribute
        >>> ## weight_quant_dtype is INT1
        >>> ## Since we set act_quant_dtype to be QuantDtype.INT8, the value of the attribute
        >>> ## act_quant_dtype is INT8
>>> ## Since we set enable_act_quant to be True, the value of the attribute enable_act_quant is True
>>> ## Since we set enable_bn_calibration to be True, the value of the attribute enable_bn_calibration is True
>>> ## Since we set epoch_size to be 100, the value of the attribute epoch_size is 100
>>> ## Since we set has_trained_epoch to be 0, the value of the attribute has_trained_epoch is 0
>>> ## Since we set t_start_val to be 1.0, the value of the attribute t_start_val is 1.0
>>> ## Since we set t_start_time to be 0.2, the value of the attribute t_start_time is 0.2
>>> ## Since we set t_end_time to be 0.6, the value of the attribute t_end_time is 0.6
>>> ## Since we set t_factor to be 1.2, the value of the attribute t_factor is 1.2
>>> print(slb_quantization)
        SlbQuantAwareTraining<weight_quant_dtype=INT1, act_quant_dtype=INT8, enable_act_quant=True,
        enable_bn_calibration=True, epoch_size=100, has_trained_epoch=0, t_start_val=1.0,
        t_start_time=0.2, t_end_time=0.6, t_factor=1.2>
>>> ## 5) Apply SLB QAT-algorithm to origin network
>>> net_qat = slb_quantization.apply(net)
>>> ## 6) Print network and check the result. Conv2d should be transformed to QuantizeWrapperCells.
>>> ## Since we set weight_quant_dtype to be QuantDtype.INT1, the bit_num value of fake_quant_weight
>>> ## should be 1, and the weight_bit_num value of Conv2dSlbQuant should be 1.
>>> print(net_qat)
NetToQuantOpt<
(_handler): NetToQuant<
(conv): Conv2d<input_channels=1, output_channels=6, kernel_size=(5, 5), stride=(1, 1), pad_mode=valid,
padding=0, dilation=(1, 1), group=1, has_bias=False, weight_init=normal, bias_init=zeros, format=NCHW>
(bn): BatchNorm2d<num_features=6, eps=1e-05, momentum=0.9,
gamma=Parameter(name=bn.gamma, requires_grad=True, shape=[6], dtype=Float32,
value= [1., 1., 1., 1., 1., 1.]),
beta=Parameter(name=bn.beta, requires_grad=True, shape=[6], dtype=Float32,
value= [0., 0., 0., 0., 0., 0.]),
moving_mean=Parameter(name=bn.moving_mean, requires_grad=False, shape=[6], dtype=Float32,
value= [0., 0., 0., 0., 0., 0.]),
moving_variance=Parameter(name=bn.moving_variance, requires_grad=False, shape=[6], dtype=Float32,
value= [1., 1., 1., 1., 1., 1.])>
>
(bn): BatchNorm2d<num_features=6, eps=1e-05, momentum=0.9,
gamma=Parameter(name=bn.gamma, requires_grad=True, shape=[6], dtype=Float32,
value= [1., 1., 1., 1., 1., 1.]),
beta=Parameter(name=bn.beta, requires_grad=True, shape=[6], dtype=Float32, value= [0., 0., 0., 0., 0., 0.]),
moving_mean=Parameter(name=bn.moving_mean, requires_grad=False, shape=[6], dtype=Float32,
value= [0., 0., 0., 0., 0., 0.]),
moving_variance=Parameter(name=bn.moving_variance, requires_grad=False, shape=[6], dtype=Float32,
value= [1., 1., 1., 1., 1., 1.])>
(Conv2dSlbQuant): QuantCell<
(_handler): Conv2dSlbQuant<
in_channels=1, out_channels=6, kernel_size=(5, 5), weight_bit_num=1, stride=(1, 1), pad_mode=valid,
padding=0, dilation=(1, 1), group=1, has_bias=False
(fake_quant_weight): SlbFakeQuantizerPerLayer<bit_num=1>
>
(_input_quantizer): SlbActQuantizer<bit_num=8, symmetric=False, narrow_range=False,
ema=False(0.999), per_channel=False, quant_delay=900>
(_output_quantizer): SlbActQuantizer<bit_num=8, symmetric=False, narrow_range=False,
ema=False(0.999), per_channel=False, quant_delay=900>
>
>
        >>> ## 7) Convert a compressed network to a standard network before exporting to MindIR.
>>> net_qat = slb_quantization.convert(net_qat)
>>> data_in = mindspore.Tensor(np.ones([1, 1, 32, 32]), mindspore.float32)
>>> file_name = "./conv.mindir"
>>> mindspore.export(net_qat, data_in, file_name=file_name, file_format="MINDIR")
>>> graph = mindspore.load(file_name)
>>> mindspore.nn.GraphCell(graph)
"""
def __init__(self, config=None):
super(SlbQuantAwareTraining, self).__init__(config)
if config is None:
config = {}
self._qat_policy = self._init_net_policy(self._config)
self._custom_transforms = {}
self._custom_layer_policy_map = {}
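        # Optional user extensions: the config dict may carry user-defined node transforms and
        # layer policies under the "custom_transforms" and "custom_policies" keys.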
if "custom_transforms" in config.keys():
self._custom_transforms = config["custom_transforms"]
if "custom_policies" in config.keys():
self._custom_layer_policy_map = config["custom_policies"]
def set_weight_quant_dtype(self, weight_quant_dtype=QuantDtype.INT1):
"""
Set value of weight_quant_dtype of quantization aware training `config`
Args:
weight_quant_dtype (QuantDtype): Datatype used to quantize weights. Default: ``QuantDtype.INT1``.
Raises:
TypeError: If `weight_quant_dtype` is not QuantDtype.
ValueError: Only supported if `weight_quant_dtype` is ``QuantDtype.INT1``, ``QuantDtype.INT2``
or ``QuantDtype.INT4`` yet.
"""
if not isinstance(weight_quant_dtype, QuantDtype):
raise TypeError("The parameter `weight quant dtype` must be isinstance of QuantDtype, "
"but got {}.".format(weight_quant_dtype))
if weight_quant_dtype not in [QuantDtype.INT1, QuantDtype.INT2, QuantDtype.INT4]:
raise ValueError("Only supported if `weight_quant_dtype` is `QuantDtype.INT1`, " \
"`QuantDtype.INT2` or `QuantDtype.INT4` yet.")
self._config.weight_quant_dtype = weight_quant_dtype
def set_act_quant_dtype(self, act_quant_dtype=QuantDtype.INT8):
"""
Set value of act_quant_dtype of quantization aware training `config`
Args:
act_quant_dtype (QuantDtype): Datatype used to quantize activations. Default: ``QuantDtype.INT8``.
Raises:
TypeError: If `act_quant_dtype` is not QuantDtype.
ValueError: Only supported if `act_quant_dtype` is ``QuantDtype.INT8`` yet.
"""
if not isinstance(act_quant_dtype, QuantDtype):
raise TypeError("The parameter `act quant dtype` must be isinstance of QuantDtype, "
"but got {}.".format(act_quant_dtype))
if act_quant_dtype not in [QuantDtype.INT8]:
raise ValueError("Only supported if `act_quant_dtype` is `QuantDtype.INT8` yet.")
self._config.act_quant_dtype = act_quant_dtype
def set_enable_act_quant(self, enable_act_quant=False):
"""
Set value of enable_act_quant of quantization aware training `config`
Args:
            enable_act_quant (bool): Whether to apply activation quantization while training. Default: ``False``.
Raises:
TypeError: If `enable_act_quant` is not bool.
"""
enable_act_quant = Validator.check_bool(enable_act_quant, "enable_act_quant", self.__class__.__name__)
self._config.enable_act_quant = enable_act_quant
def set_enable_bn_calibration(self, enable_bn_calibration=False):
"""
Set value of enable_bn_calibration of quantization aware training `config`
Args:
            enable_bn_calibration (bool): Whether to apply batchnorm calibration while training. Default: ``False``.
Raises:
TypeError: If `enable_bn_calibration` is not bool.
"""
enable_bn_calibration = Validator.check_bool(enable_bn_calibration, "enable_bn_calibration",
self.__class__.__name__)
self._config.enable_bn_calibration = enable_bn_calibration
def set_epoch_size(self, epoch_size):
"""
Set value of epoch_size of quantization aware training `config`
Args:
            epoch_size (int): Total training epochs.
Raises:
TypeError: If `epoch_size` is not int.
ValueError: If `epoch_size` is not greater than 0.
"""
epoch_size = Validator.check_int(epoch_size, 0, Rel.GT, "epoch_size", self.__class__.__name__)
self._config.epoch_size = epoch_size
def set_has_trained_epoch(self, has_trained_epoch):
"""
Set value of has_trained_epoch of quantization aware training `config`
Args:
            has_trained_epoch (int): The number of epochs already trained.
Raises:
TypeError: If `has_trained_epoch` is not int.
ValueError: If `has_trained_epoch` is less than 0.
"""
has_trained_epoch = Validator.check_int(has_trained_epoch, 0, Rel.GE, "has_trained_epoch",
self.__class__.__name__)
self._config.has_trained_epoch = has_trained_epoch
def set_t_start_val(self, t_start_val=1.0):
"""
Set value of t_start_val of quantization aware training `config`.
Args:
t_start_val (float): Initial value of temperature hyperparameters, default: ``1.0``.
Raises:
TypeError: If `t_start_val` is not float.
ValueError: If `t_start_val` is not greater than 0.
"""
t_start_val = Validator.check_positive_float(t_start_val, "t_start_val", self.__class__.__name__)
self._config.t_start_val = t_start_val
def set_t_start_time(self, t_start_time=0.2):
"""
Set value of t_start_time of quantization aware training `config`.
Args:
            t_start_time (float): Fraction of epochs after which temperature hyperparameters start changing,
                default: ``0.2``.
Raises:
TypeError: If `t_start_time` is not float.
ValueError: If `t_start_time` is less than 0. or greater than 1.
"""
t_start_time = Validator.check_float_range(t_start_time, 0.0, 1.0, Rel.INC_BOTH, \
"t_start_time", self.__class__.__name__)
self._config.t_start_time = t_start_time
def set_t_end_time(self, t_end_time=0.6):
"""
Set value of t_end_time of quantization aware training `config`
Args:
            t_end_time (float): Fraction of epochs after which temperature hyperparameters stop changing,
                default: ``0.6``.
Raises:
TypeError: If `t_end_time` is not float.
ValueError: If `t_end_time` is less than 0. or greater than 1.
"""
t_end_time = Validator.check_float_range(t_end_time, 0.0, 1.0, Rel.INC_BOTH,
"t_end_time", self.__class__.__name__)
self._config.t_end_time = t_end_time
def set_t_factor(self, t_factor=1.2):
"""
Set value of t_factor of quantization aware training `config`
Args:
            t_factor (float): Multiplicative factor by which temperature hyperparameters change, default: ``1.2``.
Raises:
TypeError: If `t_factor` is not float.
ValueError: If `t_factor` is not greater than 0.
"""
t_factor = Validator.check_positive_float(t_factor, "t_factor", self.__class__.__name__)
self._config.t_factor = t_factor
@staticmethod
def _convert2list(name, value):
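        """Normalize `value` to a two-element list: a scalar is duplicated, a one-element
        sequence is doubled, and a sequence longer than two raises ValueError."""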
if not isinstance(value, list) and not isinstance(value, tuple):
value = [value, value]
elif len(value) == 1:
value = value + value
elif len(value) > 2:
raise ValueError("The length of input `{}` should not be greater than 2.".format(name))
return value
def _init_net_policy(self, config):
return SlbNetPolicy(config)
def _create_config(self):
"""Create SlbQuantConfig."""
self._config = SlbQuantConfig()
def _update_config_from_dict(self, config: dict):
"""Update `_config` from a dict"""
quant_dtype_list = SlbQuantAwareTraining. \
_convert2list("quant dtype", config.get("quant_dtype", [QuantDtype.INT8, QuantDtype.INT1]))
self.set_act_quant_dtype(quant_dtype_list[0])
self.set_weight_quant_dtype(quant_dtype_list[-1])
self.set_enable_act_quant(config.get("enable_act_quant", False))
self.set_enable_bn_calibration(config.get("enable_bn_calibration", False))
if "epoch_size" in config:
self.set_epoch_size(config["epoch_size"])
if "has_trained_epoch" in config:
self.set_has_trained_epoch(config["has_trained_epoch"])
self.set_t_start_val(config.get("t_start_val", 1.0))
self.set_t_start_time(config.get("t_start_time", 0.2))
self.set_t_end_time(config.get("t_end_time", 0.6))
self.set_t_factor(config.get("t_factor", 1.2))
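        # For illustration only: a config dict handled by this method could look like
        # {"quant_dtype": (QuantDtype.INT8, QuantDtype.INT1), "enable_act_quant": True,
        #  "enable_bn_calibration": True, "epoch_size": 100, "has_trained_epoch": 0,
        #  "t_start_val": 1.0, "t_start_time": 0.2, "t_end_time": 0.6, "t_factor": 1.2}.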
    # pylint: disable=arguments-differ
def callbacks(self, model: Model, dataset: Dataset) -> [Callback]:
"""
Define TemperatureScheduler callback for SLB QAT-algorithm.
Args:
model (Model): Model to be used.
dataset (Dataset): Dataset to be used.
Returns:
            List of Callback instances.
Raises:
RuntimeError: If `epoch_size` is not initialized.
RuntimeError: If `has_trained_epoch` is not initialized.
ValueError: If `epoch_size` is not greater than `has_trained_epoch`.
ValueError: If `t_end_time` is less than `t_start_time`.
TypeError: If `model` is not `mindspore.train.Model`.
TypeError: If `dataset` is not mindspore.dataset.Dataset.
"""
if self._config.epoch_size == -1:
raise RuntimeError("The `epoch_size` need to be initialized!")
if self._config.has_trained_epoch == -1:
raise RuntimeError("The `has_trained_epoch` need to be initialized!")
if self._config.epoch_size <= self._config.has_trained_epoch:
raise ValueError("The `epoch_size` should be greater than `has_trained_epoch`.")
if self._config.t_end_time < self._config.t_start_time:
raise ValueError("The `t_end_time` should not be less than `t_start_time`.")
if not isinstance(model, Model):
raise TypeError(f'The parameter `model` must be isinstance of mindspore.Model, '
f'but got {model}.')
if not isinstance(dataset, Dataset):
raise TypeError(f'The parameter `dataset` must be isinstance of mindspore.dataset.Dataset, '
f'but got {dataset}.')
cb = []
cb.append(TemperatureScheduler(model, self._config.epoch_size, self._config.has_trained_epoch,
self._config.t_start_val, self._config.t_start_time,
self._config.t_end_time, self._config.t_factor))
if self._config.enable_bn_calibration:
cb.append(BNCalibrationCallback(model, dataset, self._config.epoch_size,
self._config.has_trained_epoch, self._config.t_start_time, False))
cb.extend(super(SlbQuantAwareTraining, self).callbacks())
return cb
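    # A minimal usage sketch (illustrative only; the loss/optimizer/metrics setup and the
    # `ds_train` dataset are hypothetical and not part of this module):
    #     model = Model(net_qat, loss_fn=loss, optimizer=opt, metrics={"acc"})
    #     cbs = slb_quantization.callbacks(model, ds_train)
    #     model.train(epoch_size, ds_train, callbacks=cbs)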
def apply(self, network: Cell, **kwargs) -> Cell:
"""
        Apply the SLB quantization algorithm to `network`. The following steps make `network` available for
        quantization aware training:
1. Fuse certain cells in `network` using pattern engine which is defined by net policy.
2. Propagate layer policies defined through cells.
        3. Reduce redundant fake quantizers.
4. Apply layer policies to convert normal cell to `QuantCell`.
Args:
network (Cell): Network to be quantized.
kwargs (Dict): Extensible parameter for subclasses.
Returns:
Quantized network.
"""
self._qat_policy.build()
return super(SlbQuantAwareTraining, self).apply(network)
def convert(self, net_opt: Cell, ckpt_path="") -> Cell:
"""
Define how to convert a compressed network to a standard network before exporting to MindIR.
Args:
net_opt (Cell): Network to be converted which is transformed by `SlbQuantAwareTraining.apply`.
ckpt_path (str): Path to checkpoint file for `net_opt`. Default is ``""``, which means not loading
checkpoint file to `net_opt`.
Returns:
An instance of Cell represents converted network.
Raises:
TypeError: If `net_opt` is not Cell.
TypeError: If `ckpt_path` is not string.
ValueError: If `ckpt_path` is not empty and invalid.
RuntimeError: If loading `ckpt_path` fails.
"""
if not isinstance(net_opt, Cell):
raise TypeError(f'The parameter `net_opt` must be isinstance of Cell, but got {type(net_opt)}.')
if not isinstance(ckpt_path, str):
raise TypeError(f'The parameter `ckpt_path` must be isinstance of str, but got {type(ckpt_path)}.')
if ckpt_path != "" and not os.path.isfile(ckpt_path):
raise ValueError(
f'The parameter `ckpt_path` can only be empty or a valid file, '
f'but got {os.path.realpath(ckpt_path)}.'
)
ckpt_path = os.path.realpath(ckpt_path)
if os.path.isfile(ckpt_path):
param_dict = load_checkpoint(ckpt_path)
not_load_param = load_param_into_net(net_opt, param_dict)
if not_load_param[0]:
raise RuntimeError("Load param into net fail.")
exporter = ConvertToQuantInferNetwork(net_opt, get_quant_dtype_num_bits(self._config.weight_quant_dtype))
return exporter.run()
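    # Typical follow-up (sketch; the checkpoint path and file name are illustrative):
    #     net_deploy = slb_quantization.convert(net_qat, ckpt_path="./slb_qat.ckpt")
    #     mindspore.export(net_deploy, data_in, file_name="./slb_net", file_format="MINDIR")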
def __repr__(self):
"""Display instance object as string."""
s = 'SlbQuantAwareTraining<weight_quant_dtype={}, act_quant_dtype={}, enable_act_quant={}, ' \
'enable_bn_calibration={}, epoch_size={}, has_trained_epoch={}, t_start_val={}, t_start_time={}, ' \
't_end_time={}, t_factor={}>'.format(self._config.weight_quant_dtype, self._config.act_quant_dtype,
self._config.enable_act_quant, self._config.enable_bn_calibration,
self._config.epoch_size, self._config.has_trained_epoch,
self._config.t_start_val, self._config.t_start_time,
self._config.t_end_time, self._config.t_factor)
return s
class TemperatureScheduler(Callback):
"""
Define TemperatureScheduler callback for SLB QAT-algorithm.
"""
def __init__(self, model, epoch_size=100, has_trained_epoch=0,
t_start_val=1.0, t_start_time=0.2, t_end_time=0.6, t_factor=1.2):
super().__init__()
self.epochs = epoch_size
self.has_trained_epoch = has_trained_epoch
self.t_start_val = t_start_val
self.t_start_time = t_start_time
self.t_end_time = t_end_time
self.t_factor = t_factor
self.model = model
def epoch_begin(self, run_context):
"""
Epoch_begin.
"""
cb_params = run_context.original_args()
epoch = cb_params.cur_epoch_num + self.has_trained_epoch
# Compute temperature value
t = self.t_start_val
t_start_epoch = int(self.epochs * self.t_start_time)
t_end_epoch = int(self.epochs * self.t_end_time)
if epoch > t_start_epoch:
t *= self.t_factor ** (min(epoch, t_end_epoch) - t_start_epoch)
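            # Worked example (derived from the formula above, not a separate API): with
            # epochs=100, t_start_time=0.2, t_end_time=0.6 and t_factor=1.2, the temperature
            # stays at t_start_val up to epoch 20, then grows as
            # t_start_val * 1.2 ** (min(epoch, 60) - 20) and saturates after epoch 60.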
# Assign new value to temperature parameter
for _, cell in self.model.train_network.cells_and_names():
if cell.cls_name == 'SlbFakeQuantizerPerLayer': # for SLB
cell.set_temperature(t)
if epoch >= t_end_epoch:
cell.set_temperature_end_flag()
class BNCalibrationCallback(Callback):
'''Update discrete state statistics in BN layers.'''
def __init__(self, model, train_set, epoch_size=100, has_trained_epoch=0,
t_start_time=0.2, dataset_sink_mode=False):
self.dataset_sink_mode = dataset_sink_mode
self.model = model
self.train_set = train_set
self.epochs = epoch_size
self.has_trained_epoch = has_trained_epoch
self.t_start_time = t_start_time
def epoch_end(self, run_context):
"""
Epoch_end.
"""
cb_params = run_context.original_args()
epoch = cb_params.cur_epoch_num + self.has_trained_epoch
t_start_epoch = int(self.epochs * self.t_start_time)
if epoch > t_start_epoch:
# make BN update for train and BNCalibration
for _, cell in self.model.train_network.cells_and_names():
if cell.cls_name == 'BatchNorm2d':
cell.use_batch_statistics = True
self.model.eval(self.train_set, dataset_sink_mode=self.dataset_sink_mode)
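        # Design note (inferred from the code and the comment above): with `use_batch_statistics`
        # forced to True, the `model.eval` pass over the training set lets the BatchNorm layers
        # re-estimate their statistics under the current discrete weights; this is the batchnorm
        # calibration switched on by `enable_bn_calibration`.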