Source code for aihwkit.simulator.digital_low_precision.quantization_manager

# -*- coding: utf-8 -*-

# # Copyright (c) 2021 Qualcomm Technologies, Inc.
# All Rights Reserved.

# (C) Copyright 2020, 2021, 2022, 2023, 2024 IBM. All Rights Reserved.
#
# Licensed under the MIT license. See LICENSE file in the project root for details.

# pylint: skip-file
# type: ignore


from enum import Enum

from torch import nn

from aihwkit.simulator.digital_low_precision.quantizers import (
    QMethods,
    QuantizerBase,
    QuantizerNotInitializedError,
)
from aihwkit.simulator.digital_low_precision.range_estimators import RangeEstimators



[docs]
class Qstates(Enum):
    estimate_ranges = 0  # ranges are updated in eval and train mode
    fix_ranges = 1  # quantization ranges are fixed for train and eval
    learn_ranges = 2  # quantization params are nn.Parameters
    estimate_ranges_train = 3  # quantization ranges are updated during train and fixed for eval




[docs]
class QuantizationManager(nn.Module):
    """Implementation of Quantization and Quantization Range Estimation

    Parameters
    ----------
    n_bits: int
        Number of bits for the quantization.
    qmethod: QMethods member (Enum)
        The quantization scheme to use, e.g. symmetric_uniform, asymmetric_uniform,
        qmn_uniform etc.
    init: RangeEstimators member (Enum)
        Initialization method for the grid from
    per_channel: bool
        If true, will use a separate quantization grid for each kernel/channle.
    x_min: float or PyTorch Tensor
        The minimum value which needs to be represented.
    x_max: float or PyTorch Tensor
        The maximum value which needs to be represented.
    """

    def __init__(
        self,
        qmethod=QMethods.symmetric_uniform,
        init=RangeEstimators.current_minmax,
        per_channel=False,
        axis=None,
        n_groups=None,
        x_min=None,
        x_max=None,
        qparams=None,
        init_params=None,
    ):
        super().__init__()
        self.state = Qstates.estimate_ranges_train
        self.qmethod = qmethod
        self.init = init
        self.per_channel = per_channel
        self.axis = axis
        self.n_groups = n_groups
        self.qparams = qparams if qparams else {}
        self.init_params = init_params if init_params else {}
        self.range_estimator = None

        # define quantizer
        self.quantizer: QuantizerBase = self.qmethod.cls(
            per_channel=per_channel, axis=axis, **qparams
        )

        # define range estimation method for quantizer initialisation
        if x_min is not None and x_max is not None:
            self.set_quant_range(x_min, x_max)
            self.state = Qstates.fix_ranges
        else:
            # set up the collector function to set the ranges
            self.range_estimator = self.init.cls(
                per_channel=self.per_channel,
                quantizer=(
                    self.quantizer if self.init.value.value > 2 else None
                ),  # For MSE and the crossentropy range estimators
                axis=self.axis,
                n_groups=self.n_groups,
                **self.init_params,
            )

    @property
    def n_bits(self):
        return self.quantizer.n_bits


[docs]
    def estimate_ranges(self):
        self.state = Qstates.estimate_ranges



[docs]
    def fix_ranges(self):
        if self.quantizer.is_initialized:
            self.state = Qstates.fix_ranges
        else:
            raise QuantizerNotInitializedError()



[docs]
    def learn_ranges(self):
        self.quantizer.make_range_trainable()
        self.state = Qstates.learn_ranges



[docs]
    def estimate_ranges_train(self):
        self.state = Qstates.estimate_ranges_train



[docs]
    def is_learning(self) -> bool:
        return self.state == Qstates.learn_ranges



[docs]
    def reset_ranges(self):
        self.range_estimator.reset()
        self.quantizer.reset()
        self.estimate_ranges_train()



[docs]
    def forward(self, x):
        if self.range_estimator.per_group_range_estimation:
            self.range_estimator(x)
            return x

        if self.state == Qstates.estimate_ranges or (
            self.state == Qstates.estimate_ranges_train and self.training
        ):
            # Note this can be per tensor or per channel
            cur_xmin, cur_xmax = self.range_estimator(x)
            self.set_quant_range(cur_xmin, cur_xmax)

        return self.quantizer(x)



[docs]
    def set_quant_range(self, x_min, x_max):
        self.quantizer.set_quant_range(x_min, x_max)



[docs]
    def extra_repr(self):
        return "state={}".format(self.state.name)