# Source code for qkeras.qpooling

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

import keras
import keras.ops.numpy as knp
from keras import constraints, layers
from keras import ops as Kops
from keras.saving import register_keras_serializable

from .quantizers import get_quantizer



@register_keras_serializable(package="qkeras")
class QAveragePooling2D(layers.AveragePooling2D):
    """Computes the quantized version of AveragePooling2D.

    The layer pools exactly like its Keras base class, except that the
    `1 / pool_area` averaging factor is passed through `average_quantizer`
    before it is applied, and an optional quantized activation is applied to
    the pooled output.

    Args:
        pool_size: Forwarded unchanged to `AveragePooling2D`.
        strides: Forwarded unchanged to `AveragePooling2D`.
        padding: Forwarded unchanged to `AveragePooling2D`.
        data_format: Forwarded unchanged to `AveragePooling2D`.
        average_quantizer: Quantizer specification for the averaging factor.
            It is resolved with `get_quantizer`. When it is falsy the layer
            falls back to the plain Keras average pooling.
        activation: Optional activation specification. When it is not None it
            is resolved with `get_quantizer` and applied to the layer output.
        **kwargs: Forwarded unchanged to `AveragePooling2D`.
    """

    def __init__(
        self,
        pool_size=(2, 2),
        strides=None,
        padding="valid",
        data_format=None,
        average_quantizer=None,
        activation=None,
        **kwargs,
    ):
        # Keep both the user-facing specification and the resolved quantizer.
        self.average_quantizer = average_quantizer
        self.average_quantizer_internal = get_quantizer(self.average_quantizer)
        self.quantizers = [self.average_quantizer_internal]

        self.activation = (
            get_quantizer(activation) if activation is not None else None
        )

        super().__init__(
            pool_size=pool_size,
            strides=strides,
            padding=padding,
            data_format=data_format,
            **kwargs,
        )

    def call(self, inputs):
        """Performs quantized AveragePooling followed by QActivation.

        Since there is no specific parameter for the averaging op, we cannot
        apply the averaging quantizer to the op itself. There are four options:

        1. Perform our own average as a sum, then multiply with the inverse of
           the division factor: sum(x) * quantize(1 / pool_area).
        2. Call the keras version of averaging first: y1 = keras_average(x),
           then multiply it with the pool area: y2 = y1 * pool_area,
           and last y3 = y2 * quantize(1 / pool_area).
        3. Improved version of #2 that multiplies x with pool_area before
           averaging so that no precision is lost during averaging:
           y1 = x * pool_area, y2 = keras_average(y1),
           y3 = y2 * quantize(1 / pool_area).
        4. Since this is a sum-pooling operation, use depthwise_conv2d with
           kernel weights = 1 to get the pooling sum. No precision is lost due
           to averaging, but this introduces extra weights to the layer, which
           might break code elsewhere.

        Since we need to match software and hardware inference numerics, #3 is
        the option implemented here.

        Args:
            inputs: Input tensor to pool.

        Returns:
            The pooled tensor, passed through `self.activation` when one is
            configured.
        """
        if self.average_quantizer:
            # Calculates the pool area.
            if isinstance(self.pool_size, int):
                pool_area = self.pool_size * self.pool_size
            else:
                pool_area = knp.prod(self.pool_size)

            inputs = Kops.cast(inputs, dtype=float)
            pool_area = Kops.cast(pool_area, dtype=float)

            # Calculates the pooling average of x * pool_area (option #3).
            x = super().call(inputs * pool_area)

            # Quantizes the multiplication factor.
            mult_factor = 1.0 / pool_area
            q_mult_factor = self.average_quantizer_internal(mult_factor)
            q_mult_factor = Kops.cast(q_mult_factor, dtype=float)

            # Computes the pooling average.
            x = x * q_mult_factor
        else:
            # No quantizer is available, so directly call the keras layer.
            x = super().call(inputs)

        if self.activation is not None:
            return self.activation(x)
        return x

    def get_config(self):
        """Returns the base layer config extended with the quantizer entries.

        The `average_quantizer` and `activation` entries hold the serialized
        form of the resolved quantizer objects.
        """
        config = {
            "average_quantizer": constraints.serialize(
                self.average_quantizer_internal
            ),
            "activation": constraints.serialize(self.activation),
        }
        base_config = super().get_config()
        # Entries defined here take precedence over the base config.
        return {**base_config, **config}

    def get_quantization_config(self):
        """Returns the string form of the averaging quantizer and activation."""
        return {
            "average_quantizer": str(self.average_quantizer_internal),
            "activation": str(self.activation),
        }

    def get_quantizers(self):
        """Returns the list holding the resolved averaging quantizer."""
        return self.quantizers





@register_keras_serializable(package="qkeras")
class QGlobalAveragePooling2D(layers.GlobalAveragePooling2D):
    """Computes the quantized version of GlobalAveragePooling2D.

    When an averaging quantizer is configured, the layer computes the pooling
    sum itself and multiplies it by the quantized `1 / pool_area` factor.
    Otherwise it defers to the Keras base class. An optional quantized
    activation is applied to the result.

    Args:
        data_format: Forwarded unchanged to `GlobalAveragePooling2D`.
        average_quantizer: Quantizer specification for the averaging factor.
            It is resolved with `get_quantizer`. When it is falsy the layer
            falls back to the plain Keras global average pooling.
        activation: Optional activation specification. When it is not None it
            is resolved with `get_quantizer` and applied to the layer output.
        **kwargs: Forwarded unchanged to `GlobalAveragePooling2D`.
    """

    def __init__(
        self, data_format=None, average_quantizer=None, activation=None, **kwargs
    ):
        # Keep both the user-facing specification and the resolved quantizer.
        self.average_quantizer = average_quantizer
        self.average_quantizer_internal = get_quantizer(self.average_quantizer)
        self.quantizers = [self.average_quantizer_internal]

        self.activation = (
            get_quantizer(activation) if activation is not None else None
        )

        super().__init__(data_format=data_format, **kwargs)

    def compute_pooling_area(self, input_shape):
        """Returns the product of the two pooled dimensions of `input_shape`.

        Dimensions 1 and 2 are used when `data_format` is "channels_last",
        dimensions 2 and 3 otherwise. Both dimensions must be concrete
        numbers; a `None` entry makes the multiplication fail.

        Args:
            input_shape: Shape of the layer input, as a tuple or any other
                indexable sequence of dimensions.

        Returns:
            The product of the two selected dimensions.
        """
        # Normalize list-like / backend shape objects to a plain tuple.
        if not isinstance(input_shape, tuple):
            input_shape = tuple(input_shape)
        if self.data_format == "channels_last":
            return input_shape[1] * input_shape[2]
        return input_shape[2] * input_shape[3]

    def call(self, inputs):
        """Performs quantized GlobalAveragePooling followed by QActivation.

        Since there is no specific parameter for the averaging op, we cannot
        apply the averaging quantizer to the op itself. There are three
        options:

        1. Perform our own average as a sum, then multiply with the inverse of
           the division factor: sum(x) * quantize(1 / pool_area).
        2. Call the keras version of averaging first:
           y1 = keras_global_average(x),
           then multiply it with the denominator (pool_area) used by averaging:
           y2 = y1 * pool_area,
           and last y3 = y2 * quantize(1 / pool_area).
        3. Perform the pooling sum, then multiply the sum with the quantized
           inverse multiplication factor to get the average value.

        A previous implementation used option #2, but minor numerical
        mismatches between software and hardware inference were observed.
        Therefore #3 is the current implementation.

        Args:
            inputs: Input tensor to pool.

        Returns:
            The pooled tensor, passed through `self.activation` when one is
            configured.
        """
        if self.average_quantizer:
            # Calculates the pooling sum over the two pooled axes.
            if self.data_format == "channels_last":
                x = Kops.sum(inputs, axis=[1, 2], keepdims=self.keepdims)
            else:
                x = Kops.sum(inputs, axis=[2, 3], keepdims=self.keepdims)

            # Calculates the pooling area.
            pool_area = self.compute_pooling_area(input_shape=inputs.shape)

            # Quantizes the inverse multiplication factor.
            mult_factor = 1.0 / pool_area
            q_mult_factor = self.average_quantizer_internal(mult_factor)

            # Derives the average pooling value from the pooling sum.
            x = x * q_mult_factor
        else:
            # If no quantizer is available, call the keras layer.
            x = super().call(inputs)

        if self.activation is not None:
            return self.activation(x)
        return x

    def get_config(self):
        """Returns the base layer config extended with the quantizer entries.

        The `average_quantizer` and `activation` entries hold the serialized
        form of the resolved quantizer objects.
        """
        config = {
            "average_quantizer": constraints.serialize(
                self.average_quantizer_internal
            ),
            "activation": constraints.serialize(self.activation),
        }
        base_config = super().get_config()
        # Entries defined here take precedence over the base config.
        return {**base_config, **config}

    def get_quantization_config(self):
        """Returns the string form of the averaging quantizer and activation."""
        return {
            "average_quantizer": str(self.average_quantizer_internal),
            "activation": str(self.activation),
        }

    def get_quantizers(self):
        """Returns the list holding the resolved averaging quantizer."""
        return self.quantizers