Source code for cnn2snn.quantization_layers

#!/usr/bin/env python
# ******************************************************************************
# Copyright 2020 Brainchip Holdings Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ******************************************************************************
"""Quantized layers API: neural quantized layers and quantized activations"""

# Tensorflow imports
import tensorflow as tf
from keras import backend as K
from keras import layers
from keras.utils.generic_utils import serialize_keras_object
from keras.utils import conv_utils
from tensorflow.python.ops import nn
from .quantization_ops import get as get_quantizer
from .quantization_ops import ceil_through


def _check_unsupported_args(kwargs, unsupported_args):
    """Raises error if unsupported argument are present in kwargs.

    For now, 4 arguments are unsupported: 'data_format', 'activation',
        'dilation_rate', 'depth_mutiplier'.

    Args:
        kwargs (dictionary): keyword arguments to check.
        unsupported_args: list of unsupported arguments.

    """
    for kwarg in kwargs:
        if kwarg in unsupported_args:
            raise TypeError("Unsupported argument in quantized layers:", kwarg)


[docs]class QuantizedConv2D(layers.Conv2D): """A quantization-aware Keras convolutional layer. Inherits from Keras Conv2D layer, applying a quantization on weights during the forward pass. Args: filters (int): the number of filters. kernel_size (tuple of integer): the kernel spatial dimensions. quantizer (:obj:`cnn2snn.WeightQuantizer`): the quantizer to apply during the forward pass. strides (integer, or tuple of integers, optional): strides of the convolution along spatial dimensions. padding (str, optional): one of 'valid' or 'same'. use_bias (boolean, optional): whether the layer uses a bias vector. kernel_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the weights matrix. bias_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the bias vector. kernel_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the weights. bias_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the bias. activity_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the output of the layer. kernel_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the weights. bias_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the bias. """ unsupported_args = { 'data_format': 'channels_last', 'activation': 'linear', 'dilation_rate': (1, 1), 'groups': 1 } def __init__(self, filters, kernel_size, quantizer, strides=(1, 1), padding='valid', use_bias=True, kernel_initializer='glorot_uniform', bias_initializer='zeros', kernel_regularizer=None, bias_regularizer=None, activity_regularizer=None, kernel_constraint=None, bias_constraint=None, **kwargs): _check_unsupported_args(kwargs, self.unsupported_args) self.quantizer = get_quantizer(quantizer) super().__init__(filters=filters, kernel_size=kernel_size, strides=strides, padding=padding, use_bias=use_bias, kernel_initializer=kernel_initializer, bias_initializer=bias_initializer, kernel_regularizer=kernel_regularizer, bias_regularizer=bias_regularizer, activity_regularizer=activity_regularizer, kernel_constraint=kernel_constraint, bias_constraint=bias_constraint, **kwargs)
[docs] def call(self, inputs): """Evaluates input Tensor. This applies the quantization on weights, then evaluates the input Tensor and produces the output Tensor. Args: inputs(:obj:`tensorflow.Tensor`): input Tensor. Returns: :obj:`tensorflow.Tensor`: output Tensor. """ input_shape = inputs.shape outputs = self.convolution_op(inputs, self.quantizer.quantize(self.kernel)) if self.use_bias: output_rank = outputs.shape.rank # Handle multiple batch dimensions. if output_rank is not None and output_rank > 2 + self.rank: def _apply_fn(o): return tf.nn.bias_add(o, self.bias, data_format=self._tf_data_format) outputs = conv_utils.squeeze_batch_dims( outputs, _apply_fn, inner_rank=self.rank + 1) else: outputs = tf.nn.bias_add(outputs, self.bias, data_format=self._tf_data_format) if not tf.executing_eagerly(): # Infer the static output shape: out_shape = self.compute_output_shape(input_shape) outputs.set_shape(out_shape) return outputs
[docs] def get_config(self): config = super().get_config() config['quantizer'] = serialize_keras_object(self.quantizer) for kwarg in self.unsupported_args: config.pop(kwarg, None) return config
class QuantizedDepthwiseConv2D(layers.DepthwiseConv2D): """A quantization-aware Keras depthwise convolutional layer. Inherits from Keras DepthwiseConv2D layer, applying a quantization on weights during the forward pass. Args: kernel_size (a tuple of integer): the kernel spatial dimensions. strides (integer, or tuple of integers, optional): strides of the convolution along spatial dimensions. quantizer (:obj:`cnn2snn.WeightQuantizer`): the quantizer to apply during the forward pass. padding (str, optional): One of 'valid' or 'same'. use_bias (boolean, optional): whether the layer uses a bias vector. depthwise_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the weights matrix. bias_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the bias vector. depthwise_regularizer (str, or a :obj:`tf.keras.initializer`, optional): regularization applied to the weights. bias_regularizer (str, or a :obj:`tf.keras.initializer`, optional): regularization applied to the bias. activity_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the output of the layer. depthwise_constraint (str, or a :obj:`tf.keras.initializer`, optional): constraint applied to the weights. bias_constraint (str, or a :obj:`tf.keras.initializer`, optional): constraint applied to the bias. """ unsupported_args = { 'data_format': 'channels_last', 'activation': 'linear', 'depth_multiplier': 1 } def __init__(self, kernel_size, quantizer, strides=(1, 1), padding='valid', use_bias=True, depthwise_initializer='glorot_uniform', bias_initializer='zeros', depthwise_regularizer=None, bias_regularizer=None, activity_regularizer=None, depthwise_constraint=None, bias_constraint=None, **kwargs): _check_unsupported_args(kwargs, self.unsupported_args) self.quantizer = get_quantizer(quantizer) super().__init__(kernel_size=kernel_size, strides=strides, padding=padding, use_bias=use_bias, depthwise_initializer=depthwise_initializer, bias_initializer=bias_initializer, depthwise_regularizer=depthwise_regularizer, bias_regularizer=bias_regularizer, activity_regularizer=activity_regularizer, depthwise_constraint=depthwise_constraint, bias_constraint=bias_constraint, **kwargs) def call(self, inputs): """Evaluates input Tensor. This applies the quantization on weights, then evaluates the input Tensor and produces the output Tensor. Args: inputs (:obj:`tensorflow.Tensor`): input Tensor. Returns: :obj:`tensorflow.Tensor`: output Tensor. """ # We don't support biases return K.depthwise_conv2d(inputs, self.quantizer.quantize( self.depthwise_kernel), strides=self.strides, padding=self.padding, dilation_rate=self.dilation_rate, data_format=self.data_format) def get_config(self): config = super().get_config() config['quantizer'] = serialize_keras_object(self.quantizer) for kwarg in self.unsupported_args: config.pop(kwarg, None) return config
[docs]class QuantizedDense(layers.Dense): """A quantization-aware Keras dense layer. Inherits from Keras Dense layer, applying a quantization on weights during the forward pass. Args: units (int): the number of neurons. use_bias (boolean, optional): whether the layer uses a bias vector. quantizer (:obj:`cnn2snn.WeightQuantizer`): the quantizer to apply during the forward pass. kernel_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the weights matrix. bias_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the bias vector. kernel_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the weights. bias_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the bias. activity_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the output of the layer. kernel_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the weights. bias_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the bias. """ unsupported_args = {'activation': 'linear'} def __init__(self, units, quantizer, use_bias=True, kernel_initializer='glorot_uniform', bias_initializer='zeros', kernel_regularizer=None, bias_regularizer=None, activity_regularizer=None, kernel_constraint=None, bias_constraint=None, **kwargs): _check_unsupported_args(kwargs, self.unsupported_args) self.quantizer = get_quantizer(quantizer) super().__init__(units=units, use_bias=use_bias, kernel_initializer=kernel_initializer, bias_initializer=bias_initializer, kernel_regularizer=kernel_regularizer, bias_regularizer=bias_regularizer, activity_regularizer=activity_regularizer, kernel_constraint=kernel_constraint, bias_constraint=bias_constraint, **kwargs)
[docs] def call(self, inputs): """Evaluates input Tensor. This applies the quantization on weights, then evaluates the input Tensor and produces the output Tensor. Args: inputs (:obj:`tensorflow.Tensor`): input Tensor. Returns: :obj:`tensorflow.Tensor`: output Tensor. """ if inputs.dtype.base_dtype != self._compute_dtype_object.base_dtype: inputs = tf.cast(inputs, dtype=self._compute_dtype_object) if isinstance(inputs, tf.RaggedTensor): raise TypeError(f"The inputs of a Dense Layer must be a uniform \ Tensor. Received {type(inputs)}") kernel = self.quantizer.quantize(self.kernel) rank = inputs.shape.rank if rank == 2 or rank is None: # We use embedding_lookup_sparse as a more efficient matmul # operation for large sparse input tensors. The op will result in a # sparse gradient, as opposed to # sparse_ops.sparse_tensor_dense_matmul which results in dense # gradients. This can lead to sigfinicant speedups, see b/171762937. if isinstance(inputs, tf.SparseTensor): raise TypeError( f"The inputs of a Dense Layer must be a uniform \ Tensor. Received {type(inputs)}") outputs = tf.raw_ops.MatMul(a=inputs, b=kernel) # Broadcast kernel to inputs. else: outputs = tf.tensordot(inputs, kernel, [[rank - 1], [0]]) # Reshape the output back to the original ndim of the input. if not tf.executing_eagerly(): shape = inputs.shape.as_list() output_shape = shape[:-1] + [kernel.shape[-1]] outputs.set_shape(output_shape) if self.use_bias: outputs = tf.nn.bias_add(outputs, self.bias) return outputs
[docs] def get_config(self): config = super().get_config() config['quantizer'] = serialize_keras_object(self.quantizer) for kwarg in self.unsupported_args: config.pop(kwarg, None) return config
[docs]class QuantizedSeparableConv2D(layers.SeparableConv2D): """A quantization-aware Keras separable convolutional layer. Inherits from Keras SeparableConv2D layer, applying a quantization on weights during the forward pass. Creates a quantization-aware separable convolutional layer. Args: filters (int): the number of filters. kernel_size (tuple of integer): the kernel spatial dimensions. quantizer (:obj:`cnn2snn.WeightQuantizer`): the quantizer to apply during the forward pass. quantizer_dw (:obj:`cnn2snn.WeightQuantizer`, optional): the depthwise quantizer to apply during the forward pass. strides (integer, or tuple of integers, optional): strides of the convolution along spatial dimensions. padding (str, optional): One of 'valid' or 'same'. use_bias (boolean, optional): Whether the layer uses a bias vector. depthwise_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the depthwise kernel. pointwise_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the pointwise kernel. bias_initializer (str, or a :obj:`tf.keras.initializer`, optional): initializer for the bias vector. depthwise_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the depthwise kernel. pointwise_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the pointwise kernel. bias_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the bias. activity_regularizer (str, or a :obj:`tf.keras.regularizer`, optional): regularization applied to the output of the layer. depthwise_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the depthwise kernel. pointwise_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the pointwise kernel. bias_constraint (str, or a :obj:`tf.keras.constraint`, optional): constraint applied to the bias. """ unsupported_args = { 'data_format': 'channels_last', 'activation': 'linear', 'dilation_rate': (1, 1), 'depth_multiplier': 1 } def __init__(self, filters, kernel_size, quantizer, quantizer_dw=None, strides=(1, 1), padding='valid', use_bias=True, depthwise_initializer='glorot_uniform', pointwise_initializer='glorot_uniform', bias_initializer='zeros', depthwise_regularizer=None, pointwise_regularizer=None, bias_regularizer=None, activity_regularizer=None, depthwise_constraint=None, pointwise_constraint=None, bias_constraint=None, **kwargs): _check_unsupported_args(kwargs, self.unsupported_args) self.quantizer = get_quantizer(quantizer) if quantizer_dw is None: # If no depthwise quantizer provided, use the pointwise quantizer # Note: this is compatible with legacy models self.quantizer_dw = self.quantizer.__class__.from_config( self.quantizer.get_config()) else: self.quantizer_dw = get_quantizer(quantizer_dw) super().__init__(filters=filters, kernel_size=kernel_size, strides=strides, padding=padding, use_bias=use_bias, depthwise_initializer=depthwise_initializer, pointwise_initializer=pointwise_initializer, bias_initializer=bias_initializer, depthwise_regularizer=depthwise_regularizer, pointwise_regularizer=pointwise_regularizer, bias_regularizer=bias_regularizer, activity_regularizer=activity_regularizer, depthwise_constraint=depthwise_constraint, pointwise_constraint=pointwise_constraint, bias_constraint=bias_constraint, **kwargs)
[docs] def call(self, inputs): """Evaluates input Tensor. This applies the quantization on weights, then evaluates the input Tensor and produces the output Tensor. Args: inputs (:obj:`tensorflow.Tensor`): input Tensor. Returns: :obj:`tensorflow.Tensor`: a Tensor. """ strides = (1,) + self.strides + (1,) outputs = nn.separable_conv2d( inputs, self.quantizer_dw.quantize(self.depthwise_kernel), self.quantizer.quantize(self.pointwise_kernel), strides=strides, padding=self.padding.upper(), rate=self.dilation_rate, data_format=conv_utils.convert_data_format(self.data_format, ndim=4)) if self.use_bias: outputs = nn.bias_add(outputs, self.bias, data_format=conv_utils.convert_data_format( self.data_format, ndim=4)) return outputs
[docs] def get_config(self): config = super().get_config() config['quantizer_dw'] = serialize_keras_object(self.quantizer_dw) config['quantizer'] = serialize_keras_object(self.quantizer) for kwarg in self.unsupported_args: config.pop(kwarg, None) return config
[docs]class QuantizedActivation(layers.Layer): """Base class for quantized activation layers. This base class must be overloaded as well as the `step` @property function. This @property function must return a TensorFlow object (e.g. tf.Tensor or tf.Variable) of scalar values. The `.numpy()` method must be callable on them. They can be fixed at initialization or can be trainable variables. The CNN2SNN toolkit only support linear quantized activation as defined in the `quantized_activation` function. The bitwidth defines the number of quantization levels on which the activation will be quantized. For instance, a 4-bit quantization gives 15 activation levels. More generally, a n-bit quantization gives 2^n-1 levels. Args: bitwidth (int): the quantization bitwidth """ def __init__(self, bitwidth, **kwargs): if bitwidth <= 0: raise ValueError("Activation 'bitwidth' must be greater than zero." f" Receives 'bitwidth' {bitwidth}.") self.bitwidth_ = bitwidth self.levels = 2.**bitwidth - 1 super().__init__(**kwargs)
[docs] def quantized_activation(self, x): """Evaluates the quantized activations for the specified input Tensor. Activations will be clipped to a quantization range, and quantized to a number of values defined by the bitwidth: N = (2^bitwidth - 1) values plus zero. The quantization is defined by a single step parameter, that defines the interval between two quantized values. A quantization threshold set to half the quantization step is used to evaluate the quantization intervals, to make sure that each quantized value is exactly in the middle of its quantization interval, thus minimizing the quantization error. For any potential x, the activation output is as follows: - if x <= threshold, activation is zero - if threshold + (n - 1) * step < x <= threshold + n * step, activation is n * step - if x > threshold + levels * step, activation is levels * step Args: x (:obj:`tensorflow.Tensor`): the input values. """ act = ceil_through((x - self.threshold) / self.step) clip_act = tf.clip_by_value(act, 0, self.levels) return self.step * clip_act
[docs] def call(self, inputs, *args, **kwargs): """Evaluates the quantized activations for the specified input Tensor. """ return self.quantized_activation(inputs)
@property def bitwidth(self): """Returns the bitwidth of the quantized activation""" return self.bitwidth_ @property def threshold(self): """The quantization threshold is equal to half the quantization step to better approximate the ReLU. """ return self.step * 0.5 @property def step(self): """Returns the interval between two quantized activation values""" raise NotImplementedError()
[docs] def get_config(self): config = super().get_config() config.update({'bitwidth': self.bitwidth_}) return config
[docs]class ActivationDiscreteRelu(QuantizedActivation): """A discrete ReLU Keras Activation. For bitwidth 1 or 2: - threshold is 0.5 and step is 1 For bithwidth > 2, with N = 2^bitwidth - 1: - threshold is 3 / N and step is 6 / N Args: bitwidth (int): the activation bitwidth. """ def __init__(self, bitwidth=1, **kwargs): super().__init__(bitwidth, **kwargs) relumax = min(self.levels, 6) self.step_ = tf.constant(relumax / self.levels) @property def step(self): return self.step_
[docs]class QuantizedReLU(QuantizedActivation): """A configurable Quantized ReLU Keras Activation. In addition to the quantization bitwidth, this class can be initialized with a max_value parameter corresponding to the ReLU maximum value. Args: bitwidth (int): the activation bitwidth. max_value (float): the initial max_value """ def __init__(self, bitwidth=1, max_value=None, **kwargs): super().__init__(bitwidth, **kwargs) # The max_value defaults to None for ReLU, which means unclipped. # For QuantizedReLU we need to set a value, by default we align # on the bitwidth. if max_value is None: max_value = 2.**bitwidth - 1 self.max_value_ = tf.constant(max_value, dtype=tf.float32) # Evaluate the quantization step self.step_ = tf.constant(self.max_value_ / self.levels, dtype=tf.float32) @property def step(self): return self.step_
[docs] def get_config(self): config = super().get_config() config.update({'max_value': self.max_value_.numpy()}) return config