Source code for rational.keras.rationals

"""
Rational Activation Functions for tensorflow/keras
==================================================

This module allows you to create Rational Neural Networks using Learnable
Rational activation functions.
"""
from tensorflow.keras.layers import Layer
import tensorflow as tf

from rational.keras.versions import _version_a, _version_b, _version_c, \
    _version_d
from rational.utils.get_weights import get_parameters
from rational._base.rational_base import Rational_base


[docs]class Rational(Rational_base, Layer):
    """
    Rational Activation Functions, inheriting from \
    ``tensorflow.keras.layers.Layer``.

    Arguments:
            approx_func (str):
                The name of the approximated function for initialisation.
                The different functions are available in `rational.rationals_config.json`. \n
                Default: ``leaky_relu``

            degrees (tuple of int):
                The degrees of the numerator (P) and denominator (Q). \n
                Default: ``(5, 4)``

            cuda (bool):
                whether to execute on cuda device.
                NOTE: THIS PARAMETER IS CURRENTLY NOT CONSIDERED.
                CUDA GPUS ARE USED WHEN IT IS POSSIBLE

            version (str):
                Version of Rational to use. Rational(x) = P(x)/Q(x),
                where
                P(x) = (a_0 + a_1 * x + a_2 * x^2 + ... + a_n * x^n) and \n

                `A`: Q(x) = (1 + \|b_0 * x\| + \| b_1 * x^2\| + ... +  \| b_m * x^{m+1}\|) \n
                `B`: Q(x) = (1 + \|b_0 * x + b_1 * x^2 + ... + b_m * x^{m + 1}\|) \n
                `C`: Q(x) = (0.1 + \|b_0 + b_1 * x + b_2 * x^2 + ... + b_m * x^m\|) \n
                `D`: like `B` with noised coefficients b_i \n

                Default: ``A``

            trainable (bool):
                Whether the weights are trainable, i.e, if they are updated during
                backward pass. \n
                Default: ``True``

    Returns:
        Layer:
            Rational layer
    """
    def __init__(self, approx_func="leaky_relu", degrees=(5, 4), cuda=False, version="A",
                 trainable=True, name=None):
        if name is None:
            name = approx_func
        super().__init__(name)

        w_numerator, w_denominator = get_parameters(version, degrees, approx_func)

        # add trainable weight vectors for numerator (a_0, ... a_n) and denominator (b_0, ... b_m)
        self.numerator = self.add_weight(shape=(len(w_numerator),), name='w_numerator',
                                         trainable=trainable,
                                         initializer=tf.keras.initializers.Constant(w_numerator))

        self.denominator = self.add_weight(shape=(len(w_denominator),), name='w_denominator',
                                           trainable=trainable,
                                           initializer=tf.keras.initializers
                                           .Constant(w_denominator))

        # record whether weights are trainable. Used later by call() method
        self.training = trainable
        self.degrees = degrees
        self.version = version
        self.init_approximation = approx_func

        # set rational activation function version
        self.rational_func = {'A': _version_a, 'B': _version_b, 'C': _version_c, 'D': _version_d}\
            .get(version)
        if self.rational_func is None:
            raise ValueError("rational activation function version %s not implemented" % version)


[docs]    def build(self, input_shape):
        """
        Inherited from ``tensorflow.keras.layers.Layer``

        This method can be used to create weights that depend on the shape(s) of the input(s),
        using ``add_weight()``. ``__call__()`` will automatically build the layer (if it has not
        been built yet) by calling ``build()``.

        Arguments:
            input_shape (TensorShape):
                one or a list of instances of `TensorShape` if
                the layer expects a list of inputs (one instance per input).
        """
        super(Rational, self).build(input_shape)

[docs]    def call(self, inputs, **kwargs):
        """
        Inherited from ``tensorflow.keras.layers.Layer``

        Called in ``__call__`` after making sure ``build()`` has been called. ``call()`` performs
        the logic of applying the layer to the input tensors (which should be passed in as
        argument). Two reserved keyword arguments you can optionally use in ``call()`` are:

        - training (boolean, whether the call is in inference mode or training mode)
        - mask (boolean tensor encoding masked timesteps in the input, used in RNN layers)

        Arguments:
                inputs:
                    Input tensorflow tensor
        Returns:
                output tensor, with the Rational Activation Function applied to it
        """
        return self.rational_func(inputs, self.numerator, self.denominator, self.training)

[docs]    def numpy(self):
        """
        Returns a numpy version of this activation function.
        """
        from rational.numpy import Rational as Rational_numpy
        rational_n = Rational_numpy(self.init_approximation, self.degrees,
                                    self.version)
        rational_n.numerator = self.numerator.numpy().tolist()
        rational_n.denominator = self.denominator.numpy().tolist()
        return rational_n

    @property
    def device(self):
        return self.numerator.device.split("device:")[-1]