Source code for hosa.models.cnn.cnn_models

"""
Utilities for Convolutional Neural Network (CNN) models.
"""
import abc

import numpy as np
import tensorflow as tf
from sklearn.metrics import r2_score, mean_squared_error
from sklearn.model_selection import train_test_split

from hosa.callbacks import EarlyStoppingAtMinLoss
from hosa.helpers.functions import metrics_multiclass


[docs]class BaseCNN:
    """Base class for Convolutional Neural Network (CNN) models for classification and
    regression.

    Each CNN model comprises an input layer, a set of groups of layers (GofLayers [Men20]_)—where
    each group is composed of one convolution layer, followed by one pooling
    layer and a dropout layer—, a dense layer, and an output layer. The output layer is a
    dense layer with ``n_outputs`` units, and with the softmax activation function (for
    classification) or the linear activation function (for regression).

    .. warning::
        This class should not be used directly. Use derived classes instead, i.e.,
        :class:`.CNNClassification` or :class:`.CNNRegression`.

    .. note::
        The parameters used in this library were adapted from the exact parameters of the
        TensorFlow library. Descriptions were thus modified accordingly to our approach.
        However, refer to the TensorFlow documentation for more details about each of those
        parameters.

    Args:
        n_outputs (int): Number of class labels in classification, or the number of numerical
            values to predict in regression.
        n_kernels (list): *i*-th element represents the number of output filters of the
            convolution layer in the *i*-th GofLayer.
        n_neurons_dense_layer (int): Number of neuron units in the dense layer (i.e.,
            the dense layer after the set of groups of layers).
        optimizer (str): Name of the optimizer. See `tensorflow.keras.optimizers
            <https://www.tensorflow.org/api_docs/python/tf/keras/optimizers>`_.
        cnn_dim (int): Number of dimensions applicable to *all* the convolution layers of the
            GofLayers.
        kernel_size (int or tuple): Integer or tuple/list of integers, specifying the length
            (for ``cnn_dim`` = 1), the height and width (for ``cnn_dim`` = 2), or  the depth,
            height and width (for ``cnn_dim`` = 3) of the convolution window. It can also be a
            single integer to specify the same value for all spatial dimensions. This applies to
            *all* the convolution layers of the GofLayers.
        pool_size (int or tuple): Size of the max-pooling window applicable to *all* the
            max-pooling layers of the GofLayers. For ``cnn_dim`` = 1, use a tuple with 1 integer;
            For ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions.
        strides_convolution (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the convolution. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the convolution layers of the GofLayers.
        strides_pooling (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the pooling. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the pooling layers of the GofLayers.
        padding (str): Available options are ``valid`` or ``same``. ``valid`` means no
            padding. ``same`` results in padding evenly to the left/right or up/down of the input
            such that output has the same height/width dimension as the input. This applies to
            *all* the pooling layers of the GofLayers.
        dropout_percentage (float): Fraction of the input units to drop. This applies to
            *all* the dropout layers of the GofLayers.
        activation_function_gol (str or None): Activation function to use in the convolution
            layers of the GofLayers. If not specified, no activation is applied (i.e., uses the
            linear activation function). See `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_. This applies to
            *all* the convolution layers of the GofLayers.
        activation_function_dense (str or None): Activation function to use on the dense
            layer (i.e., the dense layer after the set of groups of layers). If not specified,
            no activation is applied (i.e., uses the linear activation function). See
            `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_.
        batch_size (int or None): Number of samples per batch of computation. If ``None``,
            ``batch_size`` will default to 32.
        epochs (int): Maximum number of epochs to train the model.
        patience (int): Number of epochs with no improvement after which training will be
            stopped.
        **kwargs: *Ignored*. Extra arguments that are used for compatibility’s sake.

   """

    def __init__(self, n_outputs, n_kernels, n_neurons_dense_layer=50,
                 optimizer='adam', cnn_dim=1, kernel_size=2, pool_size=2, strides_convolution=1,
                 strides_pooling=2, padding='valid', dropout_percentage=0.1,
                 activation_function_gol='relu', activation_function_dense='relu', batch_size=1000,
                 epochs=50, patience=5,
                 **kwargs):
        self.n_outputs = n_outputs
        self.n_kernels = n_kernels
        self.n_neurons_dense_layer = n_neurons_dense_layer
        self.optimizer = optimizer
        self.cnn_dim = cnn_dim
        self.kernel_size = kernel_size
        self.pool_size = pool_size
        self.strides_convolution = strides_convolution
        self.strides_pooling = strides_pooling
        self.padding = padding
        self.dropout_percentage = dropout_percentage
        self.activation_function_gol = activation_function_gol
        self.activation_function_dense = activation_function_dense
        self.batch_size = batch_size
        self.epochs = epochs
        self.patience = patience

        self.model = tf.keras.models.Sequential()

[docs]    def prepare(self, x, y):
        """

        Prepares the model by adding the layers to the estimator: input layer, GofLayers,
        flatten and dense layers.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (class labels in classification, real numbers in
            regression).
        """
        if self.cnn_dim == 1:
            input_shape = (x.shape[-1], 1)
        elif self.cnn_dim == 2:
            input_shape = (x.shape[-2], x.shape[-1], 1)
        elif self.cnn_dim == 3:
            input_shape = (x.shape[-3], x.shape[-2], x.shape[-1], 1)
        else:
            raise ValueError('`cnn_dim` parameter must be 1, 2 or 3.')
        self.model.add(tf.keras.layers.InputLayer(input_shape=input_shape))
        for n_kernel in self.n_kernels:
            self.add_gol(n_kernel, self.cnn_dim)
        self.model.add(tf.keras.layers.Flatten())
        self.model.add(tf.keras.layers.Dense(self.n_neurons_dense_layer,
                                             activation=self.activation_function_dense))

[docs]    def add_gol(self, n_kernel, cnn_dim):
        """

        Adds a GofLayer to the estimator.

        Args:
            n_kernel (int): Number of output filters.
            cnn_dim (int): Number of dimensions.

        Raises:
            ValueError: If ``cnn_dim`` is not valid.
        """
        if cnn_dim == 1:
            self.model.add(tf.keras.layers.Conv1D(n_kernel, kernel_size=self.kernel_size,
                                                  activation=self.activation_function_gol,
                                                  strides=self.strides_convolution))
            self.model.add(
                    tf.keras.layers.MaxPooling1D(pool_size=self.pool_size,
                                                 strides=self.strides_pooling,
                                                 padding=self.padding))
        elif cnn_dim == 2:
            self.model.add(tf.keras.layers.Conv2D(n_kernel, kernel_size=self.kernel_size,
                                                  activation=self.activation_function_gol,
                                                  strides=self.strides_convolution))
            self.model.add(
                    tf.keras.layers.MaxPooling2D(pool_size=self.pool_size,
                                                 strides=self.strides_pooling,
                                                 padding=self.padding))
        elif cnn_dim == 3:
            self.model.add(tf.keras.layers.Conv3D(n_kernel, kernel_size=self.kernel_size,
                                                  activation=self.activation_function_gol,
                                                  strides=self.strides_convolution))
            self.model.add(
                    tf.keras.layers.MaxPooling3D(pool_size=self.pool_size,
                                                 strides=self.strides_pooling,
                                                 padding=self.padding))
        else:
            raise ValueError('`cnn_dim` parameter must be 1, 2 or 3.')
        self.model.add(tf.keras.layers.Dropout(self.dropout_percentage))

[docs]    def aux_fit(self, x, y, callback, validation_size, atol=1e-04, rtol=1e-03, class_weights=None,
                imbalance_correction=None, shuffle=True, **kwargs):
        """
        Auxiliar function for classification and regression models compatibility.

        .. warning::
            This function is not meant to be called by itself. It is just an auxiliary function
            called by the child classes' ``fit`` function.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (class labels in classification, real numbers in
                regression).
            callback (object): Early stopping callback for halting the model's training.
            validation_size (float or int): Proportion of the training dataset that will be used
                the validation split.
            atol (float): Absolute tolerance used for early stopping based on the performance
                metric.
            rtol (float): Relative tolerance used for early stopping based on the performance
                metric.
            class_weights (None or dict): Dictionary mapping class indices (integers) to a weight
                (float) value, used for weighting the loss function (during training only). **Only
                used for classification problems. Ignored for regression.**
            imbalance_correction (None or bool): Whether to apply correction to class
                imbalances. **Only used for classification problems. Ignored for regression.**
            shuffle (bool): Whether to shuffle the data before splitting.
            **kwargs: Extra arguments used in the TensorFlow's model ``fit`` function. See `here
                <https://www.tensorflow.org/api_docs/python/tf/keras/Model#fit>`_.
        """

        x_train, x_validation, y_train, y_validation = train_test_split(x, y,
                                                                        test_size=validation_size,
                                                                        shuffle=shuffle)
        x_train = np.expand_dims(x_train, axis=-1)
        x_validation = np.expand_dims(x_validation, axis=-1)
        callbacks = [
                callback(self, self.patience, (x_validation, y_validation), imbalance_correction,
                         rtol, atol)]
        self.model.fit(x_train, y_train, batch_size=self.batch_size, epochs=self.epochs,
                       validation_data=(x_validation, y_validation), callbacks=callbacks,
                       class_weight=class_weights, **kwargs)

[docs]    @abc.abstractmethod
    def fit(self, x, y, **kwargs):
        """

        Fits the model to data matrix x and target(s) y.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (class labels in classification, real numbers in
                regression).
            **kwargs: Extra arguments explicitly used for regression or classification models.
        """
        raise NotImplementedError

[docs]    @abc.abstractmethod
    def compile(self):
        """

        Compiles the model for training.
        """
        raise NotImplementedError

[docs]    @abc.abstractmethod
    def score(self, x, y, **kwargs):
        """

        Computes the performance metric(s) (e.g., accuracy for classification) on the given input
        data and target values.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (class labels in classification, real numbers in
                regression).
            **kwargs: Extra arguments that are explicitly used for regression or classification
            models.
        """
        raise NotImplementedError

[docs]    @abc.abstractmethod
    def predict(self, x, **kwargs):
        """

        Predicts the target values using the input data in the trained model.

        Args:
            x (numpy.ndarray): Input data.
            **kwargs: Extra arguments that are used in the TensorFlow's model ``predict``
                function. See `here <https://www.tensorflow.org/api_docs/python/tf/keras/Model
                #predict>`_.
        """
        raise NotImplementedError

    @abc.abstractmethod
    def __dict__(self):
        """
        Prepares a dictonary with the parameters of the model.
        """
        raise NotImplementedError


[docs]class CNNClassification(BaseCNN):
    """Convolutional Neural Network (CNN) classifier.

    The model comprises an input layer, a set of groups of layers (GofLayers [Men20]_)—where
    each group is composed of one convolution layer, followed by one pooling layer and a
    dropout layer—, a dense layer, and an output layer. The output layer is a dense layer
    with ``n_outputs`` units, with the softmax activation function.

    .. note::
        The parameters used in this library were adapted from the exact parameters of the
        TensorFlow library. Descriptions were thus modified accordingly to our approach.
        However, refer to the TensorFlow documentation for more details about each of those
        parameters.

    Args:
        n_outputs (int): Number of class labels to predict.
        n_kernels (list): *i*-th element represents the number of output filters of the
            convolution layer in the *i*-th GofLayer.
        n_neurons_dense_layer (int): Number of neuron units in the dense layer (i.e.,
            the dense layer after the set of groups of layers).
        optimizer (str): Name of the optimizer. See `tensorflow.keras.optimizers
            <https://www.tensorflow.org/api_docs/python/tf/keras/optimizers>`_.
        metrics (list): List of metrics to be evaluated by the model during training and
            testing. Each item of the list can be a string (name of a TensorFlow's built-in
            function), function, or a `tf.keras.metrics.Metric
            <https://www.tensorflow.org/api_docs/python/tf/keras/metrics/Metric>`_ instance. If
            ``None``, ``metrics`` will default to ``['accuracy']``.
        cnn_dim (int): Number of dimensions applicable to *all* the convolution layers of the
            GofLayers.
        kernel_size (int or tuple): Integer or tuple/list of integers, specifying the length
            (for ``cnn_dim`` = 1), the height and width (for ``cnn_dim`` = 2), or  the depth,
            height and width (for ``cnn_dim`` = 3) of the convolution window. It can also be a
            single integer to specify the same value for all spatial dimensions. This applies to
            *all* the convolution layers of the GofLayers.
        pool_size (int or tuple): Size of the max-pooling window applicable to *all* the
            max-pooling layers of the GofLayers. For ``cnn_dim`` = 1, use a tuple with 1 integer;
            For ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions.
        strides_convolution (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the convolution. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the convolution layers of the GofLayers.
        strides_pooling (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the pooling. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the pooling layers of the GofLayers.
        padding (str): Available options are ``valid`` or ``same``. ``valid`` means no
            padding. ``same`` results in padding evenly to the left/right or up/down of the input
            such that output has the same height/width dimension as the input. This applies to
            *all* the pooling layers of the GofLayers.
        dropout_percentage (float): Fraction of the input units to drop. This applies to
            *all* the dropout layers of the GofLayers.
        activation_function_gol (str or None): Activation function to use in the convolution
            layers of the GofLayers. If not specified, no activation is applied (i.e., uses the
            linear activation function). See `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_. This applies to
            *all* the convolution layers of the GofLayers.
        activation_function_dense (str or None): Activation function to use on the dense
            layer (i.e., the dense layer after the set of groups of layers). If not specified,
            no activation is applied (i.e., uses the linear activation function). See
            `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_.
        batch_size (int or None): Number of samples per batch of computation. If ``None``,
            ``batch_size`` will default to 32.
        epochs (int): Maximum number of epochs to train the model.
        patience (int): Number of epochs with no improvement after which training will be
            stopped.
        **kwargs: *Ignored*. Extra arguments that are used for compatibility’s sake.

    Examples:
        .. code-block:: python
            :linenos:

            from tensorflow import keras

            from hosa.models.cnn import CNNClassification

            # 1 - Load and split the data
            fashion_mnist = keras.datasets.fashion_mnist
            (x_train, y_train), (X_test, y_test) = fashion_mnist.load_data()
            # 2 - Normalize the images, and reshape the images for cnn input
            x_train = x_train / 255.0
            X_test = X_test / 255.0
            x_train = x_train.reshape((-1, 28 * 28))
            X_test = X_test.reshape((-1, 28 * 28))
            # 3 - Create and fit the model
            clf = CNNClassification(10, 10, [4, 3])
            clf.prepare(x_train, y_train)
            clf.compile()
            clf.fit(x_train, y_train)
            # 4 - Calculate predictions
            clf.predict(X_test)
            # 5 - Compute the score
            score = clf.score(X_test, y_test)

    """

    def __init__(self, n_outputs, n_kernels, n_neurons_dense_layer=50,
                 optimizer='adam', metrics=None, cnn_dim=1, kernel_size=2, pool_size=2,
                 strides_convolution=1, strides_pooling=2, padding='valid', dropout_percentage=0.1,
                 activation_function_gol='relu', activation_function_dense='relu', batch_size=1000,
                 epochs=50, patience=5,
                 **kwargs):
        if metrics is None:
            metrics = ['accuracy']
        self.metrics, self.n_outputs, self.is_binary = metrics, n_outputs, None
        super().__init__(n_outputs, n_kernels, n_neurons_dense_layer, optimizer, cnn_dim,
                         kernel_size, pool_size, strides_convolution, strides_pooling, padding,
                         dropout_percentage, activation_function_gol, activation_function_dense,
                         batch_size, epochs, patience, **kwargs)

[docs]    def prepare(self, x, y):
        """

        Prepares the model by adding the layers to the estimator: input layer, GofLayers,
        flatten and dense layers.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., class labels).
        """
        super().prepare(x, y)
        self.model.add(tf.keras.layers.Dense(self.n_outputs, activation='softmax'))

[docs]    def fit(self, x, y, validation_size=0.33, shuffle=True, atol=1e-04, rtol=1e-03,
            class_weights=None, imbalance_correction=False, **kwargs):
        """

        Fits the model to data matrix x and target(s) y.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., class labels).
            validation_size (float or int): Proportion of the train dataset to include in the
                validation split.
            shuffle (bool): Whether to shuffle the data before splitting.
            atol (float): Absolute tolerance used for early stopping based on the performance
                metric.
            rtol (float): Relative tolerance used for early stopping based on the performance
                metric.
            class_weights (None or dict): Dictionary mapping class indices (integers) to a weight
                (float) value, used for weighting the loss function (during training only).
            imbalance_correction (bool): `True` if correction for imbalance should be applied to
                the metrics; `False` otherwise.
            **kwargs: Extra arguments that are used in the TensorFlow's model ``fit`` function.
                See `here <https://www.tensorflow.org/api_docs/python/tf/keras/Model#fit>`_.

        Returns:
            tensorflow.keras.Sequential: Returns a trained TensorFlow model.
        """
        callback = EarlyStoppingAtMinLoss
        super().aux_fit(x, y, callback, validation_size, atol=atol, rtol=rtol,
                        class_weights=class_weights, imbalance_correction=imbalance_correction,
                        shuffle=shuffle, **kwargs)
        return self.model

[docs]    def score(self, x, y, imbalance_correction=False, **kwargs):
        """

        Computes the performance metrics on the given input data and target values.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., class labels).
            imbalance_correction (bool): `True` if correction for imbalance should be applied to
                the metrics; `False` otherwise.
            **kwargs: *Ignored*. Only included here for compatibility’s sake.

        Returns:
            tuple: Returns a tuple containing the area under the ROC curve (AUC), accuracy,
                sensitivity, and sensitivity.

        .. note::
            This function can be used for both binary and multiclass classification.
        """
        y_probs, _ = self.predict(x)
        auc_value, accuracy, sensitivity, specificity = metrics_multiclass(y, y_probs,
                                                                           self.n_outputs,
                                                                           imbalance_correction=imbalance_correction)
        return auc_value, accuracy, sensitivity, specificity

[docs]    def predict(self, x, **kwargs):
        """

        Predicts the target values using the input data in the trained model.

        Args:
            x (numpy.ndarray): Input data.
            **kwargs: Extra arguments that are used in the TensorFlow's model ``predict``
                function. See `here <https://www.tensorflow.org/api_docs/python/tf/keras/Model
                #predict>`_.

        Returns:
            tuple: Returns a tuple containing the probability estimates and predicted classes.
        """

        x = np.expand_dims(x, axis=-1)
        y_probs = self.model.predict(x, **kwargs)
        y_pred_labels = np.argmax(y_probs, axis=1)
        return y_probs, y_pred_labels

[docs]    def compile(self):
        """

        Compiles the model for training.

        Returns:
            tensorflow.keras.Sequential: Returns an untrained but compiled TensorFlow model.
        """
        self.model.compile(loss='sparse_categorical_crossentropy', optimizer=self.optimizer,
                           metrics=self.metrics)
        return self.model

    def __dict__(self):
        """
        Prepares a dictonary with the parameters of the model.

        Returns:
            dict: Dictonary with the parameter names mapped to their values.
        """
        parameters = {'n_outputs':                 self.n_outputs,
                      'n_kernels':                 self.n_kernels,
                      'n_neurons_dense_layer':     self.n_neurons_dense_layer,
                      'optimizer':                 self.optimizer,
                      'metrics':                   self.metrics,
                      'cnn_dim':                   self.cnn_dim,
                      'kernel_size':               self.kernel_size,
                      'pool_size':                 self.pool_size,
                      'strides_convolution':       self.strides_convolution,
                      'strides_pooling':           self.strides_pooling,
                      'padding':                   self.padding,
                      'dropout_percentage':        self.dropout_percentage,
                      'activation_function_gol':   self.activation_function_gol,
                      'activation_function_dense': self.activation_function_dense,
                      'batch_size':                self.batch_size,
                      'epochs':                    self.epochs,
                      'patience':                  self.patience}
        return parameters


[docs]class CNNRegression(BaseCNN):
    """Convolutional Neural Network (CNN) regressor.

    The model comprises an input layer, a set of groups of layers (GofLayers [Men20]_)—where
    each group is composed of one convolution layer, followed by one pooling layer and a
    dropout layer—, a dense layer, and an output layer. The output layer is a dense layer
    with ``n_outputs`` units, with the linear activation function.

    .. note::
        The parameters used in this library were adapted from the exact parameters of the
        TensorFlow library. Descriptions were thus modified accordingly to our approach.
        However, refer to the TensorFlow documentation for more details about each of those
        parameters.

    Args:
        n_outputs (int): Number of numerical values to predict in regression.
        n_kernels (list): *i*-th element represents the number of output filters of the
            convolution layer in the *i*-th GofLayer.
        n_neurons_dense_layer (int): Number of neuron units in the dense layer (i.e.,
            the dense layer after the set of groups of layers).
        optimizer (str): Name of the optimizer. See `tensorflow.keras.optimizers
            <https://www.tensorflow.org/api_docs/python/tf/keras/optimizers>`_.
        metrics (list): List of metrics to be evaluated by the model during training and
            testing. Each item of the list can be a string (name of a TensorFlow's built-in
            function), function, or a `tf.keras.metrics.Metric
            <https://www.tensorflow.org/api_docs/python/tf/keras/metrics/Metric>`_ instance. If
            ``None``, ``metrics`` will default to ``['mean_squared_error']``.
        cnn_dim (int): Number of dimensions applicable to *all* the convolution layers of the
            GofLayers.
        kernel_size (int or tuple): Integer or tuple/list of integers, specifying the length
            (for ``cnn_dim`` = 1), the height and width (for ``cnn_dim`` = 2), or  the depth,
            height and width (for ``cnn_dim`` = 3) of the convolution window. It can also be a
            single integer to specify the same value for all spatial dimensions. This applies to
            *all* the convolution layers of the GofLayers.
        pool_size (int or tuple): Size of the max-pooling window applicable to *all* the
            max-pooling layers of the GofLayers. For ``cnn_dim`` = 1, use a tuple with 1 integer;
            For ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions.
        strides_convolution (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the convolution. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the convolution layers of the GofLayers.
        strides_pooling (int or tuple): Integer or tuple/list of integers, specifying the
            strides of the pooling. For ``cnn_dim`` = 1, use a tuple with 1 integer; For
            ``cnn_dim`` = 2, a tuple with 2 integers and for ``cnn_dim`` = 3, a tuple with 3
            integers. It can also be a single integer to specify the same value for all spatial
            dimensions. This applies to *all* the pooling layers of the GofLayers.
        padding (str): Available options are ``valid`` or ``same``. ``valid`` means no
            padding. ``same`` results in padding evenly to the left/right or up/down of the input
            such that output has the same height/width dimension as the input. This applies to
            *all* the pooling layers of the GofLayers.
        dropout_percentage (float): Fraction of the input units to drop. This applies to
            *all* the dropout layers of the GofLayers.
        activation_function_gol (str or None): Activation function to use in the convolution
            layers of the GofLayers. If not specified, no activation is applied (i.e., uses the
            linear activation function). See `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_. This applies to
            *all* the convolution layers of the GofLayers.
        activation_function_dense (str or None): Activation function to use on the dense
            layer (i.e., the dense layer after the set of groups of layers). If not specified,
            no activation is applied (i.e., uses the linear activation function). See
            `tensorflow.keras.activations
            <https://www.tensorflow.org/api_docs/python/tf/keras/activations>`_.
        batch_size (int or None): Number of samples per batch of computation. If ``None``,
            ``batch_size`` will default to 32.
        epochs (int): Maximum number of epochs to train the model.
        patience (int): Number of epochs with no improvement after which training will be
            stopped.
        **kwargs: *Ignored*. Extra arguments that are used for compatibility’s sake.

    Examples:
        .. code-block:: python
            :linenos:

            import pandas as pd

            from hosa.models.cnn import CNNRegression
            from hosa.aux import create_overlapping

            # 1 - Download, load, and split the data
            dataset = pd.read_csv(
            'https://raw.githubusercontent.com/jbrownlee/Datasets/master/airline-passengers
            .csv', header=0, index_col=0)
            x = dataset.Passengers.to_numpy().reshape((len(dataset), 1))
            y = dataset.Passengers.to_numpy()
            x_train, y_train = x[:100], y[:100]
            X_test, y_test = x[100:], y[100:]
            # 2 - Prepare the data for cnn input
            x_train, y_train = create_overlapping(x_train, y_train, CNNRegression, 'central', 4)
            X_test, y_test = create_overlapping(X_test, y_test, CNNRegression, 'central', 4)
            # 3 - Create and fit the model
            clf = CNNRegression(1, 50, [5], epochs=500, patience=500)
            clf.prepare(x_train, y_train)
            clf.compile()
            clf.fit(x_train, y_train)
            # 4 - Calculate predictions
            clf.predict(X_test)
            # 5 - Compute the score
            score = clf.score(X_test, y_test)

    """

    def __init__(self, n_outputs, n_kernels, n_neurons_dense_layer=50,
                 optimizer='adam', metrics=None, cnn_dim=1, kernel_size=2, pool_size=2,
                 strides_convolution=1, strides_pooling=2, padding='valid', dropout_percentage=0.1,
                 activation_function_gol='relu', activation_function_dense='relu', batch_size=1000,
                 epochs=50, patience=5,
                 **kwargs):
        if metrics is None:
            metrics = ['mean_squared_error']
        self.metrics, self.n_outputs = metrics, n_outputs
        super().__init__(n_outputs, n_kernels, n_neurons_dense_layer, optimizer, cnn_dim,
                         kernel_size, pool_size, strides_convolution, strides_pooling, padding,
                         dropout_percentage, activation_function_gol, activation_function_dense,
                         batch_size, epochs, patience, **kwargs)

[docs]    def prepare(self, x, y):
        """

        Prepares the model by adding the layers to the estimator: input layer, GofLayers,
        flatten and dense layers.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., real numbers).
        """
        super().prepare(x, y)
        self.model.add(tf.keras.layers.Dense(self.n_outputs, activation='linear'))

[docs]    def fit(self, x, y, validation_size=0.33, shuffle=True, atol=1e-04, rtol=1e-03, **kwargs):
        """

        Fits the model to data matrix x and target(s) y.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., real numbers).
            validation_size (float or int): Proportion of the train dataset to include in the
                validation split.
            shuffle (bool): Whether to shuffle the data before splitting.
            atol (float): Absolute tolerance used for early stopping based on the performance
                metric.
            rtol (float): Relative tolerance used for early stopping based on the performance
                metric.
            **kwargs: Extra arguments that are used in the TensorFlow's model ``fit`` function.
                See `here <https://www.tensorflow.org/api_docs/python/tf/keras/Model#fit>`_.

        Returns:
            tensorflow.keras.Sequential: Returns a trained TensorFlow model.
        """
        callback = EarlyStoppingAtMinLoss
        super().aux_fit(x, y, callback, validation_size, atol=atol, rtol=rtol, class_weights=None,
                        imbalance_correction=None, shuffle=shuffle, **kwargs)

[docs]    def score(self, x, y, **kwargs):
        """

        Computes the performance metrics on the given input data and target values.

        Args:
            x (numpy.ndarray): Input data.
            y (numpy.ndarray): Target values (i.e., real numbers).
            **kwargs: *Ignored*. Only included here for compatibility’s sake.

        Returns:
            tuple: Returns a tuple containing the mean squared error (MSE) and coefficient of
                determination (:math:`R^2`).

        """
        y_pred = self.predict(x)
        r2 = r2_score(y, y_pred)
        mse = mean_squared_error(y, y_pred)
        return mse, r2

[docs]    def predict(self, x, **kwargs):
        """

        Predicts the target values using the input data in the trained model.

        Args:
            x (numpy.ndarray): Input data.
            **kwargs: Extra arguments that are used in the TensorFlow's model ``predict``
                function. See `here <https://www.tensorflow.org/api_docs/python/tf/keras/Model
                #predict>`_.

        Returns:
            numpy.ndarray: Returns an array containing the estimates.
        """
        x = np.expand_dims(x, axis=-1)
        y_pred = self.model.predict(x, **kwargs)
        return y_pred

[docs]    def compile(self):
        """

        Compiles the model for training.

        Returns:
            tensorflow.keras.Sequential: Returns an untrained but compiled TensorFlow model.
        """
        self.model.compile(loss='mean_squared_error', optimizer=self.optimizer,
                           metrics=self.metrics)

    def __dict__(self):
        """
        Prepares a dictonary with the parameters of the model.

        Returns:
            dict: Dictonary with the parameter names mapped to their values.
        """
        parameters = {'n_outputs':                 self.n_outputs,
                      'n_kernels':                 self.n_kernels,
                      'n_neurons_dense_layer':     self.n_neurons_dense_layer,
                      'optimizer':                 self.optimizer,
                      'metrics':                   self.metrics,
                      'cnn_dim':                   self.cnn_dim,
                      'kernel_size':               self.kernel_size,
                      'pool_size':                 self.pool_size,
                      'strides_convolution':       self.strides_convolution,
                      'strides_pooling':           self.strides_pooling,
                      'padding':                   self.padding,
                      'dropout_percentage':        self.dropout_percentage,
                      'activation_function_gol':   self.activation_function_gol,
                      'activation_function_dense': self.activation_function_dense,
                      'batch_size':                self.batch_size,
                      'epochs':                    self.epochs,
                      'patience':                  self.patience}
        return parameters