# Source code for model.scffnn

# -*- coding: utf-8 -*-
"""**RosenPy: An Open Source Python Framework for Complex-Valued Neural Networks**.
*Copyright © A. A. Cruz, K. S. Mayer, D. S. Arantes*.

*License*

This file is part of RosenPy.
RosenPy is an open source framework distributed under the terms of the GNU General 
Public License, as published by the Free Software Foundation, either version 3 of 
the License, or (at your option) any later version. For additional information on 
license terms, please open the Readme.md file.

RosenPy is distributed in the hope that it will be useful to every user, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. 
See the GNU General Public License for more details. 

You should have received a copy of the GNU General Public License
along with RosenPy. If not, see <http://www.gnu.org/licenses/>.
"""
from rosenpy.utils import reg_func, init_func, act_func, decay_func
from .rp_layer import Layer
from .rp_nn import NeuralNetwork

class SCFFNN(NeuralNetwork):
    """
    The Split Complex FeedForward Neural Network (SCFFNN) class.

    A split-complex network applies each layer's activation function
    separately to the real and to the imaginary part of the layer's linear
    response and recombines both results into one complex output.

    The class offers three public operations: `feedforward`, `backprop` and
    `add_layer`. The first two dispatch to a GPU or a CPU implementation
    according to `self.gpu_enable`; every array operation goes through the
    array module stored in `self.xp`.

    This class inherits from the base `NeuralNetwork` class.
    """

    def feedforward(self, input_data):
        """
        Executes the feedforward operation on the neural network.

        Parameters:
        -----------
        input_data : array-like
            Input data to be processed by the neural network.

        Returns:
        --------
        array-like
            The output of the neural network after performing feedforward.
        """
        if self.gpu_enable:
            return self._feedforward_gpu(input_data)
        return self._feedforward_cpu(input_data)

    def _feedforward_gpu(self, x):
        """
        Executes the feedforward operation on the GPU code path.

        Each layer stores its input (`input`), its linear response
        (`activ_in`) and its activated output (`activ_out`) as attributes, so
        that a later `backprop` call can reuse them.

        Parameters:
        -----------
        x : array-like
            Input data fed to the first layer.

        Returns:
        --------
        array-like
            The output of the final layer after feedforward on the GPU.
        """
        xp = self.xp
        layers = self.layers
        layers[0].input = x

        for i, layer in enumerate(layers):
            layer.activ_in = xp.dot(layer.input, layer.weights) + layer.biases
            # Split-complex activation: the activation is evaluated on the real
            # and on the imaginary part independently. Both calls must receive
            # the array module as first argument.
            layer.activ_out = (layer.activation(xp, xp.real(layer.activ_in), 0) +
                               1.0j * layer.activation(xp, xp.imag(layer.activ_in), 0))

            # Chain the output of this layer into the next one, if any.
            if i < len(layers) - 1:
                layers[i + 1].input = layer.activ_out

        return layers[-1].activ_out

    def _feedforward_cpu(self, x):
        """
        Executes the feedforward operation on the CPU code path.

        Each layer stores its input (`input`), its linear response
        (`activ_in`) and its activated output (`activ_out`) as attributes, so
        that a later `backprop` call can reuse them.

        Parameters:
        -----------
        x : array-like
            Input data fed to the first layer.

        Returns:
        --------
        array-like
            The output of the final layer after feedforward on the CPU.
        """
        xp = self.xp
        layers = self.layers
        layers[0].input = x

        for i, layer in enumerate(layers):
            # Every layer but the first consumes the previous layer's output.
            if i > 0:
                layer.input = layers[i - 1].activ_out
            layer.activ_in = xp.dot(layer.input, layer.weights) + layer.biases
            layer.activ_out = act_func.split_complex(xp, layer.activ_in, layer.activation, derivative=False)

        return layers[-1].activ_out

    def backprop(self, y, y_pred, epoch):
        """
        Executes the backpropagation operation on the neural network.

        Parameters:
        -----------
        y : array-like
            True labels or target values.
        y_pred : array-like
            Predicted values from the neural network.
        epoch : int
            The current epoch number during training.
        """
        if self.gpu_enable:
            return self._backprop_gpu(y, y_pred, epoch)
        return self._backprop_cpu(y, y_pred, epoch)

    def _backprop_gpu(self, y, y_pred, epoch):
        """
        Executes the backpropagation operation on the GPU code path.

        Walks the layers from last to first, propagates the error `y - y_pred`
        backwards and lets `self.optimizer` update the weights, the biases and
        the optimizer state (`mt`, `vt`, `ut`) of every layer. Relies on the
        `input` and `activ_in` attributes stored by the feedforward pass.

        Parameters:
        -----------
        y : array-like
            True labels or target values.
        y_pred : array-like
            Predicted values from the neural network.
        epoch : int
            The current epoch number during training.
        """
        xp = self.xp
        e = y - y_pred
        delta_dir, aux_w = None, 0

        for layer in reversed(self.layers):
            # Split-complex derivative: evaluated on the real and on the
            # imaginary part independently. Both calls must receive the array
            # module as first argument.
            deriv = (layer.activation(xp, xp.real(layer.activ_in), 1) +
                     1.0j * layer.activation(xp, xp.imag(layer.activ_in), 1))

            if delta_dir is not None:
                # Hidden layer: pull the delta of the following layer back
                # through that layer's (pre-update) weights.
                delta_dir = xp.multiply(xp.dot(delta_dir, xp.conj(aux_w.T)), xp.conj(deriv))
            else:
                # Output layer: the delta comes straight from the error.
                delta_dir = xp.multiply(xp.conj(deriv), e)

            # Keep the weights as they are before this layer is updated; the
            # next iteration (previous layer) needs them.
            aux_w = layer.weights
            reg_l2 = reg_func.l2_regularization(xp, layer.lambda_init, layer.reg_strength, epoch)
            # The regularization term only applies when reg_strength is non-zero.
            penalty = reg_l2 if layer.reg_strength else 0
            grad_w = xp.dot(xp.conj(layer.input.T), delta_dir) - penalty * layer.weights
            grad_b = xp.mean(delta_dir, axis=0) - penalty * layer.biases

            layer.weights, layer.biases, layer.mt, layer.vt, layer.ut = self.optimizer.update_parameters(
                [layer.weights, layer.biases],
                [grad_w, grad_b],
                layer.learning_rates,
                epoch, layer.mt, layer.vt, layer.ut
            )

    def _backprop_cpu(self, y, y_pred, epoch):
        """
        Executes the backpropagation operation on the CPU code path.

        Walks the layers from last to first, propagates the error `y - y_pred`
        backwards and lets `self.optimizer` update the weights, the biases and
        the optimizer state (`mt`, `vt`, `ut`) of every layer. Relies on the
        `input` and `activ_in` attributes stored by the feedforward pass.

        Parameters:
        -----------
        y : array-like
            True labels or target values.
        y_pred : array-like
            Predicted values from the neural network.
        epoch : int
            The current epoch number during training.
        """
        xp = self.xp
        e = y - y_pred
        delta_dir, aux_w = None, 0

        for layer in reversed(self.layers):
            deriv = act_func.split_complex(xp, layer.activ_in, layer.activation, derivative=True)

            if delta_dir is not None:
                # Hidden layer: pull the delta of the following layer back
                # through that layer's (pre-update) weights.
                delta_dir = xp.multiply(xp.conjugate(deriv), xp.dot(delta_dir, xp.conjugate(aux_w.T)))
            else:
                # Output layer: the delta comes straight from the error.
                delta_dir = xp.multiply(xp.conj(deriv), e)

            # Keep the weights as they are before this layer is updated; the
            # next iteration (previous layer) needs them.
            aux_w = layer.weights
            reg_l2 = reg_func.l2_regularization(xp, layer.lambda_init, layer.reg_strength, epoch)
            # The regularization term only applies when reg_strength is non-zero.
            penalty = reg_l2 if layer.reg_strength else 0
            grad_w = xp.dot(xp.conj(layer.input.T), delta_dir) - penalty * layer.weights
            # Average over the first axis with the array module (same form as
            # the GPU path) instead of a Python-level sum over rows.
            grad_b = xp.mean(delta_dir, axis=0) - penalty * layer.biases

            layer.weights, layer.biases, layer.mt, layer.vt, layer.ut = self.optimizer.update_parameters(
                [layer.weights, layer.biases],
                [grad_w, grad_b],
                layer.learning_rates,
                epoch, layer.mt, layer.vt, layer.ut
            )

    def add_layer(self, neurons, ishape=0, weights_initializer=init_func.random_normal, bias_initializer=init_func.random_normal,
                  activation=act_func.tanh, weights_rate=0.001, biases_rate=0.001,
                  reg_strength=0.0, lambda_init=0.1, lr_decay_method=decay_func.none_decay,
                  lr_decay_rate=0.0, lr_decay_steps=1, module=None):
        """
        Adds a new layer to the split-complex neural network.

        The input size of the new layer is `ishape` for the first layer and
        the neuron count of the previously added layer otherwise, so `ishape`
        is only used when the network has no layers yet.

        Parameters:
        -----------
        neurons : int
            The number of neurons in the new layer.
        ishape : int, optional
            The input shape for the layer. Only used for the first layer.
            Defaults to 0.
        weights_initializer : function, optional
            Function used to initialize the weights. Defaults to `random_normal`.
        bias_initializer : function, optional
            Function used to initialize the biases. Defaults to `random_normal`.
        activation : function, optional
            Activation function for the layer. Defaults to `tanh`.
        weights_rate : float, optional
            Learning rate for the weights. Defaults to 0.001.
        biases_rate : float, optional
            Learning rate for the biases. Defaults to 0.001.
        reg_strength : float, optional
            Strength of L2 regularization. Defaults to 0.0.
        lambda_init : float, optional
            Initial lambda value for regularization. Defaults to 0.1.
        lr_decay_method : function, optional
            Method for decaying the learning rate. Defaults to `none_decay`.
        lr_decay_rate : float, optional
            Rate at which learning rate decays. Defaults to 0.0.
        lr_decay_steps : int, optional
            Number of steps after which the learning rate decays. Defaults to 1.
        module : object, optional
            Accepted for interface compatibility but not forwarded: the layer
            is always created with the network's own array module `self.xp`.
            Defaults to None.
        """
        # Chain the new layer onto the previous one when there is one.
        input_size = ishape if not self.layers else self.layers[-1].neurons

        self.layers.append(Layer(
            input_size,
            neurons,
            weights_initializer=weights_initializer,
            bias_initializer=bias_initializer,
            weights_rate=weights_rate,
            biases_rate=biases_rate,
            activation=activation,
            reg_strength=reg_strength,
            lambda_init=lambda_init,
            cvnn=1,
            lr_decay_method=lr_decay_method,
            lr_decay_rate=lr_decay_rate,
            lr_decay_steps=lr_decay_steps,
            module=self.xp
        ))