Source code for model.rp_nn

# -*- coding: utf-8 -*-
"""
RosenPy: An Open Source Python Framework for Complex-Valued Neural Networks.
Copyright © A. A. Cruz, K. S. Mayer, D. S. Arantes.

License:
This file is part of RosenPy.
RosenPy is an open source framework distributed under the terms of the GNU 
General Public License, as published by the Free Software Foundation, either 
version 3 of the License, or (at your option) any later version. For additional 
information on license terms, please open the Readme.md file.

RosenPy is distributed in the hope that it will be useful to every user, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more 
details.

You should have received a copy of the GNU General Public License along with 
RosenPy. If not, see <http://www.gnu.org/licenses/>.
"""

from rosenpy.utils import cost_func, decay_func, batch_gen_func, select_module
from .rp_layer import Layer
from . import rp_optimizer as opt

[docs]class NeuralNetwork: """ Abstract base class for wrapping all neural network functionality from RosenPy. This is a superclass. """ def __init__(self, cost_func=cost_func.mse, patience=float('inf'), gpu_enable=False): """ Initializes the neural network with default parameters. Parameters: ----------- cost_func : function, optional The cost function to be used for training the neural network. Default is mean squared error (MSE). patience : int, optional The patience parameter for early stopping during training. Default is a large value to avoid early stopping. gpu_enable : bool, optional Flag indicating whether GPU acceleration is enabled. Default is False. """ self.xp = select_module(gpu_enable) self.gpu_enable = gpu_enable self.layers = [] self.cost_func = cost_func self.optimizer = None self.patience, self.waiting = patience, 0 self._best_model, self._best_loss = self.layers, self.xp.inf self._history = {'epochs': [], 'loss': [], 'loss_val': []}
[docs] def fit(self, x_train, y_train, x_val=None, y_val=None, epochs=100, verbose=10, batch_gen=batch_gen_func.batch_sequential, batch_size=1, optimizer=opt.GradientDescent(beta=100, beta1=0.9, beta2=0.999)): """ Trains the neural network on the provided training data. Parameters: ----------- x_train : array-like The input training data. y_train : array-like The target training data. x_val : array-like, optional The input validation data. Default is None. y_val : array-like, optional The target validation data. Default is None. epochs : int, optional The number of training epochs. Default is 100. verbose : int, optional Controls the verbosity of the training process. Default is 10. batch_gen : function, optional The batch generation function to use during training. Default is batch_gen_func.batch_sequential. batch_size : int, optional The batch size to use during training. Default is 1. optimizer : Optimizer, optional The optimizer to use during training. Default is GradientDescent with specified parameters. """ self.verify_input(x_train) self.optimizer = optimizer self.optimizer.set_module(self.xp) x_train, y_train = self.convert_data(x_train), self.convert_data(y_train) self.mean_in = self.xp.mean(x_train) self.mean_out = self.xp.mean(y_train) self.std_in = self.xp.std(x_train) self.std_out = self.xp.std(y_train) x_val, y_val = (x_train, y_train) if (x_val is None or y_val is None) else ( self.convert_data(x_val), self.convert_data(y_val)) x_train = self.normalize_data(x_train, self.mean_in, self.std_in) y_train = self.normalize_data(y_train, self.mean_out, self.std_out) x_val = self.normalize_data(x_val, self.mean_in, self.std_in) y_val = self.normalize_data(y_val, self.mean_out, self.std_out) for epoch in range(1, epochs + 1): x_batch, y_batch = batch_gen(self.xp, x_train, y_train, batch_size) self.update_learning_rate(epoch) for x_batch1, y_batch1 in zip(x_batch, y_batch): y_pred = self.feedforward(x_batch1) self.backprop(y_batch1, y_pred, epoch) loss_val = self.cost_func(self.xp, y_val, self.predict(x_val, status=0)) if self.patience != float('inf'): if loss_val < self._best_loss: self._best_model, self._best_loss = self.layers, loss_val self.waiting = 0 else: self.waiting += 1 print(f"Not improving: [{self.waiting}] current loss val: " f"{loss_val} best: {self._best_loss}") if self.waiting >= self.patience: self.layers = self._best_model print(f"Early stopping at epoch {epoch}") return if epoch % verbose == 0: loss_train = self.cost_func(self.xp, y_train, self.predict(x_train, status=0)) self._history['epochs'].append(epoch) self._history['loss'].append(loss_train) self._history['loss_val'].append(loss_val) print(f"Epoch: {epoch:4}/{epochs} loss_train: {loss_train:.8f} " f"loss_val: {loss_val:.8f}") return self._history
[docs] def predict(self, x, status=1): """ Predicts the output for the given input data. Parameters: ----------- x : array-like The input data for prediction. Returns: -------- array-like The predicted output for the input data. """ if status: input_data = self.normalize_data(self.convert_data(x), self.mean_in, self.std_in) output = self.feedforward(input_data) return self.denormalize_outputs(output, self.mean_out, self.std_out) else: return self.feedforward(self.convert_data(x))
[docs] def accuracy(self, y, y_pred): """ Computes the accuracy of the predictions. Parameters: ----------- y : array-like The true labels or target values. y_pred : array-like The predicted values. Returns: -------- float The accuracy of the predictions as a percentage. """ if isinstance(y, type(y_pred)) and isinstance(y_pred, type(y)): return 100 * (1 - self.xp.mean(self.xp.abs(y - y_pred))) else: print("Datas have different types.") return 0
[docs] def add_layer(self): pass
[docs] def update_learning_rate(self, epoch): """ Updates the learning rates of all layers based on the current epoch. Parameters: ----------- epoch : int The current epoch number. """ for layer in self.layers: for i in range(len(layer.learning_rates)): layer.learning_rates[i] = layer.lr_decay_method( layer.learning_rates[i], epoch, layer.lr_decay_rate, layer.lr_decay_steps)
def _get_optimizer(self, optimizer_class): """ Creates an instance of the specified optimizer class. Parameters: ----------- optimizer_class : class The class of the optimizer to be instantiated. Returns: -------- instance An instance of the specified optimizer class. """ return optimizer_class()
[docs] def verify_input(self, data): """ Verifies the input data type for optimal performance of the RosenPY framework. Parameters: ----------- data : array-like The input data. """ if not isinstance(data, self.xp.ndarray): print("For optimal performance of the RosenPY framework, when not " "using GPU, input the data in NUMPY format, and when utilizing " "GPU, input the data in CUPY format.\n\n")
[docs] def convert_data(self, data): """ Converts the input data to the appropriate format for the current backend (NUMPY or CUPY). Parameters: ----------- data : array-like The input data. Returns: -------- array-like The converted input data. """ if isinstance(data, self.xp.ndarray): return data if self.xp.__name__ == "cupy": return self.xp.asarray(data) if self.xp.__name__ == "numpy": return data.get() raise ValueError("Unsupported data type")
[docs] def get_history(self): """ Returns the training history of the neural network. Returns: -------- dict A dictionary containing the training history. """ return self._history
[docs] def normalize_data(self, input_data, mean=0, std_dev=0): """ Normalizes the input data based on the provided mean and standard deviation. Parameters: ----------- input_data : array-like The data to be normalized. mean : float, optional The mean for normalization. Default is 0. std_dev : float, optional The standard deviation for normalization. Default is 0. Returns: -------- array-like The normalized data. """ return input_data
[docs] def denormalize_outputs(self, normalized_output_data, mean=0, std_dev=0): """ Denormalizes the output data based on the provided mean and standard deviation. Parameters: ----------- normalized_output_data : array-like The data to be denormalized. mean : float, optional The mean used for normalization. Default is 0. std_dev : float, optional The standard deviation used for normalization. Default is 0. Returns: -------- array-like The denormalized data. """ return normalized_output_data