projecto-final-turinmachin/html/neural__network_8h_source.html

#ifndef PROG3_NN_FINAL_PROJECT_V2025_01_NEURAL_NETWORK_H

#define PROG3_NN_FINAL_PROJECT_V2025_01_NEURAL_NETWORK_H


#include <algorithm>
#include <cstddef>
#include <cstdint>
#include <iostream>
#include <istream>
#include <memory>
#include <numeric>
#include <ostream>
#include <random>
#include <stdexcept>
#include <string>
#include <utility>
#include <vector>

#include "interfaces.h"
#include "optimizer.h"
#include "utec/nn/layer_registry.h"
#include "utec/utils/serialization.h"


namespace utec::neural_network {

    /// Version tag of the binary model format. NeuralNetwork::save writes it as
    /// the first byte of the stream and NeuralNetwork::load rejects any stream
    /// whose first byte differs from it.
    ///
    /// Declared `inline` so that every translation unit including this header
    /// shares a single definition instead of getting its own internal copy.
    inline constexpr std::uint8_t FORMAT_CURRENT_VERSION = 1;


    /**
     * @brief Sequential network: an ordered list of layers that can be trained
     *        with mini-batches, evaluated, and (de)serialized to a binary stream.
     *
     * @tparam T Scalar type of the tensors exchanged between layers. Its size in
     *           bytes is stored in the serialized header and verified on load.
     */
    template <typename T>
    class NeuralNetwork {
        /// Layers in the order in which the forward pass applies them.
        std::vector<std::unique_ptr<ILayer<T>>> layers;

        /// Upper bound on the number of layer slots load() pre-allocates. The
        /// layer count comes from the stream, so it is not trusted for sizing.
        static constexpr std::uint64_t MAX_RESERVED_LAYERS = 1024;

    public:
        /**
         * @brief Creates an empty network and calls register_all_layers<T>().
         *
         * NOTE(review): presumably the registration is what lets load() rebuild
         * layers by id through LayerRegistry — confirm in layer_registry.h.
         */
        NeuralNetwork() {
            register_all_layers<T>();
        }

        /**
         * @brief Constructs a layer of type L in place and appends it to the network.
         *
         * @tparam L    Concrete layer type; must be convertible to ILayer<T>.
         * @tparam Args Constructor argument types of L.
         * @param args  Arguments perfectly forwarded to L's constructor.
         */
        template <typename L, typename... Args>
        void add_layer(Args&&... args) {
            layers.emplace_back(std::make_unique<L>(std::forward<Args>(args)...));
        }

        /**
         * @brief Trains the network with shuffled mini-batches.
         *
         * For every epoch the sample order is reshuffled with @p rng; each batch is
         * run forward through all layers, the gradient of the loss is obtained from
         * LossType, and the layers are traversed in reverse order calling
         * backward() followed by update_params() on each one.
         *
         * Prints "Epoch <n>" to std::cout every 100 epochs (starting at epoch 0).
         *
         * @tparam LossType      Loss template; constructed from (prediction, target)
         *                       and queried through loss_gradient().
         * @tparam OptimizerType Optimizer template; constructed from the learning rate.
         * @param x             Input samples, one per row.
         * @param y             Targets; row i is paired with row i of @p x.
         * @param epochs        Number of passes over the data.
         * @param batch_size    Maximum number of samples per batch; must be > 0.
         * @param learning_rate Value handed to the optimizer's constructor.
         * @param rng           Random engine used to shuffle the sample order.
         * @throws std::invalid_argument if @p batch_size is zero.
         */
        template <template <typename...> class LossType,
                  template <typename...> class OptimizerType = SGD>
        void train(const algebra::Tensor<T, 2>& x,
                   const algebra::Tensor<T, 2>& y,
                   const size_t epochs,
                   const size_t batch_size,
                   T learning_rate,
                   std::mt19937& rng) {
            // A zero batch size would never advance batch_start below, so the
            // batch loop would spin forever.
            if (batch_size == 0) {
                throw std::invalid_argument("batch_size must be greater than zero");
            }

            OptimizerType<T> optimizer(learning_rate);

            const size_t num_samples = x.shape()[0];
            const size_t num_inputs = x.shape()[1];
            const size_t num_outputs = y.shape()[1];

            // Sample indices 0..num_samples-1; shuffled at the start of each epoch.
            // Seeding with a size_t keeps the counter type equal to the element type.
            std::vector<size_t> indices(num_samples);
            std::ranges::iota(indices, std::size_t{0});

            for (size_t epoch = 0; epoch < epochs; ++epoch) {
                if (epoch % 100 == 0) {
                    std::cout << "Epoch " << epoch << '\n';
                }

                std::ranges::shuffle(indices, rng);

                for (size_t batch_start = 0; batch_start < num_samples; batch_start += batch_size) {
                    // The last batch of an epoch may be shorter than batch_size.
                    const size_t current_batch_size =
                        std::min(batch_size, num_samples - batch_start);

                    algebra::Tensor<T, 2> batch_x(current_batch_size, num_inputs);
                    algebra::Tensor<T, 2> batch_y(current_batch_size, num_outputs);

                    // Gather the shuffled rows of this batch.
                    for (size_t i = 0; i < current_batch_size; ++i) {
                        const size_t sample = indices[batch_start + i];
                        batch_x.set_row(i, x.row(sample));
                        batch_y.set_row(i, y.row(sample));
                    }

                    // Forward pass.
                    algebra::Tensor<T, 2> output = batch_x;
                    for (auto& layer : layers) {
                        output = layer->forward(output);
                    }

                    LossType<T> loss_function(output, batch_y);
                    algebra::Tensor<T, 2> grad = loss_function.loss_gradient();

                    // Backward pass: last layer first, updating each layer right
                    // after its gradient has been propagated.
                    for (auto layer = layers.rbegin(); layer != layers.rend(); ++layer) {
                        grad = (*layer)->backward(grad);
                        (*layer)->update_params(optimizer);
                    }
                }
            }
        }

        /**
         * @brief Runs @p X through every layer in order and returns the result.
         *
         * @param X Input samples.
         * @return Output of the last layer (a copy of @p X if there are no layers).
         */
        auto predict(const algebra::Tensor<T, 2>& X) -> algebra::Tensor<T, 2> {
            algebra::Tensor<T, 2> output = X;
            for (auto& layer : layers) {
                output = layer->forward(output);
            }
            return output;
        }

        /**
         * @brief Serializes the network to @p out.
         *
         * Layout: one byte with FORMAT_CURRENT_VERSION, one byte with sizeof(T),
         * the layer count as a 64-bit unsigned integer (via
         * serialization::write_numeric), then for each layer one byte with its id
         * followed by whatever the layer's own save() writes.
         *
         * @param out Destination stream.
         */
        void save(std::ostream& out) const {
            out.put(FORMAT_CURRENT_VERSION);
            out.put(static_cast<std::uint8_t>(sizeof(T)));

            serialization::write_numeric(out, static_cast<std::uint64_t>(layers.size()));

            for (const auto& layer : layers) {
                out.put(static_cast<std::uint8_t>(layer->id()));
                layer->save(out);
            }
        }

        /**
         * @brief Reconstructs a network from a stream produced by save().
         *
         * @param in Source stream positioned at the version byte.
         * @return The deserialized network.
         * @throws std::runtime_error if the version byte differs from
         *         FORMAT_CURRENT_VERSION, if the stored element size differs from
         *         sizeof(T), or if the stream ends before a layer id can be read.
         */
        static auto load(std::istream& in) -> NeuralNetwork<T> {
            const int version = in.get();
            if (version != FORMAT_CURRENT_VERSION) {
                throw std::runtime_error("Invalid file format version: " + std::to_string(version));
            }

            // get() yields a negative value at end of stream; treat it as a mismatch.
            const int t_size = in.get();
            if (t_size < 0 || static_cast<std::size_t>(t_size) != sizeof(T)) {
                throw std::runtime_error(
                    "Stored data size does not match this platform's data size.");
            }

            const auto layers_size = serialization::read_numeric<std::uint64_t>(in);

            NeuralNetwork<T> net;
            // Cap the up-front allocation: a corrupt header must not be able to
            // request an arbitrarily large buffer. The vector still grows as needed.
            net.layers.reserve(static_cast<std::size_t>(
                std::min<std::uint64_t>(layers_size, MAX_RESERVED_LAYERS)));

            for (std::uint64_t i = 0; i < layers_size; ++i) {
                const int id_raw = in.get();
                if (id_raw == std::istream::traits_type::eof()) {
                    throw std::runtime_error("Unexpected end of stream while reading layer id.");
                }

                const auto id = static_cast<LayerId>(id_raw);
                net.layers.push_back(LayerRegistry<T>::create(id, in));
            }

            return net;
        }
    };


}  // namespace utec::neural_network


#endif

x
return p * x
Definition catch_amalgamated.cpp:321

NeuralNetwork::NeuralNetwork
NeuralNetwork()
Constructor por defecto.
Definition neural_network.h:28

utec::algebra::Tensor
Representa un tensor de tipo T y rango Rank.
Definition tensor.h:63

utec::algebra::Tensor::shape
auto shape() const noexcept -> const std::array< size_t, Rank > &
Definition tensor.h:179

utec::algebra::Tensor::row
auto row(const size_t index) const -> Tensor< T, 2 > requires(Rank==2)
Genera tensor con fila particular.
Definition tensor.h:223

utec::algebra::Tensor::set_row
void set_row(const size_t index, const Tensor< T, 2 > &row_tensor)
Cambia fila específica de un tensor.
Definition tensor.h:243

utec::neural_network::LayerRegistry::create
static auto create(LayerId id, std::istream &in) -> std::unique_ptr< ILayer< T > >
Crea una instancia de una capa registrada a partir de su ID. Busca la función asociada al ID proporci...
Definition layer_registry.h:46

utec::neural_network::NeuralNetwork::save
void save(std::ostream &out) const
Guarda el modelo en un flujo de salida binario.
Definition neural_network.h:131

utec::neural_network::NeuralNetwork::NeuralNetwork
NeuralNetwork()
Constructor por defecto.
Definition neural_network.h:28

utec::neural_network::NeuralNetwork::load
static auto load(std::istream &in) -> NeuralNetwork< T >
Carga una red neuronal desde un flujo de entrada binario.
Definition neural_network.h:150

utec::neural_network::NeuralNetwork::add_layer
void add_layer(Args &&... args)
Agrega una nueva capa a la red.
Definition neural_network.h:40

utec::neural_network::NeuralNetwork::predict
auto predict(const algebra::Tensor< T, 2 > &X) -> algebra::Tensor< T, 2 >
Realiza una predicción sobre un conjunto de datos.
Definition neural_network.h:118

utec::neural_network::NeuralNetwork::train
void train(const algebra::Tensor< T, 2 > &x, const algebra::Tensor< T, 2 > &y, const size_t epochs, const size_t batch_size, T learning_rate, std::mt19937 &rng)
Entrena la red neuronal usando descenso por lotes.
Definition neural_network.h:66

utec::neural_network::SGD
Optimizador Stochastic Gradient Descent (SGD). Actualiza los parámetros en dirección opuesta al gradi...
Definition optimizer.h:14

layer_registry.h

serialization::read_numeric
auto read_numeric(std::istream &in) -> T
Definition serialization.h:17

serialization::write_numeric
void write_numeric(std::ostream &out, const T n)
Definition serialization.h:9

utec::neural_network
Capa de activación de Rectified Linear Unit (ReLU). Los valores negativos del input se convierten en ...
Definition activation.h:14

utec::neural_network::LayerId
LayerId
Identificador para los diferentes tipos de capas en la red neuronal. Se emplea uint8_t (unsigned 8-bi...
Definition interfaces.h:11

utec::neural_network::FORMAT_CURRENT_VERSION
constexpr std::uint8_t FORMAT_CURRENT_VERSION
Versión actual del formato .pp20 (Profe Pónganos 20).
Definition neural_network.h:15

utec::neural_network::register_all_layers
void register_all_layers()
Registra todas las capas disponibles en el sistema. Llamado al inicio del programa para asegurar que ...
Definition layer_registry.h:75

optimizer.h

serialization.h

interfaces.h