cuda-networks-docs/neural__network_8h_source.html

 /**

  * @file neural_network.h

  * @brief Defines the NeuralNetwork class for a simple feedforward neural network.

  */


 #ifndef NEURAL_NETWORK_H

 #define NEURAL_NETWORK_H


 #include <utility>

 #include "../linear_algebra/matrix.h"
 #include "../linear_algebra/vector.h"


 /**

  * @class NeuralNetwork

  * @brief Represents a simple feedforward neural network with one hidden layer.

  */

 class NeuralNetwork {
 public:
     /**
      * @brief Construct a new NeuralNetwork object.
      * @param input_size Number of input features
      * @param hidden_size Number of neurons in the hidden layer
      * @param output_size Number of output classes
      */
     NeuralNetwork(int input_size, int hidden_size, int output_size);

     /**
      * @brief Destroy the NeuralNetwork object.
      */
     ~NeuralNetwork();

     /**
      * @brief Initialize the neural network parameters.
      */
     void initialize();

     /**
      * @brief Perform forward propagation through the network.
      * @param X Input data matrix
      */
     void forward(const Matrix& X);

     /**
      * @brief Perform backward propagation through the network.
      * @param X Input data matrix
      * @param Y True labels matrix
      */
     void backward(const Matrix& X, const Matrix& Y);

     /**
      * @brief Update the network parameters based on computed gradients.
      * @param learning_rate The learning rate for the parameter update.
      */
     void update_params(double learning_rate);

     /**
      * @brief Get predictions from the output layer (A2).
      * @return Vector containing the predicted class indices
      */
     Vector get_predictions() const;

     /**
      * @brief Calculate the accuracy of predictions compared to true labels.
      * @param Y True labels matrix
      * @return Accuracy as a fraction of correct predictions
      */
     double get_accuracy(const Matrix& Y) const;

     /**
      * @brief Perform gradient descent to train the neural network.
      * @param X Input data matrix
      * @param Y True labels matrix
      * @param learning_rate Learning rate for parameter updates
      * @param epochs Number of training epochs
      */
     void gradient_descent(const Matrix& X, const Matrix& Y, double learning_rate, int epochs);

     // ---------------------------------------------------------------------
     // Parameter accessors.
     //
     // The *_data() getters forward to Matrix::get_data() / Vector::get_data()
     // and hand back the raw pointer unchanged. The pointers are documented as
     // device pointers, so they must not be dereferenced in host code.
     // NOTE(review): ownership presumably stays with the member object -
     // confirm callers never free these pointers.
     // ---------------------------------------------------------------------

     /**
      * @brief Get the pointer to the W1 matrix data.
      * @return Pointer to the W1 matrix data on the device
      */
     double* get_W1_data() const { return W1.get_data(); }

     /**
      * @brief Get the pointer to the W2 matrix data.
      * @return Pointer to the W2 matrix data on the device
      */
     double* get_W2_data() const { return W2.get_data(); }

     /**
      * @brief Get the pointer to the b1 vector data.
      * @return Pointer to the b1 vector data on the device
      */
     double* get_b1_data() const { return b1.get_data(); }

     /**
      * @brief Get the pointer to the b2 vector data.
      * @return Pointer to the b2 vector data on the device
      */
     double* get_b2_data() const { return b2.get_data(); }

     /**
      * @brief Get the dimensions of the W1 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of W1
      */
     std::pair<int, int> get_W1_dimensions() const { return {W1.get_rows(), W1.get_cols()}; }

     /**
      * @brief Get the dimensions of the W2 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of W2
      */
     std::pair<int, int> get_W2_dimensions() const { return {W2.get_rows(), W2.get_cols()}; }

     /**
      * @brief Get the size of the b1 vector.
      * @return Number of elements in b1, as reported by Vector::get_rows()
      */
     int get_b1_size() const { return b1.get_rows(); }

     /**
      * @brief Get the size of the b2 vector.
      * @return Number of elements in b2, as reported by Vector::get_rows()
      */
     int get_b2_size() const { return b2.get_rows(); }

     // ---------------------------------------------------------------------
     // Gradient accessors.
     // ---------------------------------------------------------------------

     /**
      * @brief Get the DW1 matrix.
      * @return The DW1 matrix, returned by value (a copy of the member)
      */
     Matrix get_DW1() const { return DW1; }

     /**
      * @brief Get the db1 scalar.
      * @return The db1 scalar; 0.0 until a gradient value has been assigned
      */
     double get_db1() const { return db1; }

     /**
      * @brief Get the DW2 matrix.
      * @return The DW2 matrix, returned by value (a copy of the member)
      */
     Matrix get_DW2() const { return DW2; }

     /**
      * @brief Get the db2 scalar.
      * @return The db2 scalar; 0.0 until a gradient value has been assigned
      */
     double get_db2() const { return db2; }

     // ---------------------------------------------------------------------
     // Activation / pre-activation accessors (same device-pointer caveat as
     // the parameter accessors).
     // ---------------------------------------------------------------------

     /**
      * @brief Get the pointer to the A matrix data (input matrix).
      * @return Pointer to the A matrix data on the device
      */
     double* get_A_data() const { return A.get_data(); }

     /**
      * @brief Get the dimensions of the A matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of A
      */
     std::pair<int, int> get_A_dimensions() const { return {A.get_rows(), A.get_cols()}; }

     /**
      * @brief Get the pointer to the Z1 matrix data (pre-activation of hidden layer).
      * @return Pointer to the Z1 matrix data on the device
      */
     double* get_Z1_data() const { return Z1.get_data(); }

     /**
      * @brief Get the dimensions of the Z1 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of Z1
      */
     std::pair<int, int> get_Z1_dimensions() const { return {Z1.get_rows(), Z1.get_cols()}; }

     /**
      * @brief Get the pointer to the A1 matrix data (activation of hidden layer).
      * @return Pointer to the A1 matrix data on the device
      */
     double* get_A1_data() const { return A1.get_data(); }

     /**
      * @brief Get the dimensions of the A1 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of A1
      */
     std::pair<int, int> get_A1_dimensions() const { return {A1.get_rows(), A1.get_cols()}; }

     /**
      * @brief Get the pointer to the Z2 matrix data (pre-activation of output layer).
      * @return Pointer to the Z2 matrix data on the device
      */
     double* get_Z2_data() const { return Z2.get_data(); }

     /**
      * @brief Get the dimensions of the Z2 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of Z2
      */
     std::pair<int, int> get_Z2_dimensions() const { return {Z2.get_rows(), Z2.get_cols()}; }

     /**
      * @brief Get the pointer to the A2 matrix data (activation of output layer).
      * @return Pointer to the A2 matrix data on the device
      */
     double* get_A2_data() const { return A2.get_data(); }

     /**
      * @brief Get the dimensions of the A2 matrix.
      * @return std::pair<int, int> containing rows (first) and columns (second) of A2
      */
     std::pair<int, int> get_A2_dimensions() const { return {A2.get_rows(), A2.get_cols()}; }

 private:
     int input_size;    ///< Number of input features
     int hidden_size;   ///< Number of neurons in the hidden layer
     int output_size;   ///< Number of output classes

     Matrix W1;         ///< Weights for the hidden layer
     Vector b1;         ///< Biases for the hidden layer
     Matrix W2;         ///< Weights for the output layer
     Vector b2;         ///< Biases for the output layer

     Matrix A;          ///< Input matrix
     Matrix Z1;         ///< Pre-activation of hidden layer
     Matrix A1;         ///< Activation of hidden layer
     Matrix Z2;         ///< Pre-activation of output layer
     Matrix A2;         ///< Activation of output layer (final output)

     // NOTE(review): db1/db2 are single scalars although b1/b2 are Vectors -
     // confirm this is the intended gradient representation.
     // Both scalars are default-initialized so that get_db1()/get_db2() never
     // read an indeterminate value if called before a gradient is assigned.
     Matrix DZ2;        ///< Gradient of Z2
     Matrix DW2;        ///< Gradient of W2
     double db2 = 0.0;  ///< Gradient of b2 (scalar)
     Matrix DZ1;        ///< Gradient of Z1
     Matrix DW1;        ///< Gradient of W1
     double db1 = 0.0;  ///< Gradient of b1 (scalar)
 };


 #endif // NEURAL_NETWORK_H

Matrix
Represents a matrix with GPU-accelerated operations.
Definition: matrix.h:18

Matrix::get_rows
int get_rows() const
Get the number of rows in the matrix.
Definition: matrix_get_rows.cu:7

Matrix::get_data
double * get_data() const
Get the raw data pointer of the matrix.
Definition: matrix_get_data.cu:7

Matrix::get_cols
int get_cols() const
Get the number of columns in the matrix.
Definition: matrix_get_cols.cu:7

NeuralNetwork
Represents a simple feedforward neural network with one hidden layer.
Definition: neural_network.h:16

NeuralNetwork::get_b1_data
double * get_b1_data() const
Get the pointer to the b1 vector data.
Definition: neural_network.h:93

NeuralNetwork::backward
void backward(const Matrix &X, const Matrix &Y)
Perform backward propagation through the network.
Definition: neural_network_backward.cu:8

NeuralNetwork::get_DW1
Matrix get_DW1() const
Get the DW1 matrix.
Definition: neural_network.h:129

NeuralNetwork::update_params
void update_params(double learning_rate)
Updates the network parameters based on computed gradients.
Definition: neural_network_update_params.cu:8

NeuralNetwork::get_accuracy
double get_accuracy(const Matrix &Y) const
Calculate the accuracy of predictions compared to true labels.
Definition: neural_network_get_accuracy.cu:22

NeuralNetwork::forward
void forward(const Matrix &X)
Perform forward propagation through the network.
Definition: neural_network_forward.cu:8

NeuralNetwork::get_db2
double get_db2() const
Get the db2 scalar.
Definition: neural_network.h:147

NeuralNetwork::get_b1_size
int get_b1_size() const
Get the size of the b1 vector.
Definition: neural_network.h:117

NeuralNetwork::get_W2_data
double * get_W2_data() const
Get the pointer to the W2 matrix data.
Definition: neural_network.h:87

NeuralNetwork::get_Z1_dimensions
std::pair< int, int > get_Z1_dimensions() const
Get the dimensions of the Z1 matrix.
Definition: neural_network.h:171

NeuralNetwork::get_b2_size
int get_b2_size() const
Get the size of the b2 vector.
Definition: neural_network.h:123

NeuralNetwork::get_b2_data
double * get_b2_data() const
Get the pointer to the b2 vector data.
Definition: neural_network.h:99

NeuralNetwork::get_W1_data
double * get_W1_data() const
Get the pointer to the W1 matrix data.
Definition: neural_network.h:81

NeuralNetwork::initialize
void initialize()
Initialize the neural network parameters.
Definition: neural_network_initialize.cu:9

NeuralNetwork::get_A1_data
double * get_A1_data() const
Get the pointer to the A1 matrix data (activation of hidden layer).
Definition: neural_network.h:177

NeuralNetwork::~NeuralNetwork
~NeuralNetwork()
Destroy the NeuralNetwork object.
Definition: neural_network_destructor.cu:8

NeuralNetwork::get_db1
double get_db1() const
Get the db1 scalar.
Definition: neural_network.h:135

NeuralNetwork::get_W2_dimensions
std::pair< int, int > get_W2_dimensions() const
Get the dimensions of the W2 matrix.
Definition: neural_network.h:111

NeuralNetwork::get_A_data
double * get_A_data() const
Get the pointer to the A matrix data (input matrix).
Definition: neural_network.h:153

NeuralNetwork::get_A1_dimensions
std::pair< int, int > get_A1_dimensions() const
Get the dimensions of the A1 matrix.
Definition: neural_network.h:183

NeuralNetwork::get_Z2_data
double * get_Z2_data() const
Get the pointer to the Z2 matrix data (pre-activation of output layer).
Definition: neural_network.h:189

NeuralNetwork::get_predictions
Vector get_predictions() const
Get predictions from the output layer (A2).
Definition: neural_network_get_predictions.cu:7

NeuralNetwork::get_W1_dimensions
std::pair< int, int > get_W1_dimensions() const
Get the dimensions of the W1 matrix.
Definition: neural_network.h:105

NeuralNetwork::get_Z2_dimensions
std::pair< int, int > get_Z2_dimensions() const
Get the dimensions of the Z2 matrix.
Definition: neural_network.h:195

NeuralNetwork::get_DW2
Matrix get_DW2() const
Get the DW2 matrix.
Definition: neural_network.h:141

NeuralNetwork::get_A2_dimensions
std::pair< int, int > get_A2_dimensions() const
Get the dimensions of the A2 matrix.
Definition: neural_network.h:207

NeuralNetwork::get_A2_data
double * get_A2_data() const
Get the pointer to the A2 matrix data (activation of output layer).
Definition: neural_network.h:201

NeuralNetwork::get_Z1_data
double * get_Z1_data() const
Get the pointer to the Z1 matrix data (pre-activation of hidden layer).
Definition: neural_network.h:165

NeuralNetwork::gradient_descent
void gradient_descent(const Matrix &X, const Matrix &Y, double learning_rate, int epochs)
Perform gradient descent to train the neural network.
Definition: neural_network_gradient_descent.cu:10

NeuralNetwork::get_A_dimensions
std::pair< int, int > get_A_dimensions() const
Get the dimensions of the A matrix.
Definition: neural_network.h:159

NeuralNetwork::NeuralNetwork
NeuralNetwork(int input_size, int hidden_size, int output_size)
Construct a new NeuralNetwork object.
Definition: neural_network_constructor.cu:8

Vector
Represents a vector with GPU-accelerated operations.
Definition: vector.h:13

Vector::get_rows
int get_rows() const
Get the number of elements in the vector.
Definition: vector_get_rows.cu:7

Vector::get_data
double * get_data() const
Get the raw data pointer of the vector.
Definition: vector_get_data.cu:7