Represents a vector with GPU-accelerated operations. More...

#include <vector.h>

Public Member Functions
	Vector (int rows)
	Construct a new Vector object. More...

	~Vector ()
	Destroy the Vector object. More...

void	initialize ()
	Initialize the vector by setting all elements to zero. More...

void	randomize ()
	Randomize the vector elements with values between -0.5 and 0.5. More...

void	print (int decimals)
	Print the vector contents. More...

int	get_rows () const
	Get the number of elements in the vector. More...

double *	get_data () const
	Get the raw device (GPU) data pointer of the vector. More...

Vector	copy () const
	Creates a deep copy of the vector. More...

void	multiply_scalar (double scalar)
	Multiplies all elements in the vector by a scalar. More...

void	divide_scalar (double scalar)
	Divides all elements in the vector by a scalar. More...

void	subtract_scalar (double scalar)
	Subtracts a scalar value from all elements in the vector. More...

Detailed Description

Represents a vector with GPU-accelerated operations.

Definition at line 13 of file vector.h.

Constructor & Destructor Documentation

◆ Vector()

Vector::Vector ( int rows )

Construct a new Vector object.

Parameters

rows	Number of elements in the vector

Definition at line 8 of file vector_constructor.cu.

                        : rows(rows) {
     // Allocate memory on the GPU for the vector data
     cudaMalloc(&d_data, rows * sizeof(double));
 }

◆ ~Vector()

Vector::~Vector ( )

Destroy the Vector object.

Definition at line 8 of file vector_destructor.cu.

                 {
     // Free the GPU memory allocated for this vector
     cudaFree(d_data);
 }

Member Function Documentation

◆ copy()

Vector Vector::copy ( ) const

Creates a deep copy of the vector.

Returns: A new Vector object with the same content as the original.

Definition at line 13 of file vector_copy.cu.

                           {
     // Create a new vector with the same number of rows
     Vector result(rows);
     
     // Copy the data from the current vector to the new vector
     cudaMemcpy(result.d_data, d_data, rows * sizeof(double), cudaMemcpyDeviceToDevice);
     
     // Return the new vector
     return result;
 }

◆ divide_scalar()

void Vector::divide_scalar ( double scalar )

Divides all elements in the vector by a scalar.

Parameters

scalar The scalar to divide by.

Exceptions

std::invalid_argument if scalar is exactly zero.

Definition at line 47 of file vector_divide_scalar.cu.

                                         {
     // Check for division by exactly zero
     if (scalar == 0.0) {
         throw std::invalid_argument("Cannot divide by exactly zero");
     }
  
     // Calculate total number of elements
     int size = rows;
  
     // Define block and grid dimensions
     int threadsPerBlock = 256;
     int blocksPerGrid = (size + threadsPerBlock - 1) / threadsPerBlock;
  
     // Launch CUDA kernel
     vectorDivideScalarKernel<<<blocksPerGrid, threadsPerBlock>>>(d_data, scalar, size);
  
     // Check for kernel launch errors
     cudaError_t cudaStatus = cudaGetLastError();
     if (cudaStatus != cudaSuccess) {
         throw std::runtime_error("Kernel launch failed: " + std::string(cudaGetErrorString(cudaStatus)));
     }
  
     // Synchronize device
     cudaDeviceSynchronize();
 }

◆ get_data()

double * Vector::get_data ( ) const

Get the raw device (GPU) data pointer of the vector.

Returns: double* Pointer to the vector data on the device

Definition at line 7 of file vector_get_data.cu.

                                {
     // Return the pointer to the GPU memory
     return d_data;
 }

◆ get_rows()

int Vector::get_rows ( ) const

Get the number of elements in the vector.

Returns: int Number of elements

Definition at line 7 of file vector_get_rows.cu.

                            {
     // Return the number of elements in the vector
     return rows;
 }

◆ initialize()

void Vector::initialize ( )

Initialize the vector by setting all elements to zero.

Definition at line 8 of file vector_initialize.cu.

                         {
     // Use cudaMemset to set all elements of d_data to 0
     cudaMemset(d_data, 0, rows * sizeof(double));
 }

◆ multiply_scalar()

void Vector::multiply_scalar ( double scalar )

Multiplies all elements in the vector by a scalar.

Parameters

scalar The scalar to multiply by.

Definition at line 41 of file vector_multiply_scalar.cu.

                                           {
     // Calculate total number of elements
     int size = rows;
  
     // Define block and grid dimensions
     int threadsPerBlock = 256;
     int blocksPerGrid = (size + threadsPerBlock - 1) / threadsPerBlock;
  
     // Launch CUDA kernel
     vectorMultiplyScalarKernel<<<blocksPerGrid, threadsPerBlock>>>(d_data, scalar, size);
  
     // Check for kernel launch errors
     cudaError_t cudaStatus = cudaGetLastError();
     if (cudaStatus != cudaSuccess) {
         throw std::runtime_error("Kernel launch failed: " + std::string(cudaGetErrorString(cudaStatus)));
     }
  
     // Synchronize device
     cudaDeviceSynchronize();
 }

◆ print()

void Vector::print ( int decimals )

Print the vector contents.

Parameters

decimals Number of decimal places to display

Definition at line 11 of file vector_print.cu.

                                {
     // Create format string for desired number of decimals
     char format[20];
     sprintf(format, "%%d:\t%%.%df\n", decimals);
  
     // Allocate host memory to copy the data from GPU
     double* h_data = new double[rows];
     cudaMemcpy(h_data, d_data, rows * sizeof(double), cudaMemcpyDeviceToHost);
  
     // Print vector dimensions
     std::cout << "Vector with " << rows << " rows:\n";
  
     // Print column header (since vector is treated as a single column)
     std::cout << "\t0:\t\n";
  
     // Iterate over rows
     for (int i = 0; i < rows; ++i) {
         // If more than 10 rows, only print first and last 5
         if (i == 5 && rows > 10) {
             std::cout << "...\t...\n";
             i = rows - 5;  // Skip to the last 5 rows
         }
         // Print row index and value
         printf(format, i, h_data[i]);
     }
  
     // Free the allocated host memory
     delete[] h_data;
     std::cout << std::endl;
 }

◆ randomize()

void Vector::randomize ( )

Randomize the vector elements with values between -0.5 and 0.5.

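Fills the vector on the GPU with random values between -0.5 and 0.5. The seed passed to the kernel is the current wall-clock time in whole seconds, so two calls made within the same second receive the same seed.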

Definition at line 37 of file vector_randomize.cu.

                        {
     // Define the number of threads per block (a common choice for good occupancy)
     int threadsPerBlock = 256;
  
     // Calculate the number of blocks needed to cover all elements
     // We use ceiling division to ensure we have enough blocks
     int blocksPerGrid = (rows + threadsPerBlock - 1) / threadsPerBlock;
  
     // Generate a seed for the random number generator
     // We use the current time to ensure different seeds across runs
     unsigned long seed = time(NULL);
  
     // Launch the CUDA kernel
     randomizeKernel<<<blocksPerGrid, threadsPerBlock>>>(d_data, rows, seed);
  
     // Wait for the kernel to complete before returning
     // This ensures all random values are generated before any subsequent operations
     cudaDeviceSynchronize();
 }

◆ subtract_scalar()

void Vector::subtract_scalar ( double scalar )

Subtracts a scalar value from all elements in the vector.

Parameters

scalar The scalar value to subtract.

Definition at line 41 of file vector_subtract_scalar.cu.

                                           {
     // Calculate total number of elements
     int size = rows;
  
     // Define block and grid dimensions
     int threadsPerBlock = 256;
     int blocksPerGrid = (size + threadsPerBlock - 1) / threadsPerBlock;
  
     // Launch CUDA kernel
     vectorSubtractScalarKernel<<<blocksPerGrid, threadsPerBlock>>>(d_data, scalar, size);
  
     // Check for kernel launch errors
     cudaError_t cudaStatus = cudaGetLastError();
     if (cudaStatus != cudaSuccess) {
         throw std::runtime_error("Kernel launch failed: " + std::string(cudaGetErrorString(cudaStatus)));
     }
  
     // Synchronize device
     cudaDeviceSynchronize();
 }

The documentation for this class was generated from the following files:

src/linear_algebra/vector.h
src/linear_algebra/vector_constructor.cu
src/linear_algebra/vector_copy.cu
src/linear_algebra/vector_destructor.cu
src/linear_algebra/vector_divide_scalar.cu
src/linear_algebra/vector_get_data.cu
src/linear_algebra/vector_get_rows.cu
src/linear_algebra/vector_initialize.cu
src/linear_algebra/vector_multiply_scalar.cu
src/linear_algebra/vector_print.cu
src/linear_algebra/vector_randomize.cu
src/linear_algebra/vector_subtract_scalar.cu

Public Member Functions

Detailed Description

Constructor & Destructor Documentation

◆ Vector()

◆ ~Vector()

Member Function Documentation

◆ copy()

◆ divide_scalar()

◆ get_data()

◆ get_rows()

◆ initialize()

◆ multiply_scalar()

◆ print()

◆ randomize()

◆ subtract_scalar()