// NOTE(review): the system header names below were reconstructed from the
// identifiers this file uses (CUDA runtime API, GoogleTest, std::cout,
// std::vector) -- confirm against the project's original include list.
#include <cuda_runtime_api.h>
#include <gtest/gtest.h>

#include <iostream>
#include <vector>

#include "activation_functions.cuh"
#include "matmul.cuh"
#include "cuda_helper.cuh"

// Sanity check for the sigmoid kernel: runs it on three inputs (a large
// negative value, zero, and a large positive value) and compares the results
// copied back from the device with 0, 0.5 and 1 within an absolute tolerance
// of 1e-5.
TEST(ActivationFunctionsTest, SigmoidSanityCheck) {
    constexpr int    kCount = 3;
    constexpr size_t kBytes = sizeof(float) * kCount;

    cudaError_t cudaStatus;

    const float              input[kCount]   = {-100.0f, 0.0f, 100.0f};
    const std::vector<float> expected_output = {0.0f, 0.5f, 1.0f};

    // Null-initialised so that a failed allocation never leaves an
    // indeterminate pointer behind.
    float* d_input  = nullptr;
    float* d_output = nullptr;

    // Allocation failures are fatal: nothing below is meaningful without
    // both device buffers.
    cudaStatus = cudaMalloc(reinterpret_cast<void**>(&d_input), kBytes);
    ASSERT_EQ(cudaStatus, cudaSuccess);

    cudaStatus = cudaMalloc(reinterpret_cast<void**>(&d_output), kBytes);
    if (cudaStatus != cudaSuccess) {
        // Release the first buffer before the fatal assertion returns.
        cudaFree(d_input);
    }
    ASSERT_EQ(cudaStatus, cudaSuccess);

    cudaStatus = cudaMemcpy(d_input, input, kBytes, cudaMemcpyHostToDevice);
    EXPECT_EQ(cudaStatus, cudaSuccess);

    // One block with one thread per element.
    CUDANet::Kernels::sigmoid<<<1, kCount>>>(d_input, d_output, kCount);

    // A kernel launch returns no status; launch-configuration errors are
    // reported through cudaGetLastError().
    cudaStatus = cudaGetLastError();
    EXPECT_EQ(cudaStatus, cudaSuccess);

    // Errors raised while the kernel executes surface at the next
    // synchronising call.
    cudaStatus = cudaDeviceSynchronize();
    EXPECT_EQ(cudaStatus, cudaSuccess);

    // The element type must be spelled out: `std::vector output(3)` would
    // deduce std::vector<int> and the copied floats would be misread.
    std::vector<float> output(kCount);
    cudaStatus = cudaMemcpy(
        output.data(), d_output, kBytes, cudaMemcpyDeviceToHost
    );
    EXPECT_EQ(cudaStatus, cudaSuccess);

    for (int i = 0; i < kCount; i++) {
        EXPECT_NEAR(expected_output[i], output[i], 1e-5);
    }

    EXPECT_EQ(cudaFree(d_input), cudaSuccess);
    EXPECT_EQ(cudaFree(d_output), cudaSuccess);
    EXPECT_EQ(cudaDeviceReset(), cudaSuccess);
}

// Disabled debugging helper, kept for reference: copies `length` floats from
// the device pointer `d_vec` to the host and prints them comma-separated.
// (It also accumulates `sum`, which is never printed.)
//
// void print_vec(float* d_vec, int length) {
//     std::vector<float> h_vec(length);
//     CUDA_CHECK(cudaMemcpy(
//         h_vec.data(), d_vec, sizeof(float) * length, cudaMemcpyDeviceToHost
//     ));
//
//     float sum = 0.0f;
//
//     for (int i = 0; i < length; ++i) {
//         std::cout << h_vec[i] << ", ";
//         sum += h_vec[i];
//     }
//
//     std::cout << std::endl;
// }