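Change vector-scalar math kernels (vec_scalar_sub, vec_scalar_div) to read the scalar via pointer dereference (*d_scalar) and pass explicit element addresses at the call sites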

This commit is contained in:
2024-04-28 19:02:57 +02:00
parent 69111f6cb1
commit 1f708f3ea3
2 changed files with 4 additions and 4 deletions

View File

@@ -46,7 +46,7 @@ __global__ void Kernels::vec_scalar_sub(
if (tid >= len) { if (tid >= len) {
return; return;
} }
d_out[tid] = d_src[tid] - d_scalar[0]; d_out[tid] = d_src[tid] - *d_scalar;
} }
__global__ void Kernels::vec_scalar_div( __global__ void Kernels::vec_scalar_div(
@@ -59,7 +59,7 @@ __global__ void Kernels::vec_scalar_div(
if (tid >= len) { if (tid >= len) {
return; return;
} }
d_out[tid] = d_src[tid] / d_scalar[0]; d_out[tid] = d_src[tid] / *d_scalar;
} }
__global__ void Kernels::vec_exp( __global__ void Kernels::vec_exp(

View File

@@ -52,7 +52,7 @@ void Activation::activate(float* d_input) {
// Subtract max value to improve numerical stability // Subtract max value to improve numerical stability
Kernels::vec_scalar_sub<<<gridSize, BLOCK_SIZE>>>( Kernels::vec_scalar_sub<<<gridSize, BLOCK_SIZE>>>(
d_input, d_input, d_max, length d_input, d_input, &d_max[0], length
); );
CUDA_CHECK(cudaGetLastError()); CUDA_CHECK(cudaGetLastError());
@@ -66,7 +66,7 @@ void Activation::activate(float* d_input) {
Utils::sum(d_input, d_softmax_sum, length); Utils::sum(d_input, d_softmax_sum, length);
Kernels::vec_scalar_div<<<gridSize, BLOCK_SIZE>>>( Kernels::vec_scalar_div<<<gridSize, BLOCK_SIZE>>>(
d_input, d_input, d_softmax_sum, length d_input, d_input, &d_softmax_sum[0], length
); );
CUDA_CHECK(cudaGetLastError()); CUDA_CHECK(cudaGetLastError());
break; break;