mirror of
https://github.com/lordmathis/CUDANet.git
synced 2025-11-06 01:34:22 +00:00
Change vector scalar math kernels
This commit is contained in:
@@ -46,7 +46,7 @@ __global__ void Kernels::vec_scalar_sub(
|
|||||||
if (tid >= len) {
|
if (tid >= len) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
d_out[tid] = d_src[tid] - d_scalar[0];
|
d_out[tid] = d_src[tid] - *d_scalar;
|
||||||
}
|
}
|
||||||
|
|
||||||
__global__ void Kernels::vec_scalar_div(
|
__global__ void Kernels::vec_scalar_div(
|
||||||
@@ -59,7 +59,7 @@ __global__ void Kernels::vec_scalar_div(
|
|||||||
if (tid >= len) {
|
if (tid >= len) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
d_out[tid] = d_src[tid] / d_scalar[0];
|
d_out[tid] = d_src[tid] / *d_scalar;
|
||||||
}
|
}
|
||||||
|
|
||||||
__global__ void Kernels::vec_exp(
|
__global__ void Kernels::vec_exp(
|
||||||
|
|||||||
@@ -52,7 +52,7 @@ void Activation::activate(float* d_input) {
|
|||||||
|
|
||||||
// Subtract max value to improve numerical stability
|
// Subtract max value to improve numerical stability
|
||||||
Kernels::vec_scalar_sub<<<gridSize, BLOCK_SIZE>>>(
|
Kernels::vec_scalar_sub<<<gridSize, BLOCK_SIZE>>>(
|
||||||
d_input, d_input, d_max, length
|
d_input, d_input, &d_max[0], length
|
||||||
);
|
);
|
||||||
CUDA_CHECK(cudaGetLastError());
|
CUDA_CHECK(cudaGetLastError());
|
||||||
|
|
||||||
@@ -66,7 +66,7 @@ void Activation::activate(float* d_input) {
|
|||||||
Utils::sum(d_input, d_softmax_sum, length);
|
Utils::sum(d_input, d_softmax_sum, length);
|
||||||
|
|
||||||
Kernels::vec_scalar_div<<<gridSize, BLOCK_SIZE>>>(
|
Kernels::vec_scalar_div<<<gridSize, BLOCK_SIZE>>>(
|
||||||
d_input, d_input, d_softmax_sum, length
|
d_input, d_input, &d_softmax_sum[0], length
|
||||||
);
|
);
|
||||||
CUDA_CHECK(cudaGetLastError());
|
CUDA_CHECK(cudaGetLastError());
|
||||||
break;
|
break;
|
||||||
|
|||||||
Reference in New Issue
Block a user