cuda.reduction.SumReduction.cuh Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of komputation Show documentation
Show all versions of komputation Show documentation
Komputation is a neural network framework for the JVM written in the Kotlin programming language.
/**
 * Sums a value across the lanes of the calling warp with a shuffle-down tree.
 *
 * The offset starts at warpSize / 2 and is halved each iteration; in every
 * step a lane adds the value held by the lane `offset` positions above it.
 * After the loop, lane 0 holds the sum of the inputs of all lanes. The values
 * returned in the other lanes are partial results and must not be treated as
 * the warp total.
 *
 * Uses __shfl_down_sync (CUDA 9+). The legacy mask-less __shfl_down is
 * deprecated and not available when compiling for Volta and newer
 * architectures, where lanes of a warp are no longer implicitly synchronized.
 *
 * Precondition: because the full-warp mask is used, all non-exited lanes of
 * the warp must call this function together (i.e. the call must not sit in a
 * branch that splits the warp).
 *
 * @param thisValue  the calling lane's contribution to the sum
 * @return           in lane 0, the sum over the warp; unspecified partial sums elsewhere
 */
__inline__ __device__ float warpReduceToSum(float thisValue) {
    // Every lane of the warp participates in each exchange.
    const unsigned int fullWarpMask = 0xffffffffu;

    for (int offset = warpSize / 2; offset > 0; offset /= 2) {
        float otherValue = __shfl_down_sync(fullWarpMask, thisValue, offset, warpSize);
        thisValue += otherValue;
    }

    return thisValue;
}
/**
 * Two-stage sum reduction over the threads of a block.
 *
 * Stage 1: every warp reduces its lanes' values with warpReduceToSum, and the
 *          lane with laneId == 0 stores the warp's sum in shared[warpId].
 * Stage 2: after a block-wide barrier, the threads with warpId == 0 load the
 *          per-warp sums (one per lane, 0 for lanes beyond the number of
 *          warps) and reduce them once more.
 *
 * Contains __syncthreads(), so it must be called by all threads of the block
 * from non-divergent control flow.
 *
 * @param thisValue  the calling thread's contribution to the sum
 * @param warpId     index of the calling thread's warp; used as the write index
 *                   into `shared` (presumably threadIdx.x / warpSize - confirm
 *                   against callers)
 * @param laneId     index of the calling thread within its warp; used as the
 *                   read index into `shared` (presumably threadIdx.x % warpSize
 *                   - confirm against callers)
 * @param shared     scratch buffer visible to all threads of the block; needs
 *                   one float per warp. On return, shared[w] holds the sum of
 *                   warp w.
 */
__device__ void reduceToSum(float thisValue, int warpId, int laneId, float* shared) {
    float warpSum = warpReduceToSum(thisValue);

    // One representative lane per warp publishes that warp's partial sum.
    if (laneId == 0) {
        shared[warpId] = warpSum;
    }

    // All partial sums must be visible before any thread reads them back.
    __syncthreads();

    // Only the first (blockDim.x / warpSize) threads pick up a partial sum; the
    // rest contribute the additive identity. The integer division truncates, so
    // this assumes blockDim.x is a multiple of warpSize - otherwise the last,
    // partial warp's sum is not picked up.
    // The float literal keeps the ternary in single precision.
    thisValue = (threadIdx.x < blockDim.x / warpSize) ? shared[laneId] : 0.0f;

    if (warpId == 0) {
        // NOTE(review): the result of this second-stage reduction is discarded -
        // it is neither returned (the function is void and thisValue is passed by
        // value) nor written to `shared`. As written, the block-wide total is
        // never stored; only the per-warp sums in `shared` are observable.
        // Confirm with callers where the total is expected (e.g. shared[0]) and
        // store it there.
        warpReduceToSum(thisValue);
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy