Loading src/TNL/Algorithms/detail/CudaReductionKernel.h +211 −72 File changed.Preview size limit exceeded, changes collapsed. Show changes src/TNL/Algorithms/detail/CudaScanKernel.h +1 −1 Original line number Diff line number Diff line Loading @@ -312,7 +312,7 @@ CudaScanKernelUpsweep( const InputView input, __syncthreads(); // Perform the parallel reduction. value = BlockReduce::reduce( reduction, value, threadIdx.x, storage.blockReduceStorage ); value = BlockReduce::reduce( reduction, identity, value, threadIdx.x, storage.blockReduceStorage ); // Store the block result in the global memory. if( threadIdx.x == 0 ) Loading Loading
src/TNL/Algorithms/detail/CudaReductionKernel.h +211 −72 File changed.Preview size limit exceeded, changes collapsed. Show changes
src/TNL/Algorithms/detail/CudaScanKernel.h +1 −1 Original line number Diff line number Diff line Loading @@ -312,7 +312,7 @@ CudaScanKernelUpsweep( const InputView input, __syncthreads(); // Perform the parallel reduction. value = BlockReduce::reduce( reduction, value, threadIdx.x, storage.blockReduceStorage ); value = BlockReduce::reduce( reduction, identity, value, threadIdx.x, storage.blockReduceStorage ); // Store the block result in the global memory. if( threadIdx.x == 0 ) Loading