Loading src/TNL/Containers/Algorithms/CudaReductionKernel.h +3 −1 Original line number Diff line number Diff line Loading @@ -132,6 +132,8 @@ CudaReductionKernel( Operation operation, operation.commonReductionOnDevice( vsdata[ tid ], vsdata[ tid + 32 ] ); //printf( "4: tid %d data %f \n", tid, sdata[ tid ] ); } // TODO: If blocksize == 32, the following does not work // We do not check if tid < 16. Fix it!!! if( blockSize >= 32 ) { operation.commonReductionOnDevice( vsdata[ tid ], vsdata[ tid + 16 ] ); Loading Loading
src/TNL/Containers/Algorithms/CudaReductionKernel.h +3 −1 Original line number Diff line number Diff line Loading @@ -132,6 +132,8 @@ CudaReductionKernel( Operation operation, operation.commonReductionOnDevice( vsdata[ tid ], vsdata[ tid + 32 ] ); //printf( "4: tid %d data %f \n", tid, sdata[ tid ] ); } // TODO: If blocksize == 32, the following does not work // We do not check if tid < 16. Fix it!!! if( blockSize >= 32 ) { operation.commonReductionOnDevice( vsdata[ tid ], vsdata[ tid + 16 ] ); Loading