Loading src/TNL/Containers/Algorithms/CudaMultireductionKernel.h +9 −0 Original line number Diff line number Diff line #pragma once #ifdef HAVE_CUDA #include <cuda.h> #endif #include <TNL/Assert.h> #include <TNL/Math.h> #include <TNL/Devices/CudaDeviceInfo.h> #include <TNL/Containers/Algorithms/CudaReductionBuffer.h> namespace TNL { namespace Containers { namespace Algorithms { Loading src/TNL/Containers/Algorithms/Multireduction_impl.h +0 −6 Original line number Diff line number Diff line Loading @@ -2,16 +2,10 @@ //#define CUDA_REDUCTION_PROFILING #ifdef HAVE_CUDA #include <cuda.h> #endif #include <TNL/Assert.h> #include <TNL/Containers/Algorithms/reduction-operations.h> #include <TNL/Containers/ArrayOperations.h> #include <TNL/Math.h> #include <TNL/Containers/Algorithms/CudaReductionBuffer.h> #include <TNL/Containers/Algorithms/CudaMultireductionKernel.h> #include <TNL/Devices/CudaDeviceInfo.h> #ifdef CUDA_REDUCTION_PROFILING #include <TNL/Timer.h> Loading Loading
src/TNL/Containers/Algorithms/CudaMultireductionKernel.h +9 −0 Original line number Diff line number Diff line #pragma once #ifdef HAVE_CUDA #include <cuda.h> #endif #include <TNL/Assert.h> #include <TNL/Math.h> #include <TNL/Devices/CudaDeviceInfo.h> #include <TNL/Containers/Algorithms/CudaReductionBuffer.h> namespace TNL { namespace Containers { namespace Algorithms { Loading
src/TNL/Containers/Algorithms/Multireduction_impl.h +0 −6 Original line number Diff line number Diff line Loading @@ -2,16 +2,10 @@ //#define CUDA_REDUCTION_PROFILING #ifdef HAVE_CUDA #include <cuda.h> #endif #include <TNL/Assert.h> #include <TNL/Containers/Algorithms/reduction-operations.h> #include <TNL/Containers/ArrayOperations.h> #include <TNL/Math.h> #include <TNL/Containers/Algorithms/CudaReductionBuffer.h> #include <TNL/Containers/Algorithms/CudaMultireductionKernel.h> #include <TNL/Devices/CudaDeviceInfo.h> #ifdef CUDA_REDUCTION_PROFILING #include <TNL/Timer.h> Loading