Commit 7110b53a authored by Jakub Klinkovský
Browse files

Fixed includes in CudaMultireductionKernel.h

parent 89bf3543
Loading
Loading
Loading
Loading
+9 −0
Original line number Diff line number Diff line
#pragma once

#ifdef HAVE_CUDA
#include <cuda.h>
#endif

#include <TNL/Assert.h>
#include <TNL/Math.h>
#include <TNL/Devices/CudaDeviceInfo.h>
#include <TNL/Containers/Algorithms/CudaReductionBuffer.h>

namespace TNL {
namespace Containers {
namespace Algorithms {
+0 −6
Original line number Diff line number Diff line
@@ -2,16 +2,10 @@

//#define CUDA_REDUCTION_PROFILING

#ifdef HAVE_CUDA
#include <cuda.h>
#endif
#include <TNL/Assert.h>
#include <TNL/Containers/Algorithms/reduction-operations.h>
#include <TNL/Containers/ArrayOperations.h>
#include <TNL/Math.h>
#include <TNL/Containers/Algorithms/CudaReductionBuffer.h>
#include <TNL/Containers/Algorithms/CudaMultireductionKernel.h>
#include <TNL/Devices/CudaDeviceInfo.h>

#ifdef CUDA_REDUCTION_PROFILING
#include <TNL/Timer.h>