Loading src/Benchmarks/Convolution/kernels/sharedDataAndKernel.h +6 −0 Original line number Diff line number Diff line Loading @@ -431,6 +431,8 @@ public: constexpr auto kernel = convolution1D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, kernelSize.x(), dimensions.x(), fetchData, fetchBoundary, fetchKernel, convolve, store ); }; Loading Loading @@ -488,6 +490,8 @@ public: constexpr auto kernel = convolution2D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading Loading @@ -558,6 +562,8 @@ public: constexpr auto kernel = convolution3D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading src/Benchmarks/Convolution/kernels/sharedKernel.h +6 −0 Original line number Diff line number Diff line Loading @@ -247,6 +247,8 @@ public: constexpr auto kernel = convolution1D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, kernelSize.x(), dimensions.x(), fetchData, fetchBoundary, fetchKernel, convolve, store ); }; Loading Loading @@ -301,6 +303,8 @@ public: constexpr auto kernel = convolution2D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading Loading @@ -368,6 +372,8 @@ public: constexpr auto kernel = convolution3D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading src/Benchmarks/Convolution/kernels/sharedData.h +1 −1 File changed.Contains only whitespace changes. Show changes Loading
src/Benchmarks/Convolution/kernels/sharedDataAndKernel.h +6 −0 Original line number Diff line number Diff line Loading @@ -431,6 +431,8 @@ public: constexpr auto kernel = convolution1D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, kernelSize.x(), dimensions.x(), fetchData, fetchBoundary, fetchKernel, convolve, store ); }; Loading Loading @@ -488,6 +490,8 @@ public: constexpr auto kernel = convolution2D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading Loading @@ -558,6 +562,8 @@ public: constexpr auto kernel = convolution3D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading
src/Benchmarks/Convolution/kernels/sharedKernel.h +6 −0 Original line number Diff line number Diff line Loading @@ -247,6 +247,8 @@ public: constexpr auto kernel = convolution1D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, kernelSize.x(), dimensions.x(), fetchData, fetchBoundary, fetchKernel, convolve, store ); }; Loading Loading @@ -301,6 +303,8 @@ public: constexpr auto kernel = convolution2D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading Loading @@ -368,6 +372,8 @@ public: constexpr auto kernel = convolution3D< Index, Real, FetchData, FetchBoundary, FetchKernel, Convolve, Store >; cudaFuncSetCacheConfig(kernel, cudaFuncCachePreferShared); TNL::Cuda::launchKernel< true >( kernel, 0, configuration, Loading
src/Benchmarks/Convolution/kernels/sharedData.h +1 −1 File changed.Contains only whitespace changes. Show changes