diff --git a/src/TNL/Algorithms/Segments/details/CSRAdaptiveKernelParameters.h b/src/TNL/Algorithms/Segments/details/CSRAdaptiveKernelParameters.h index 0f00fbd808772b14bb11e85951566730c766e310..843f2f7d52d56e9aab89fcc63b06b1b1f936384b 100644 --- a/src/TNL/Algorithms/Segments/details/CSRAdaptiveKernelParameters.h +++ b/src/TNL/Algorithms/Segments/details/CSRAdaptiveKernelParameters.h @@ -15,6 +15,8 @@ namespace TNL { namespace Segments { namespace details { +// This table can be used for tuning the number of CUDA threads per block depending on the size of Value. +// TODO: Perform some tests to tune these values; every entry is currently 256. static constexpr int CSRAdaptiveKernelParametersCudaBlockSizes[] = { 256, 256, 256, 256, 256, 256 }; template< int SizeOfValue = 1,