Commit 166bbe68 authored by Tomáš Oberhuber's avatar Tomáš Oberhuber
Browse files

Added a comment to the Adaptive CSR kernel about fine-tuning of the CUDA block size...

Added a comment to the Adaptive CSR kernel about fine-tuning of the CUDA block size depending on the size of the Value type.
parent 9c559180
Loading
Loading
Loading
Loading
+2 −0
Original line number Diff line number Diff line
@@ -15,6 +15,8 @@ namespace TNL {
      namespace Segments {
         namespace details {

// Table of CUDA block sizes (number of threads per block) that can be used for
// tuning the Adaptive CSR kernel depending on the size of Value.
// NOTE(review): how this table is indexed is not visible here - presumably by a
// quantity derived from the size of Value; confirm against the users of this table.
// TODO: Perform some tests - all entries currently hold the same value.
static constexpr int CSRAdaptiveKernelParametersCudaBlockSizes[ 6 ] = {
   256, 256, 256,
   256, 256, 256
};

template< int SizeOfValue = 1,