Loading src/TNL/Matrices/Legacy/CSR.h +5 −2 Original line number Diff line number Diff line Loading @@ -115,8 +115,11 @@ public: static constexpr Index THREADS_VECTOR = 128; static constexpr Index THREADS_LIGHT = 128; /* Max length of row to process one warp */ static constexpr Index MAX_ELEMENTS_PER_WARP = 1024; /* Max length of row to process one warp for CSR Light, MultiVector */ static constexpr Index MAX_ELEMENTS_PER_WARP = 384; /* Max length of row to process one warp for CSR Adaptive */ static constexpr Index MAX_ELEMENTS_PER_WARP_ADAPT = 512; /* How many shared memory use per block in CSR Adaptive kernel */ static constexpr Index SHARED_PER_BLOCK = 24576; Loading src/TNL/Matrices/Legacy/CSR_impl.h +3 −3 Original line number Diff line number Diff line Loading @@ -143,7 +143,7 @@ Index findLimit(const Index start, type = Type::STREAM; return current; } else { // one long row if (sum <= 2 * matrix.MAX_ELEMENTS_PER_WARP) if (sum <= 2 * matrix.MAX_ELEMENTS_PER_WARP_ADAPT) type = Type::VECTOR; else type = Type::LONG; Loading Loading @@ -1765,7 +1765,7 @@ void SpMVCSRAdaptivePrepare( const Real *inVector, SpMVCSRAdaptive< Real, Index, warpSize, matrix.WARPS, matrix.SHARED_PER_WARP, matrix.MAX_ELEMENTS_PER_WARP > matrix.MAX_ELEMENTS_PER_WARP_ADAPT > <<<blocks, threads>>>( inVector, outVector, Loading Loading
src/TNL/Matrices/Legacy/CSR.h +5 −2 Original line number Diff line number Diff line Loading @@ -115,8 +115,11 @@ public: static constexpr Index THREADS_VECTOR = 128; static constexpr Index THREADS_LIGHT = 128; /* Max length of row to process one warp */ static constexpr Index MAX_ELEMENTS_PER_WARP = 1024; /* Max length of row to process one warp for CSR Light, MultiVector */ static constexpr Index MAX_ELEMENTS_PER_WARP = 384; /* Max length of row to process one warp for CSR Adaptive */ static constexpr Index MAX_ELEMENTS_PER_WARP_ADAPT = 512; /* How many shared memory use per block in CSR Adaptive kernel */ static constexpr Index SHARED_PER_BLOCK = 24576; Loading
src/TNL/Matrices/Legacy/CSR_impl.h +3 −3 Original line number Diff line number Diff line Loading @@ -143,7 +143,7 @@ Index findLimit(const Index start, type = Type::STREAM; return current; } else { // one long row if (sum <= 2 * matrix.MAX_ELEMENTS_PER_WARP) if (sum <= 2 * matrix.MAX_ELEMENTS_PER_WARP_ADAPT) type = Type::VECTOR; else type = Type::LONG; Loading Loading @@ -1765,7 +1765,7 @@ void SpMVCSRAdaptivePrepare( const Real *inVector, SpMVCSRAdaptive< Real, Index, warpSize, matrix.WARPS, matrix.SHARED_PER_WARP, matrix.MAX_ELEMENTS_PER_WARP > matrix.MAX_ELEMENTS_PER_WARP_ADAPT > <<<blocks, threads>>>( inVector, outVector, Loading