Skip to content
Snippets Groups Projects
Commit fe1ca902 authored by Tomáš Oberhuber
Browse files

Fixed indexing and data set size in traversers benchmark.

parent 23bb05df
No related branches found
No related tags found
1 merge request: !20 Traversers optimizations
......@@ -105,7 +105,7 @@ class GridTraversersBenchmark< 2, Device, Real, Index >
void writeOneUsingParallelFor()
{
Index _size = this->size;
- auto f = [=] __cuda_callable__ ( Index i, Index j, Real* data )
+ auto f = [=] __cuda_callable__ ( Index j, Index i, Real* data )
{
data[ i * _size + j ] = 1.0;
};
......@@ -146,7 +146,7 @@ class GridTraversersBenchmark< 3, Device, Real, Index >
void writeOneUsingParallelFor()
{
Index _size = this->size;
- auto f = [=] __cuda_callable__ ( Index i, Index j, Index k, Real* data )
+ auto f = [=] __cuda_callable__ ( Index k, Index j, Index i, Real* data )
{
data[ ( i * _size + j ) * _size + k ] = 1.0;
};
......
......@@ -64,7 +64,7 @@ bool runBenchmark( const Config::ParameterContainer& parameters,
cudaTraverserBenchmark.writeOneUsingParallelFor();
};
- benchmark.setOperation( "write 1 using parallel for", size * sizeof( Real ) / oneGB );
+ benchmark.setOperation( "write 1 using parallel for", pow( ( double ) size, ( double ) Dimension ) * sizeof( Real ) / oneGB );
benchmark.time( reset, "CPU", hostWriteOneUsingParallelFor );
#ifdef HAVE_CUDA
benchmark.time( reset, "GPU", cudaWriteOneUsingParallelFor );
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment