Commit ad25a80f authored by Tomáš Oberhuber
Browse files

Fixed 2D optimized CUDA grid traverser.

parent ee5a7cb4
Loading
Loading
Loading
Loading
+5 −9
Original line number Diff line number Diff line
@@ -495,16 +495,12 @@ processEntities(
                 gridIdx,
                 gridEntityParameters... );
      }
      // only launches into the stream 0 are synchronized
      if( stream == 0 )
      {
         //cudaStreamSynchronize( s1 );
         //cudaStreamSynchronize( s2 );
         //cudaStreamSynchronize( s3 );
         //cudaStreamSynchronize( s4 );
      cudaStreamSynchronize( s1 );
      cudaStreamSynchronize( s2 );
      cudaStreamSynchronize( s3 );
      cudaStreamSynchronize( s4 );
      checkCudaDevice;
   }
   }
   else
   {
      dim3 cudaBlockSize( 16, 16 );