Fixing matrix elements organization for ellpack wrapping. (362ecdd4) · Commits · TNL / tnl-dev

Documentation/Examples/CMakeLists.txt

+37 −75

Original line number	Diff line number	Diff line
		@@ -3,80 +3,42 @@ ADD_SUBDIRECTORY( Containers )
		ADD_SUBDIRECTORY( Pointers )
		ADD_SUBDIRECTORY( Matrices )

		ADD_EXECUTABLE( FileExample FileExample.cpp )
		ADD_CUSTOM_COMMAND( COMMAND FileExample > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileExample.out OUTPUT FileExample.out )

		IF( BUILD_CUDA )
		CUDA_ADD_EXECUTABLE(FileExampleCuda FileExampleCuda.cu)
		ADD_CUSTOM_COMMAND( COMMAND FileExampleCuda > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileExampleCuda.out OUTPUT FileExampleCuda.out )
		ENDIF()

		ADD_EXECUTABLE( FileExampleSaveAndLoad FileExampleSaveAndLoad.cpp )
		ADD_CUSTOM_COMMAND( COMMAND FileExampleSaveAndLoad > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileExampleSaveAndLoad.out OUTPUT FileExampleSaveAndLoad.out )

		ADD_EXECUTABLE( FileNameExample FileNameExample.cpp )
		ADD_CUSTOM_COMMAND( COMMAND FileNameExample > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileNameExample.out OUTPUT FileNameExample.out )

		ADD_EXECUTABLE( FileNameExampleDistributedSystemNodeCoordinates FileNameExampleDistributedSystemNodeCoordinates.cpp )
		ADD_CUSTOM_COMMAND( COMMAND FileNameExampleDistributedSystemNodeCoordinates > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileNameExampleDistributedSystemNodeCoordinates.out OUTPUT FileNameExampleDistributedSystemNodeCoordinates.out )


		ADD_EXECUTABLE( FileNameExampleDistributedSystemNodeId FileNameExampleDistributedSystemNodeId.cpp )
		ADD_CUSTOM_COMMAND( COMMAND FileNameExampleDistributedSystemNodeId > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/FileNameExampleDistributedSystemNodeId.out OUTPUT FileNameExampleDistributedSystemNodeId.out )

		ADD_EXECUTABLE( ObjectExample_getType ObjectExample_getType.cpp )
		ADD_CUSTOM_COMMAND( COMMAND ObjectExample_getType > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/ObjectExample_getType.out OUTPUT ObjectExample_getType.out )

		ADD_EXECUTABLE( ParameterContainerExample ParameterContainerExample.cpp )
		ADD_EXECUTABLE( ConfigDescriptionExample ConfigDescriptionExample.cpp )
		ADD_EXECUTABLE( LoggerExample LoggerExample.cpp )
		ADD_EXECUTABLE( MathExample MathExample.cpp )

		ADD_EXECUTABLE( ParseObjectTypeExample ParseObjectTypeExample.cpp )
		ADD_CUSTOM_COMMAND( COMMAND ParseObjectTypeExample > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/ParseObjectTypeExample.out OUTPUT ParseObjectTypeExample.out )

		ADD_EXECUTABLE( StringExample StringExample.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExample > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExample.out OUTPUT StringExample.out )

		ADD_EXECUTABLE( StringExampleGetAllocatedSize StringExampleGetAllocatedSize.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExampleGetAllocatedSize > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExampleGetAllocatedSize.out OUTPUT StringExampleGetAllocatedSize.out )

		ADD_EXECUTABLE( StringExampleReplace StringExampleReplace.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExampleReplace > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExampleReplace.out OUTPUT StringExampleReplace.out )

		ADD_EXECUTABLE( StringExampleSetSize StringExampleSetSize.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExampleSetSize > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExampleSetSize.out OUTPUT StringExampleSetSize.out )

		ADD_EXECUTABLE( StringExampleSplit StringExampleSplit.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExampleSplit > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExampleSplit.out OUTPUT StringExampleSplit.out )

		ADD_EXECUTABLE( StringExampleStrip StringExampleStrip.cpp )
		ADD_CUSTOM_COMMAND( COMMAND StringExampleStrip > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/StringExampleStrip.out OUTPUT StringExampleStrip.out )

		ADD_EXECUTABLE( TimerExample TimerExample.cpp )
		ADD_CUSTOM_COMMAND( COMMAND TimerExample > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/TimerExample.out OUTPUT TimerExample.out )

		ADD_EXECUTABLE( TimerExampleLogger TimerExampleLogger.cpp )
		ADD_CUSTOM_COMMAND( COMMAND TimerExampleLogger > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/TimerExampleLogger.out OUTPUT TimerExampleLogger.out )


		ADD_CUSTOM_TARGET( RunExamples ALL DEPENDS
		FileExample.out
		FileExampleSaveAndLoad.out
		FileNameExample.out
		FileNameExampleDistributedSystemNodeCoordinates.out
		FileNameExampleDistributedSystemNodeId.out
		ObjectExample_getType.out
		ParseObjectTypeExample.out
		StringExample.out
		StringExampleGetAllocatedSize.out
		StringExampleReplace.out
		StringExampleSplit.out
		StringExampleStrip.out
		TimerExample.out
		TimerExampleLogger.out )
		set( COMMON_EXAMPLES
		FileExampleCuda
		)

		set( HOST_EXAMPLES
		FileExample
		FileExampleSaveAndLoad
		FileNameExample
		FileNameExampleDistributedSystemNodeCoordinates
		FileNameExampleDistributedSystemNodeId
		ObjectExample_getType
		ParseObjectTypeExample
		StringExample
		StringExampleGetAllocatedSize
		StringExampleReplace
		StringExampleSplit
		StringExampleStrip
		TimerExample
		TimerExampleLogger )

		if( BUILD_CUDA )
		ADD_CUSTOM_TARGET( RunExamples-cuda ALL DEPENDS
		FileExampleCuda.out )
		foreach( target IN ITEMS ${COMMON_EXAMPLES} )
		cuda_add_executable( ${target}-cuda ${target}.cu OPTIONS )
		add_custom_command( COMMAND ${target}-cuda > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/${target}.out OUTPUT ${target}.out )
		set( CUDA_OUTPUTS ${CUDA_OUTPUTS} ${target}.out )
		endforeach()
		else()
		foreach( target IN ITEMS ${COMMON_EXAMPLES} ${HOST_EXAMPLES})
		add_executable( ${target} ${target}.cpp )
		add_custom_command( COMMAND ${target} > ${TNL_DOCUMENTATION_OUTPUT_SNIPPETS_PATH}/${target}.out OUTPUT ${target}.out )
		set( HOST_OUTPUTS ${HOST_OUTPUTS} ${target}.out )
		endforeach()
		endif()

		IF( BUILD_CUDA )
		ADD_CUSTOM_TARGET( RunExamples-cuda ALL DEPENDS ${CUDA_OUTPUTS} )
		ELSE()
		ADD_CUSTOM_TARGET( RunExamples ALL DEPENDS ${HOST_OUTPUTS} )
		ENDIF()
		No newline at end of file

Documentation/Examples/Matrices/SparseMatrix/SparseMatrixViewExample_wrapEllpack.cpp

+1 −1

Original line number	Diff line number	Diff line
		@@ -26,7 +26,7 @@ void wrapMatrixView()
		/***
		* Wrap the arrays `values` and `columnIndexes` to sparse matrix view
		*/
		auto matrix = TNL::Matrices::wrapEllpackMatrix< Device >( rows, columns, 2, values, columnIndexes );
		auto matrix = TNL::Matrices::wrapEllpackMatrix< Device, TNL::Algorithms::Segments::RowMajorOrder >( rows, columns, 2, values, columnIndexes );

		std::cout << "Matrix reads as: " << std::endl << matrix << std::endl;
		}

Documentation/Tutorials/Matrices/tutorial_Matrices.md

+1 −1

Original line number	Diff line number	Diff line
		@@ -677,7 +677,7 @@ Wrapping data corresponding with the Ellpack format is very similar as we can se

		\includelineno SparseMatrixViewExample_wrapEllpack.cpp

		We encode the same sparse matrix as in the previous example. The essence of the Ellpack format is that we allocate the same number of matrix elements for each row which is two in our example. For some matrix rows we use the padding zeros for which we set the column index to -1 (line 21). Therefore the size of `valuesVector` and `columnIndexesVector` equals number of matrix rows times number of matrix elements allocated in each row. As before, we turn the vectors into C style pointers (lines 23-24) and wrap them into sparse matrix view with Ellpack format (line 29). Note that we must state the device on which the arrays are allocated explicitly. The result looks as follows:
		We encode the same sparse matrix as in the previous example. The essence of the Ellpack format is that we allocate the same number of matrix elements for each row which is two in our example. For some matrix rows we use the padding zeros for which we set the column index to -1 (line 21). Therefore the size of `valuesVector` and `columnIndexesVector` equals number of matrix rows times number of matrix elements allocated in each row. As before, we turn the vectors into C style pointers (lines 23-24) and wrap them into sparse matrix view with Ellpack format (line 29). Note that we must state the device on which the arrays are allocated explicitly and also the matrix elements organization, which is \ref TNL::Algorithms::Segments::RowMajorOrder in this case. For Ellpack matrix stored on GPU, \ref TNL::Algorithms::Segments::ColumnMajorOrder is preferred. The result looks as follows:

		\include SparseMatrixViewExample_wrapEllpack.out

src/TNL/Matrices/MatrixWrapping.h

+4 −4

Original line number	Diff line number	Diff line
		@@ -94,9 +94,9 @@ wrapCSRMatrix( const Index& rows, const Index& columns, Index* rowPointers, Real
		/// This is to prevent from appearing in Doxygen documentation.
		/// \cond HIDDEN_CLASS
		template< typename Device,
		ElementsOrganization Organization,
		typename Real,
		typename Index,
		ElementsOrganization Organization = Algorithms::Segments::DefaultElementsOrganization< Device >::getOrganization(),
		int Alignment = 1 >
		struct EllpackMatrixWrapper
		{
		@@ -140,15 +140,15 @@ struct EllpackMatrixWrapper
		* \include SparseMatrixViewExample_wrapEllpack.out
		*/
		template< typename Device,
		ElementsOrganization Organization,
		typename Real,
		typename Index,
		ElementsOrganization Organization = Algorithms::Segments::DefaultElementsOrganization< Device >::getOrganization(),
		int Alignment = 1 >
		auto
		wrapEllpackMatrix( const Index rows, const Index columns, const Index nonzerosPerRow, Real* values, Index* columnIndexes )
		-> decltype( EllpackMatrixWrapper< Device, Real, Index, Organization, Alignment >::wrap( rows, columns, nonzerosPerRow, values, columnIndexes ) )
		-> decltype( EllpackMatrixWrapper< Device, Organization, Real, Index, Alignment >::wrap( rows, columns, nonzerosPerRow, values, columnIndexes ) )
		{
		return EllpackMatrixWrapper< Device, Real, Index, Organization, Alignment >::wrap( rows, columns, nonzerosPerRow, values, columnIndexes );
		return EllpackMatrixWrapper< Device, Organization, Real, Index, Alignment >::wrap( rows, columns, nonzerosPerRow, values, columnIndexes );
		}

		} //namespace Matrices

src/TNL/Matrices/SparseMatrix.hpp

+1 −1

Original line number	Diff line number	Diff line
		@@ -165,7 +165,7 @@ getConstView() const -> ConstViewType
		this->getColumns(),
		this->getValues().getConstView(),
		this->columnIndexes.getConstView(),
		this->segments.getConstView() );
		const_cast< SparseMatrix* >( this )->segments.getView() );
		}

		template< typename Real,