Added examples comparing native Hypre and TNL wrappers for Hypre

76389ead · Jakub Klinkovský · Jakub Klinkovský · 19c5cac7 · 76389ead · 76389ead
Commit 76389ead authored 2 years ago by Jakub Klinkovský Committed by Jakub Klinkovský 2 years ago
--- a/src/Examples/CMakeLists.txt
+++ b/src/Examples/CMakeLists.txt
+add_subdirectory( Hypre )
 #add_subdirectory( simple-examples )
 #add_subdirectory( Hamilton-Jacobi )
 #add_subdirectory( heat-equation )

--- a/src/Examples/Hypre/CMakeLists.txt
+++ b/src/Examples/Hypre/CMakeLists.txt
+# Build the Hypre examples only when MPI support is enabled and Hypre is found.
+# The variables are tested by name (the idiomatic form) instead of being
+# expanded first, so the conditions stay well-formed even when they are unset.
+if( BUILD_MPI )
+   find_package(Hypre)
+   if( HYPRE_FOUND )
+      foreach( source IN ITEMS hypre-ex5.c tnl-hypre-ex5.cpp )
+         # The target name is the source file name without its extension.
+         # The dot needs a double backslash: a single one is consumed by the
+         # CMake string parser and would leave a regex "." that matches any
+         # character.  The pattern is anchored so that only a trailing
+         # ".c"/".cpp" is removed.
+         string( REGEX REPLACE "\\.(cpp|c)$" "" target ${source} )
+         add_executable( ${target} ${source} )
+         target_compile_definitions( ${target} PUBLIC HAVE_HYPRE )
+         target_include_directories( ${target} PUBLIC ${HYPRE_INCLUDE_DIRS} )
+         target_link_libraries( ${target} ${HYPRE_LIBRARIES} -lm )
+         install( TARGETS ${target} RUNTIME DESTINATION bin )
+      endforeach()
+   endif()
+endif()
--- a/src/Examples/Hypre/ex.h
+++ b/src/Examples/Hypre/ex.h
+/******************************************************************************
+ * Copyright (c) 1998 Lawrence Livermore National Security, LLC and other
+ * HYPRE Project Developers. See the top-level COPYRIGHT file for details.
+ *
+ * SPDX-License-Identifier: (Apache-2.0 OR MIT)
+ ******************************************************************************/
+/*--------------------------------------------------------------------------
+ * Header file for examples
+ *--------------------------------------------------------------------------*/
+#ifndef HYPRE_EXAMPLES_INCLUDES
+#define HYPRE_EXAMPLES_INCLUDES
+#include <HYPRE_config.h>
+#if defined(HYPRE_EXAMPLE_USING_CUDA)
+#include <cuda_runtime.h>
+#ifndef HYPRE_USING_UNIFIED_MEMORY
+#error *** Running the examples on GPUs requires Unified Memory. Please reconfigure and rebuild with --enable-unified-memory ***
+#endif
+/* Allocate `size` bytes with cudaMallocManaged (attached globally).
+ * Returns NULL when the CUDA runtime reports an error, so callers can test
+ * the result the same way they would test malloc(). */
+static inline void*
+gpu_malloc(size_t size)
+{
+   void *ptr = NULL;
+   if (cudaMallocManaged(&ptr, size, cudaMemAttachGlobal) != cudaSuccess)
+   {
+      return NULL;
+   }
+   return ptr;
+}
+/* Allocate a zero-initialized array of `num` elements of `size` bytes each
+ * with cudaMallocManaged (attached globally).
+ * Returns NULL when num * size overflows size_t or when the CUDA runtime
+ * reports an error during the allocation or the zero-fill. */
+static inline void*
+gpu_calloc(size_t num, size_t size)
+{
+   void *ptr = NULL;
+   size_t bytes;
+   /* (size_t) -1 is the largest size_t value: reject products that wrap */
+   if (size != 0 && num > (size_t) -1 / size)
+   {
+      return NULL;
+   }
+   bytes = num * size;
+   if (cudaMallocManaged(&ptr, bytes, cudaMemAttachGlobal) != cudaSuccess)
+   {
+      return NULL;
+   }
+   if (cudaMemset(ptr, 0, bytes) != cudaSuccess)
+   {
+      /* do not hand out memory that could not be cleared */
+      cudaFree(ptr);
+      return NULL;
+   }
+   return ptr;
+}
+/* Route the standard allocation calls used by the examples to the GPU
+ * helpers above.  free() also resets its argument to NULL, so the argument
+ * must be a modifiable pointer lvalue. */
+#define malloc(size) gpu_malloc(size)
+#define calloc(num, size) gpu_calloc(num, size)
+#define free(ptr) ( cudaFree(ptr), (ptr) = NULL )
+#endif /* #if defined(HYPRE_EXAMPLE_USING_CUDA) */
+#endif /* #ifndef HYPRE_EXAMPLES_INCLUDES */
--- a/src/Examples/Hypre/glvis-ex5.sh
+++ b/src/Examples/Hypre/glvis-ex5.sh
+#!/bin/bash
+ex=ex5
+keys=Aaamc
+dir="${1:-.}"
+mesh="$dir/$ex.mesh"
+sol="$dir/$ex.sol"
+if ! test -e "$mesh"; then
+    echo "Error: cannot find mesh file for $ex"
+    exit 1
+fi
+echo "FiniteElementSpace" > "$sol"
+echo "FiniteElementCollection: H1_2D_P1" >> "$sol"
+echo "VDim: 1" >> "$sol"
+echo "Ordering: 0" >> "$sol"
+echo "" >> "$sol"
+find "$dir" -name "$ex.sol.??????" | sort | xargs cat >> "$sol"
+glvis -m "$mesh" -g "$sol" -k "$keys"
--- a/src/Examples/Hypre/hypre-ex5.c
+++ b/src/Examples/Hypre/hypre-ex5.c
--- a/src/Examples/Hypre/tnl-hypre-ex5.cpp
+++ b/src/Examples/Hypre/tnl-hypre-ex5.cpp
+/**
+ * Description:
+ *
+ * This example solves the 2-D Laplacian problem with zero boundary conditions
+ * on an n x n grid.  The number of unknowns is N=n^2.  The standard 5-point
+ * stencil is used, and we solve for the interior nodes only.
+ *
+ * The example is based on the "ex5.c" example.  It demonstrates how the C code
+ * can be ported to C++ and TNL.  We recommend comparing this example with the
+ * original one.
+ *
+ * Compile with: use the install script from TNL
+ *
+ * Sample run:   OMP_NUM_THREADS=1 mpirun -np 4 tnl-hypre-ex5
+ */
+#include <cmath>
+#include <cstdio>
+#include <cstdlib>
+#include <exception>
+#include <iostream>
+#include <string>
+#include <TNL/Math.h>
+#include <TNL/MPI.h>
+#include <TNL/Hypre.h>
+#include <TNL/Containers/HypreParVector.h>
+#include <TNL/Matrices/HypreParCSRMatrix.h>
+#include <TNL/Solvers/Linear/Hypre.h>
+#include "vis.c"
+int
+hypre_FlexGMRESModifyPCAMGExample( void* precond_data, int iterations, double rel_residual_norm );
+/**
+ * Entry point: assembles the 2-D Laplacian on an n x n grid as a distributed
+ * matrix, solves the linear system with the solver selected on the command
+ * line and optionally saves the solution for GLVis.
+ *
+ * Returns EXIT_SUCCESS on success and after printing the help; EXIT_FAILURE
+ * when an option value is missing or invalid, when the solver ID is unknown
+ * or when the output file cannot be opened.
+ */
+int
+main( int argc, char* argv[] )
+{
+   // Initialize MPI
+   TNL::MPI::ScopedInitializer mpi( argc, argv );
+   const int myid = TNL::MPI::GetRank( MPI_COMM_WORLD );
+   const int num_procs = TNL::MPI::GetSize( MPI_COMM_WORLD );
+   // Initialize HYPRE and set some global options, notably HYPRE_SetSpGemmUseCusparse(0);
+   TNL::Hypre hypre;
+   // Default problem parameters
+   int n = 33;
+   int solver_id = 0;
+   int vis = 0;
+   // Parse the command line
+   {
+      bool print_usage = false;
+      bool bad_usage = false;
+      // Stores the integer that follows the option at position `index` into
+      // `target`.  Fails when the option is the last argument (reading past
+      // it would dereference the terminating null pointer of argv) or when
+      // the value is not a valid integer.
+      const auto read_int = [ argc, argv ]( int index, int& target ) -> bool
+      {
+         if( index + 1 >= argc )
+            return false;
+         try {
+            target = std::stoi( argv[ index + 1 ] );
+         }
+         catch( const std::exception& ) {
+            return false;
+         }
+         return true;
+      };
+      // argv[ 0 ] is the program name, the options start at index 1
+      int arg_index = 1;
+      while( arg_index < argc ) {
+         const std::string arg = argv[ arg_index ];
+         if( arg == "-n" || arg == "-solver" ) {
+            int& target = ( arg == "-n" ) ? n : solver_id;
+            if( ! read_int( arg_index, target ) ) {
+               if( myid == 0 )
+                  std::cerr << "Error: option " << arg << " requires an integer value." << std::endl;
+               bad_usage = true;
+               break;
+            }
+            // Skip the option and its value
+            arg_index += 2;
+         }
+         else if( arg == "-vis" ) {
+            vis = 1;
+            arg_index++;
+         }
+         else if( arg == "-help" ) {
+            print_usage = true;
+            break;
+         }
+         else {
+            // Unknown arguments are ignored
+            arg_index++;
+         }
+      }
+      if( ( print_usage || bad_usage ) && myid == 0 ) {
+         std::cerr << "\n"
+                      "Usage: " << argv[ 0 ] << " [<options>]\n"
+                      "\n"
+                      "  -n <n>              : problem size in each direction (default: 33)\n"
+                      "  -solver <ID>        : solver ID\n"
+                      "                        0  - AMG (default) \n"
+                      "                        1  - AMG-PCG\n"
+                      "                        8  - ParaSails-PCG\n"
+                      "                        50 - PCG\n"
+                      "                        61 - AMG-FlexGMRES\n"
+                      "  -vis                : save the solution for GLVis visualization\n"
+                   << std::endl;
+      }
+      // Every rank parses the same arguments, so all ranks leave together
+      if( bad_usage )
+         return EXIT_FAILURE;
+      if( print_usage )
+         return EXIT_SUCCESS;
+   }
+   // Set the problem sizes
+   // Preliminaries: we want at least one row per rank
+   if( n * n < num_procs )
+      n = static_cast< int >( std::sqrt( num_procs ) ) + 1;
+   const int N = n * n;               // global number of rows
+   const double h = 1.0 / ( n + 1 );  // mesh cell size
+   /* Each rank knows only of its own rows - the range is denoted by ilower
+      and iupper.  Here we partition the rows. We account for the fact that
+      N may not divide evenly by the number of ranks. */
+   HYPRE_Int local_size = N / num_procs;
+   HYPRE_Int extra = N - local_size * num_procs;
+   HYPRE_Int ilower = local_size * myid;
+   ilower += TNL::min( myid, extra );
+   HYPRE_Int iupper = local_size * ( myid + 1 );
+   iupper += TNL::min( myid + 1, extra );
+   iupper = iupper - 1;
+   // How many rows do I have?
+   local_size = iupper - ilower + 1;
+   // Let each rank create its local matrix in the CSR format in TNL
+   using CSR = TNL::Matrices::SparseMatrix< double, TNL::HYPRE_Device, HYPRE_Int >;
+   CSR A_local;
+   A_local.setDimensions( local_size, N );
+   // Allocate row capacities - this must match exactly the sparsity pattern of
+   // the matrix
+   typename CSR::RowsCapacitiesType capacities;
+   capacities.setSize( local_size );
+   auto capacities_view = capacities.getView();
+   TNL::Algorithms::ParallelFor< TNL::HYPRE_Device >::exec( ilower, iupper + 1,
+      [=] __cuda_callable__ ( HYPRE_Int i ) mutable
+      {
+         int nnz = 0;
+         // The left identity block: position i-n
+         if( i - n >= 0 )
+            nnz++;
+         // The left -1: position i-1
+         if( i % n )
+            nnz++;
+         // The diagonal: position i
+         nnz++;
+         // The right -1: position i+1
+         if( ( i + 1 ) % n )
+            nnz++;
+         // The right identity block: position i+n
+         if( i + n < N )
+            nnz++;
+         // The row index must be converted from global to local
+         capacities_view[ i - ilower ] = nnz;
+      } );
+   A_local.setRowCapacities( capacities );
+   /* Now assemble the local matrix. Each row has at most 5 entries. For
+    * example, if n=3:
+    *   A = [M -I 0; -I M -I; 0 -I M]
+    *   M = [4 -1 0; -1 4 -1; 0 -1 4]
+    */
+   A_local.forAllRows( [=] __cuda_callable__ ( typename CSR::RowView& row ) mutable {
+         // The row index must be converted from local to global
+         const HYPRE_Int i = ilower + row.getRowIndex();
+         int nnz = 0;
+         // The left identity block: position i-n
+         if( i - n >= 0 )
+            row.setElement( nnz++, i - n, -1.0 );
+         // The left -1: position i-1
+         if( i % n )
+            row.setElement( nnz++, i - 1, -1.0 );
+         // The diagonal: position i
+         row.setElement( nnz++, i, 4.0 );
+         // The right -1: position i+1
+         if( ( i + 1 ) % n )
+            row.setElement( nnz++, i + 1, -1.0 );
+         // The right identity block: position i+n
+         if( i + n < N )
+            row.setElement( nnz++, i + n, -1.0 );
+      } );
+   // Bind the TNL matrix to HypreCSR
+   TNL::Matrices::HypreCSRMatrix A_local_hypre;
+   A_local_hypre.bind( A_local );
+   // Assemble the distributed matrix in Hypre from the local blocks
+   // Note that this is a square matrix, so we indicate the row partition
+   // size twice (since number of rows = number of cols)
+   using HypreParCSR = TNL::Matrices::HypreParCSRMatrix;
+   HypreParCSR parcsr_A = HypreParCSR::fromLocalBlocks( MPI_COMM_WORLD, N, N, {ilower, iupper + 1}, {ilower, iupper + 1}, A_local_hypre );
+   // Deallocate the local matrix since it is not needed anymore in this example
+   A_local_hypre.reset();
+   A_local.reset();
+   // Create the rhs and solution vectors
+   TNL::Containers::HypreParVector par_b;
+   TNL::Containers::HypreParVector par_x;
+   par_b.setDistribution( {ilower, iupper + 1}, 0, N, MPI_COMM_WORLD );
+   par_x.setDistribution( {ilower, iupper + 1}, 0, N, MPI_COMM_WORLD );
+   // Set the rhs values to h^2 and the solution to zero
+   par_b.setValue( h * h );
+   par_x.setValue( 0.0 );
+   // Choose a solver and solve the system
+   // AMG
+   if( solver_id == 0 ) {
+      // Create the solver
+      TNL::Solvers::Linear::HypreBoomerAMG solver;
+      // Set the matrix of the linear system
+      // WARNING: setMatrix resets the preconditioner, including setting
+      //          default options.
+      // NOTE: The wrapper class sets its own default options that are
+      //       different from Hypre. The overriding settings below result in
+      //       the same state as the hypre-ex5.c example.
+      solver.setMatrix( parcsr_A );
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_BoomerAMGSetPrintLevel( solver, 3 );    // Print solve info + parameters
+      HYPRE_BoomerAMGSetOldDefault( solver );       // Falgout coarsening with modified classical interpolation
+      HYPRE_BoomerAMGSetRelaxType( solver, 6 );     // Sym. G-S/Jacobi hybrid relaxation
+      HYPRE_BoomerAMGSetRelaxOrder( solver, 1 );    // Uses C/F relaxation
+      HYPRE_BoomerAMGSetNumSweeps( solver, 1 );     // Sweeps on each level
+      HYPRE_BoomerAMGSetTol( solver, 1e-7 );        // Convergence tolerance
+      HYPRE_BoomerAMGSetMaxIter( solver, 20 );      // Use as solver: max iterations
+      HYPRE_BoomerAMGSetAggNumLevels( solver, 0 );  // number of aggressive coarsening levels
+      // Solve the linear system (calls AMG setup, solve, and prints final residual norm)
+      solver.solve( par_b, par_x );
+   }
+   // PCG
+   else if( solver_id == 50 ) {
+      // Create the solver
+      TNL::Solvers::Linear::HyprePCG solver( MPI_COMM_WORLD );
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_PCGSetMaxIter( solver, 1000 );  // max iterations
+      HYPRE_PCGSetTol( solver, 1e-7 );      // convergence tolerance
+      HYPRE_PCGSetTwoNorm( solver, 1 );     // use the two norm as the stopping criteria
+      HYPRE_PCGSetPrintLevel( solver, 2 );  // prints out the iteration info
+      // Set the matrix of the linear system
+      solver.setMatrix( parcsr_A );
+      // Ignore errors returned from Hypre functions (e.g. when PCG does not
+      // converge within the maximum iterations limit).
+      solver.setErrorMode( solver.WARN_HYPRE_ERRORS );
+      // Solve the linear system (calls PCG setup, solve, and prints final residual norm)
+      solver.solve( par_b, par_x );
+   }
+   // PCG with AMG preconditioner
+   else if( solver_id == 1 ) {
+      // Create the solver
+      TNL::Solvers::Linear::HyprePCG solver( MPI_COMM_WORLD );
+      // Create the preconditioner
+      TNL::Solvers::Linear::HypreBoomerAMG precond;
+      // Set the PCG preconditioner
+      solver.setPreconditioner( precond );
+      // Set the matrix of the linear system
+      // WARNING: setMatrix resets the preconditioner, including setting
+      //          default options.
+      solver.setMatrix( parcsr_A );
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_BoomerAMGSetPrintLevel( precond, 1 );    // Print setup info + parameters
+      HYPRE_BoomerAMGSetOldDefault( precond );       // Falgout coarsening with modified classical interpolation
+      HYPRE_BoomerAMGSetRelaxType( precond, 6 );     // Sym G.S./Jacobi hybrid relaxation
+      HYPRE_BoomerAMGSetRelaxOrder( precond, 1 );    // Uses C/F relaxation
+      HYPRE_BoomerAMGSetAggNumLevels( precond, 0 );  // number of aggressive coarsening levels
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_PCGSetMaxIter( solver, 1000 );  // max iterations
+      HYPRE_PCGSetTol( solver, 1e-7 );      // convergence tolerance
+      HYPRE_PCGSetTwoNorm( solver, 1 );     // use the two norm as the stopping criteria
+      HYPRE_PCGSetPrintLevel( solver, 2 );  // prints out the iteration info
+      // Solve the linear system (calls PCG setup, solve, and prints final residual norm)
+      solver.solve( par_b, par_x );
+   }
+   // PCG with ParaSails preconditioner
+   else if( solver_id == 8 ) {
+      // Create the solver
+      TNL::Solvers::Linear::HyprePCG solver( MPI_COMM_WORLD );
+      // Create the preconditioner
+      TNL::Solvers::Linear::HypreParaSails precond( MPI_COMM_WORLD );
+      // Set the PCG preconditioner
+      solver.setPreconditioner( precond );
+      // Set the matrix of the linear system
+      // WARNING: setMatrix resets the preconditioner, including setting
+      //          default options.
+      solver.setMatrix( parcsr_A );
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_PCGSetMaxIter( solver, 1000 );  // max iterations
+      HYPRE_PCGSetTol( solver, 1e-7 );      // convergence tolerance
+      HYPRE_PCGSetTwoNorm( solver, 1 );     // use the two norm as the stopping criteria
+      HYPRE_PCGSetPrintLevel( solver, 2 );  // prints out the iteration info
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_ParaSailsSetParams( precond, 0.1, 1 );  // threshold and max levels
+      HYPRE_ParaSailsSetFilter( precond, 0.05 );
+      HYPRE_ParaSailsSetSym( precond, 1 );
+      // Solve the linear system (calls PCG setup, solve, and prints final residual norm)
+      solver.solve( par_b, par_x );
+   }
+   // Flexible GMRES with AMG preconditioner
+   else if( solver_id == 61 ) {
+      // Create the solver
+      TNL::Solvers::Linear::HypreFlexGMRES solver( MPI_COMM_WORLD );
+      // Create the preconditioner
+      TNL::Solvers::Linear::HypreBoomerAMG precond;
+      // Set the FlexGMRES preconditioner
+      solver.setPreconditioner( precond );
+      // Set the matrix of the linear system
+      // WARNING: setMatrix resets the preconditioner, including setting
+      //          default options.
+      solver.setMatrix( parcsr_A );
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_FlexGMRESSetKDim( solver, 30 );       // restart parameter
+      HYPRE_FlexGMRESSetMaxIter( solver, 1000 );  // max iterations
+      HYPRE_FlexGMRESSetTol( solver, 1e-7 );      // convergence tolerance
+      HYPRE_FlexGMRESSetPrintLevel( solver, 2 );  // print solve info
+      // Set some parameters (See Reference Manual for more parameters)
+      HYPRE_BoomerAMGSetPrintLevel( precond, 1 );    // Print setup info + parameters
+      HYPRE_BoomerAMGSetOldDefault( precond );       // Falgout coarsening with modified classical interpolation
+      HYPRE_BoomerAMGSetRelaxType( precond, 6 );     // Sym G.S./Jacobi hybrid relaxation
+      HYPRE_BoomerAMGSetRelaxOrder( precond, 1 );    // Uses C/F relaxation
+      HYPRE_BoomerAMGSetAggNumLevels( precond, 0 );  // number of aggressive coarsening levels
+      // This is an optional call - if you don't call it,
+      // hypre_FlexGMRESModifyPCDefault is used - which does nothing.
+      // Otherwise, you can define your own, similar to the one used here
+      HYPRE_FlexGMRESSetModifyPC( solver, (HYPRE_PtrToModifyPCFcn) hypre_FlexGMRESModifyPCAMGExample );
+      // Solve the linear system (calls FlexGMRES setup, solve, and prints final residual norm)
+      solver.solve( par_b, par_x );
+   }
+   else {
+      // Only rank 0 prints the message, but every rank takes this exit so
+      // that no rank goes on to save an unsolved system or reports success.
+      if( myid == 0 )
+         std::cerr << "Invalid solver id specified." << std::endl;
+      return EXIT_FAILURE;
+   }
+   // Save the solution for GLVis visualization, see glvis-ex5.sh
+   if( vis ) {
+      char filename[ 255 ];
+      // Bounded formatting: the name can never overrun the buffer
+      snprintf( filename, sizeof( filename ), "%s.%06d", "vis_tnl/ex5.sol", myid );
+      FILE* file = fopen( filename, "w" );
+      if( file == nullptr ) {
+         printf( "Error: can't open output file %s\n", filename );
+         return EXIT_FAILURE;
+      }
+      // Save the solution
+      const auto local_x = par_x.getConstLocalView();
+      for( HYPRE_Int i = 0; i < local_size; i++ )
+         fprintf( file, "%.14e\n", local_x[ i ] );
+      fflush( file );
+      fclose( file );
+      // Save the global finite element mesh
+      if( myid == 0 )
+         GLVis_PrintGlobalSquareMesh( "vis_tnl/ex5.mesh", n - 1 );
+   }
+   return EXIT_SUCCESS;
+}
+/**
+ * Example (not a recommended practice) of a callback that changes AMG
+ * settings affecting the solve phase depending on how FlexGMRES is doing:
+ * BoomerAMG is set to 10 sweeps while the relative residual norm is above
+ * 0.1 and to 1 sweep otherwise.  For another preconditioner it may make
+ * sense to modify the tolerance instead.
+ *
+ * The iteration count is not used.  Always returns 0.
+ */
+int
+hypre_FlexGMRESModifyPCAMGExample( void* precond_data, int iterations, double rel_residual_norm )
+{
+   const int num_sweeps = ( rel_residual_norm > .1 ) ? 10 : 1;
+   HYPRE_BoomerAMGSetNumSweeps( (HYPRE_Solver) precond_data, num_sweeps );
+   return 0;
+}
--- a/src/Examples/Hypre/verify-ex5.sh
+++ b/src/Examples/Hypre/verify-ex5.sh
+#!/bin/bash
+set -e
+# make output directories
+mkdir -p vis vis_tnl
+# dbg suffix for binaries
+#dbg=""
+dbg="-dbg"
+# problem size: N=n^2
+n=100
+# disable OpenMP for reproducibility
+export OMP_NUM_THREADS=1
+# Concatenate the per-rank files ex5.sol.?????? found under directory $1 into
+# $1/ex5.sol, preceded by the GLVis grid function header.
+make_glvis() {
+    local outdir="$1"
+    local merged="$outdir/ex5.sol"
+    {
+        echo "FiniteElementSpace"
+        echo "FiniteElementCollection: H1_2D_P1"
+        echo "VDim: 1"
+        echo "Ordering: 0"
+        echo ""
+    } > "$merged"
+    find "$outdir" -name "ex5.sol.??????" | sort | xargs cat >> "$merged"
+}
+verify() {
+    make_glvis vis
+    make_glvis vis_tnl
+    diff "vis/ex5.sol" "vis_tnl/ex5.sol"
+    rm -f vis/ex5.sol* vis_tnl/ex5.sol*
+}
+# BoomerAMG
+mpirun hypre-ex5$dbg -vis -n $n -solver 0
+mpirun tnl-hypre-ex5$dbg -vis -n $n -solver 0
+verify
+# PCG
+mpirun hypre-ex5$dbg -vis -n $n -solver 50
+mpirun tnl-hypre-ex5$dbg -vis -n $n -solver 50
+verify
+# PCG with AMG
+mpirun hypre-ex5$dbg -vis -n $n -solver 1
+mpirun tnl-hypre-ex5$dbg -vis -n $n -solver 1
+verify
+# PCG with ParaSails
+mpirun hypre-ex5$dbg -vis -n $n -solver 8
+mpirun tnl-hypre-ex5$dbg -vis -n $n -solver 8
+verify
+# FlexGMRES with AMG
+mpirun hypre-ex5$dbg -vis -n $n -solver 61
+mpirun tnl-hypre-ex5$dbg -vis -n $n -solver 61
+verify
--- a/src/Examples/Hypre/vis.c
+++ b/src/Examples/Hypre/vis.c
+/******************************************************************************
+ * Copyright (c) 1998 Lawrence Livermore National Security, LLC and other
+ * HYPRE Project Developers. See the top-level COPYRIGHT file for details.
+ *
+ * SPDX-License-Identifier: (Apache-2.0 OR MIT)
+ ******************************************************************************/
+/* Save a structured n x n mesh of square elements on the unit square into a
+   GLVis mesh file with the given name. */
+#include <math.h>
+/* meshfile: path of the mesh file to (over)write
+   n:        number of elements in each direction
+   Prints an error message and exits with status 1 when the file cannot be
+   opened. */
+void GLVis_PrintGlobalSquareMesh(const char *meshfile, int n)
+{
+   FILE *file;
+   int Dim = 2;
+   int NumOfVertices = (n + 1) * (n + 1);
+   int NumOfElements = n * n;
+   int i, j;
+   double x, y;
+   /* vertex spacing; a mesh without elements (n == 0) keeps its single
+      vertex at the origin instead of dividing by zero */
+   double h = (n > 0) ? 1.0 / n : 0.0;
+   if ((file = fopen(meshfile, "w")) == NULL)
+   {
+      printf("Error: can't open output file %s\n", meshfile);
+      exit(1);
+   }
+   /* mesh header */
+   fprintf(file, "MFEM mesh v1.0\n");
+   fprintf(file, "\ndimension\n");
+   fprintf(file, "%d\n", Dim);
+   /* mesh elements: each line lists the four corner vertices of one square,
+      with vertices numbered row by row, (n + 1) per row */
+   fprintf(file, "\nelements\n");
+   fprintf(file, "%d\n", NumOfElements);
+   for (j = 0; j < n; j++)
+      for (i = 0; i < n; i++)
+         fprintf(file, "1 3 %d %d %d %d\n", i + j * (n + 1), i + 1 + j * (n + 1),
+                 i + 1 + (j + 1) * (n + 1), i + (j + 1) * (n + 1));
+   /* boundary will be generated by GLVis */
+   fprintf(file, "\nboundary\n");
+   fprintf(file, "0\n");
+   /* mesh vertices */
+   fprintf(file, "\nvertices\n");
+   fprintf(file, "%d\n", NumOfVertices);
+   fprintf(file, "%d\n", Dim);
+   for (j = 0; j < n + 1; j++)
+      for (i = 0; i < n + 1; i++)
+      {
+         x = i * h;
+         y = j * h;
+         fprintf(file, "%.14e %.14e\n", x, y);
+      }
+   fflush(file);
+   fclose(file);
+}