Commit 7b26baf

Add documentation and usage examples.
1 parent 3f4ea99 commit 7b26baf

7 files changed: +794 -0 lines changed

CMakeLists.txt

+1
@@ -8,3 +8,4 @@ include(CTest)
 
 add_subdirectory(src)
 add_subdirectory(test)
+add_subdirectory(example)

README.md

+4
@@ -6,3 +6,7 @@ derived type that describes the mapping of an array's index set to processes.
 The mapping allows for overlap between processes, and provides collective
 array gather procedures and scatter reduction procedures associated with that
 overlap.
+
+Documentation for the module is in the `doc` directory.
+
+Usage examples are in the `example` directory.
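
As a quick illustration of how the module is used (this sketch is not part of the commit), the following program outlines the basic lifecycle: create an `index_map` with a local block size, distribute a global array from rank 0, and collate it back. The calls and the block-size computation mirror those in `example/disk-fv-mpi.f90` added by this commit; the argument shapes and the `local_size` component are assumptions taken from that example rather than from the module's documented interface, which lives in `doc/index_map_type.md`.

```fortran
program index_map_sketch
  !! Illustrative sketch only; the calls used here (init, distribute, collate)
  !! and the local_size component follow the usage in example/disk-fv-mpi.f90.
  use mpi
  use index_map_type
  implicit none
  integer, parameter :: r8 = selected_real_kind(15)
  integer, parameter :: NTOT = 100   ! global number of indices (arbitrary for this sketch)
  type(index_map) :: imap
  real(r8), allocatable :: u(:), u_local(:)
  integer :: ierr, rank, nproc, bsize, n
  call MPI_Init(ierr)
  call MPI_Comm_size(MPI_COMM_WORLD, nproc, ierr)
  call MPI_Comm_rank(MPI_COMM_WORLD, rank, ierr)
  bsize = NTOT/nproc                                ! nearly equal block sizes,
  if (rank < NTOT - bsize*nproc) bsize = bsize + 1  ! as in disk-fv-mpi.f90
  call imap%init(MPI_COMM_WORLD, bsize)             ! map the index set 1..NTOT onto the ranks
  n = merge(NTOT, 0, rank == 0)                     ! the global array exists only on rank 0
  allocate(u(n), u_local(imap%local_size))
  if (rank == 0) u = 1.0_r8
  call imap%distribute(u, u_local)                  ! scatter blocks of U to the ranks
  call imap%collate(u_local, u)                     ! gather the blocks back onto rank 0
  call MPI_Finalize(ierr)
end program
```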

doc/index_map_type.md

+377
Large diffs are not rendered by default.

example/CMakeLists.txt

+7
@@ -0,0 +1,7 @@
# Want test modules in the build directory.
#unset(CMAKE_Fortran_MODULE_DIRECTORY)

add_executable(disk-fv-serial disk-fv-serial.f90)

add_executable(disk-fv-mpi disk-fv-mpi.f90)
target_link_libraries(disk-fv-mpi common MPI::MPI_Fortran)

example/README.md

+25
@@ -0,0 +1,25 @@
## Example Programs

This directory contains example programs that illustrate the use of the
`index_map_type` Fortran module.

### Finite Volume Solution of the Heat Equation on a Unit Disk

The program `disk-fv-mpi.f90` solves the heat equation $`u_t = \Delta u`$ on
the unit disk subject to zero boundary conditions. It uses a simple finite
volume discretization on a regular 2D Cartesian mesh that contains the unit
disk. Only those cells whose center is contained in the unit disk are
included in the problem. The unknowns are cell-centered values of $`u`$.
Simple first-order forward Euler time stepping is used to solve from a
uniform initial condition to a final time. Domain decomposition is used to
parallelize the computation. The cells are numbered according to the usual
order of the elements of a rank-2 array (but only for those included in
the problem) and then partitioned into approximately equal blocks, one per
MPI rank. There is a single indirect indexing array that maps a cell index
to the cell indices of its neighboring cells. For comparison, the program
`disk-fv-serial.f90` is a serial version of the solver. Aside from the initial
setup of the parallel decomposition of the problem, the only difference
between the MPI-parallel solver and the serial solver is a single call to
`index_map%gather_offp` to update the off-process elements of the local
unknown array with values from their corresponding on-process elements on
neighboring processes -- a parallel halo exchange operation.
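
To make that last point concrete, here is the core of the time-step loop, excerpted (with added comments) from `disk-fv-mpi.f90` shown further below; the serial solver runs the same loop with the `gather_offp` call removed.

```fortran
do step = 1, nstep
  ! Halo exchange: refresh the off-process elements of U_LOCAL with the
  ! current values from the ranks that own them. This is the only
  ! communication inside the time-step loop.
  call cell_map%gather_offp(u_local(1:))
  u_prev = u_local
  do j = 1, cell_map%onp_size  ! update on-process cells only
    u_local(j) = u_prev(j) + c*(sum(u_prev(cnhbr_local(:,j))) - 4*u_prev(j))
  end do
end do
```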

example/disk-fv-mpi.f90

+207
@@ -0,0 +1,207 @@
!! DISK_FV_MPI
!!
!! This example program solves the heat equation \(u_t = \Delta u\) on the
!! unit disk subject to 0 boundary conditions. It uses a simple finite volume
!! discretization on a regular 2D Cartesian mesh that contains the unit disk.
!! Only those cells whose center is contained in the unit disk are included
!! in the problem. The unknowns are cell-centered values of \(u\). Simple
!! first-order forward Euler time stepping is used to solve from a uniform
!! initial condition to a final time. Domain decomposition is used to
!! parallelize the computation. The cells are numbered according to the usual
!! order of the elements of a rank-2 array (but only for those included in
!! the problem) and then partitioned into approximately equal blocks, one per
!! MPI rank. For reference, see the serial implementation disk-fv-serial.f90.
!!
!! Copyright 2022 Neil N. Carlson <[email protected]>
!!
!! Permission is hereby granted, free of charge, to any person obtaining a
!! copy of this software and associated documentation files (the "Software"),
!! to deal in the Software without restriction, including without limitation
!! the rights to use, copy, modify, merge, publish, distribute, sublicense,
!! and/or sell copies of the Software, and to permit persons to whom the
!! Software is furnished to do so, subject to the following conditions:
!!
!! The above copyright notice and this permission notice shall be included
!! in all copies or substantial portions of the Software.
!!
!! THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
!! IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
!! FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
!! THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
!! LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
!! FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
!! DEALINGS IN THE SOFTWARE.
!!
!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!

program disk_fv_mpi

  use, intrinsic :: iso_fortran_env, only: i8 => int64, r8 => real64
  use mpi
  use index_map_type
  implicit none

  integer, parameter :: NZ = 101 ! number of zones in each dimension
  integer :: ierr, nproc, rank, bsize, n, ncell, j, step, nstep, nstep0
  integer, allocatable :: mask(:,:), cnhbr(:,:), cnhbr_local(:,:)
  real(r8), allocatable :: u(:), u_local(:), u_prev(:)
  type(index_map) :: cell_map
  real(r8) :: dt, dx, c, tfinal
  integer(i8) :: t1, t2, rate

  call MPI_Init(ierr)
  call MPI_Comm_size(MPI_COMM_WORLD, nproc, ierr)
  call MPI_Comm_rank(MPI_COMM_WORLD, rank, ierr)

  !! The MASK array marks grid cells inside the unit disk with a unique
  !! positive index. Other cells are marked with a 0. It is sized to include
  !! a border of cells around the actual grid. NCELL is the number of cells
  !! contained in the unit disk and the number of cell-centered unknowns.
  if (rank == 0) then
    allocate(mask(0:NZ+1,0:NZ+1))
    call unit_disk_mask(mask, ncell)
  end if
  call MPI_Bcast(ncell, 1, MPI_INTEGER, 0, MPI_COMM_WORLD, ierr)

  !! Create a mapping of the cell index set onto NPROC processes with
  !! nearly equal block sizes.
  bsize = ncell/nproc
  if (rank < ncell-bsize*nproc) bsize = bsize + 1
  call cell_map%init(MPI_COMM_WORLD, bsize)

  !! Create the indirect indexing array CNHBR. CNHBR(:,j) are the indices
  !! of the 4 cells adjacent to cell j, or 0 if no neighbor. CNHBR_LOCAL is
  !! the corresponding distributed indexing array with local index values.
  n = merge(ncell, 0, rank==0)
  allocate(cnhbr(4,n))
  if (rank == 0) call fill_cnhbr(mask, cnhbr)
  call cell_map%localize_index_array(cnhbr, cell_map, cnhbr_local)

  !! U is the global array of cell-centered unknowns, and U_LOCAL is the
  !! corresponding distributed array. For convenience, an extra element
  !! is prepended to the arrays for the artificial index 0 to serve as a
  !! place to hold the boundary value.
  allocate(u(0:n), u_local(0:cell_map%local_size))
  u = 1 ! initial conditions
  call cell_map%distribute(u(1:), u_local(1:))
  u_local(0) = 0 ! boundary value

  !! Time step out to time TFINAL using the explicit first order Euler
  !! method with a fixed stable time step DT.
  dx = 1.0_r8/NZ
  dt = 0.25_r8*dx**2
  c = dt/dx**2

  tfinal = 0.05_r8
  nstep = ceiling(tfinal/dt)
  tfinal = nstep*dt

  nstep0 = max(1, nstep/10) ! warm-up: start timing on this step

  allocate(u_prev, mold=u_local)
  call MPI_Barrier(MPI_COMM_WORLD, ierr) ! for timing purposes
  do step = 1, nstep
    if (step == nstep0) call system_clock(t1)
    call cell_map%gather_offp(u_local(1:))
    u_prev = u_local
    do j = 1, cell_map%onp_size
      u_local(j) = u_prev(j) + c*(sum(u_prev(cnhbr_local(:,j))) - 4*u_prev(j))
    end do
  end do
  call MPI_Barrier(MPI_COMM_WORLD, ierr) ! for timing purposes
  call system_clock(t2, rate)

  !! Gather the distributed solution onto rank 0 and output.
  call cell_map%collate(u_local(1:), u(1:))
  if (rank == 0) then
    write(*,'(a,es10.4,a)') 'Solution at t=', tfinal, ' written to out.vtk; visualize with paraview.'
    u(0) = 0 ! boundary value
    call vtk_plot(mask, u)
    write(*,'(g0,a,i0,a)') (10**6)*real(t2-t1)/real(rate)/(nstep-nstep0+1), &
        ' µsec per time step; ', ncell/nproc, ' cells per process'
  end if

  call MPI_Finalize(ierr)

contains

  !! Generate a grid mask array for a unit disk. A mask element corresponding
  !! to a grid cell whose center lies outside the unit disk is set to zero.
  !! Other elements are assigned sequential integers starting with 1 according
  !! to the normal traversal order of a rank-2 array. The number of grid cells
  !! so contained by the unit disk is returned in N.

  subroutine unit_disk_mask(mask, n)
    integer, intent(out) :: mask(0:,0:), n
    real :: dx, dy, x, y
    integer :: i, j
    mask = 0
    dx = 2.0/NZ
    dy = 2.0/NZ
    n = 0
    y = -1 + dy/2
    do j = 1, NZ
      x = -1 + dx/2
      do i = 1, NZ
        if (x**2 + y**2 <= 1) then
          n = n + 1
          mask(i,j) = n
        end if
        x = x + dx
      end do
      y = y + dy
    end do
  end subroutine

  !! Fill the cell neighbor indirect indexing array using the mask array to
  !! obtain the cell indices of the neighbors (or 0 where there is no neighbor).

  subroutine fill_cnhbr(mask, cnhbr)
    integer, intent(in) :: mask(0:,0:)
    integer, intent(out) :: cnhbr(:,:)
    integer :: n, i, j
    n = 0
    do j = 1, NZ
      do i = 1, NZ
        n = mask(i,j)
        if (n > 0) then
          cnhbr(1,n) = mask(i,j-1)
          cnhbr(2,n) = mask(i+1,j)
          cnhbr(3,n) = mask(i,j+1)
          cnhbr(4,n) = mask(i-1,j)
        end if
      end do
    end do
  end subroutine

  !! Write a VTK plot file of the solution U. The solution is embedded in a
  !! rectangular grid with boundary values (0) for grid cells outside the
  !! masked region.

  subroutine vtk_plot(mask, u)
    integer, intent(in) :: mask(0:,0:)
    real(r8), intent(in) :: u(0:)
    integer :: lun, i, j
    real, allocatable :: u_plot(:,:)
    open(newunit=lun,file='out.vtk')
    write(lun,'("# vtk DataFile Version 3.0")')
    write(lun,'("example solution")')
    write(lun,'("ASCII")')
    write(lun,'("DATASET STRUCTURED_POINTS")')
    write(lun,'("DIMENSIONS",3(1x,i0))') NZ+1, NZ+1, 1
    write(lun,'("ORIGIN 0 0 0")')
    write(lun,'("SPACING",3(1x,g0))') 1.0/NZ, 1.0/NZ, 1
    write(lun,'("CELL_DATA ",i0)') NZ**2
    write(lun,'("SCALARS u float 1")')
    write(lun,'("LOOKUP_TABLE default")')
    allocate(u_plot(NZ,NZ))
    do j = 1, NZ
      do i = 1, NZ
        u_plot(i,j) = u(mask(i,j))
      end do
    end do
    write(lun,'(g0)') u_plot
    close(lun)
  end subroutine

end program
