Tentative velocity algorithms (#1)

* Add some more structure * More updates, getting slightly further * add initial performance test for different assembly strategies * Add efficiency of parameters to output * Add notes regarding Oasis approach * Fix end of name * Add python code in demo folder * Add assembly strategies and larger P1 to book * Flake8 * Mypy fixes * BC version * Flake8 * Rewrite assembly strategy to be non-symmetric * Go back to using zerorowslocal * Update to run on EX3 * Add some more changes, no luck on EX3 * Add symmetric prior to eternal * Minor fixes * Add more docs and stuff * Restructure and add more steps * Add solver step for tentative velocity * Add more work. Now the code executes for both versions of grad p v assembly * Start adding structure to bcs * Add bc wrapper * Add DIrichlet handling and tentative velocity test * Add docs to enum * Add more work, not done yet * Add some more memory intensive stuff. Need to take a step back to consider boundary conditions and solution method for pressure correction * Add notes on splitting schemes * Flake8 * Various fixes for mypy flake8 and CI * More CI fixes Co-authored-by: Jørgen Schartum Dokken <[email protected]>
ComputationalPhysiology · Nov 7, 2022 · 17cd652 · 17cd652
1 parent f80c5f6
commit 17cd652
Show file tree

Hide file tree

Showing 21 changed files with 1,824 additions and 18 deletions.
diff --git a/.flake8 b/.flake8
@@ -1,5 +1,5 @@
 # flake8 does not support pyproject.toml, see:
 # https://github.com/PyCQA/flake8/issues/234
 [flake8]
-exclude = docs,venv
+exclude = docs,venv,build
 max-line-length = 100
diff --git a/.github/workflows/pages.yml b/.github/workflows/pages.yml
@@ -23,6 +23,7 @@ concurrency:
 env:
   # Directory that will be published on github pages
   PUBLISH_DIR: ./docs/_build/html
+  DEB_PYTHON_INSTALL_LAYOUT: deb_system
 
 jobs:
 
@@ -37,7 +38,6 @@ jobs:
       - name: Upgrade pip and setuptools
         run: |
           python3 -m pip install pip setuptools --upgrade
-          apt-get purge -y python3-setuptools
 
       - name: Install dependencies
         run: python3 -m pip install ".[test,docs]"

diff --git a/.github/workflows/test_package.yml b/.github/workflows/test_package.yml
@@ -13,6 +13,10 @@ on:
   schedule:
     # The CI is executed every day at 8am
     - cron: "0 8 * * *"
+
+env:
+  DEB_PYTHON_INSTALL_LAYOUT: deb_system
+
 jobs:
   check-code:
 
@@ -26,9 +30,8 @@ jobs:
       - uses: actions/checkout@v3
 
       - name: Upgrade pip and setuptools
-        run: |
+        run:
           python3 -m pip install pip setuptools --upgrade
-          apt-get purge -y python3-setuptools
 
       - name: "Install code"
         run: python3 -m pip install .[test]
@@ -49,9 +52,8 @@ jobs:
       - uses: actions/checkout@v3
 
       - name: Upgrade pip and setuptools
-        run: |
+        run:
           python3 -m pip install pip setuptools --upgrade
-          apt-get purge -y python3-setuptools
 
       - name: "Install oasisx"
         run: pip install .[test]

diff --git a/Makefile b/Makefile
@@ -1,14 +1,13 @@
 # List of Python demos (without file extenion) from the repo `demo` to include in the jupyterbook. 
 # These files should be listed in `docs/_toc.yml`
-#DEMOS = 
+DEMOS = "assembly_strategies"
 
+# We use --set-kernel with jupytext to make it possible for binder to pick it up
 doc: # Generate Sphinx HTML documentation, including API docs 
+	@for demo in ${DEMOS}; do \
+	jupytext --to=ipynb --set-kernel=python3 demo/$$demo.py --output=docs/$$demo.ipynb ;\
+	done
 	jupyter book build -W docs
-# We use --set-kernel with jupytext to make it possible for binder to pick it up
-# @for demo in ${DEMOS}; do \
-# 	jupytext --to=ipynb --set-kernel=python3 demo/$$demo.py --output=docs/$$demo.ipynb ;\
-# ;\
-#	done
 
 clean-pytest: # Remove output from pytest
 	rm -rf .pytest_cache

diff --git a/demo/assembly_bcs.py b/demo/assembly_bcs.py
@@ -0,0 +1,316 @@
+# ---
+# jupyter:
+#   jupytext:
+#     formats: ipynb,py:light
+#     text_representation:
+#       extension: .py
+#       format_name: light
+#       format_version: '1.5'
+#       jupytext_version: 1.14.1
+#   kernelspec:
+#     display_name: Python 3 (ipykernel)
+#     language: python
+#     name: python3
+# ---
+
+# Copyright (C) 2022 Jørgen Schartum Dokken
+#
+# This file is part of Oasisx
+# SPDX-License-Identifier:    MIT
+#
+# # Application of Dirichlet BCs
+# Illustrates how to apply bcs to the component of the tentative velocity equation.
+# We compare two strategies:
+# 1. Using matrix-vector products of pre-assembled matrices to compute the RHS
+# 2. Assemble the matrix and vector separately
+# We start by importing the necessary modules
+
+import matplotlib.pyplot as plt
+import time
+import seaborn
+import pandas
+import dolfinx
+from mpi4py import MPI
+from petsc4py import PETSc
+import ufl
+import numpy as np
+import typing
+
+
+def assembly(mesh, P: int, repeats: int, jit_options: typing.Optional[dict] = None):
+    V = dolfinx.fem.FunctionSpace(mesh, ("CG", int(P)))
+
+    def f(x):
+        return 2*np.sin(x[0])+3+2*x[1]
+    mesh.topology.create_connectivity(mesh.topology.dim-1, mesh.topology.dim)
+    boundary_facets = dolfinx.mesh.exterior_facet_indices(mesh.topology)
+    boundary_dofs = dolfinx.fem.locate_dofs_topological(V, mesh.topology.dim-1, boundary_facets)
+    g = dolfinx.fem.Function(V)
+    g.interpolate(f)
+    bcs = [dolfinx.fem.dirichletbc(g, boundary_dofs)]
+
+    dt = 0.5
+    nu = 0.3
+    u = ufl.TrialFunction(V)
+    v = ufl.TestFunction(V)
+
+    # Solution from previous time step
+    u_1 = dolfinx.fem.Function(V)
+    u_1.interpolate(lambda x: np.sin(x[0])*np.cos(x[1]))
+
+    # Define variational forms
+    mass = ufl.inner(u, v) * ufl.dx
+    stiffness = ufl.inner(ufl.grad(u), ufl.grad(v)) * ufl.dx
+
+    u_ab = [dolfinx.fem.Function(V, name=f"u_ab{i}") for i in range(mesh.geometry.dim)]
+    convection = ufl.inner(ufl.dot(ufl.as_vector(u_ab), ufl.nabla_grad(u)), v) * ufl.dx
+    for u_abi in u_ab:
+        u_abi.interpolate(lambda x: x[0])
+
+    # Compile forms for matrix vector products
+    jit_options = {} if jit_options is None else jit_options
+    mass_form = dolfinx.fem.form(mass, jit_params=jit_options)
+    stiffness_form = dolfinx.fem.form(stiffness, jit_params=jit_options)
+    convection_form = dolfinx.fem.form(convection, jit_params=jit_options)
+
+    # Compile form for vector assembly (action)
+    dt_inv = dolfinx.fem.Constant(mesh, 1./dt)
+    dt_inv.name = "dt_inv"
+    nu_c = dolfinx.fem.Constant(mesh, nu)
+    nu_c.name = "nu"
+    rhs = dt_inv * mass - 0.5 * nu_c * stiffness - 0.5*convection
+    rhs_form = dolfinx.fem.form(ufl.action(rhs, u_1), jit_params=jit_options)
+
+    # Assemble time independent matrices
+    # Mass matrix
+    M = dolfinx.fem.petsc.create_matrix(mass_form)
+    M.setOption(PETSc.Mat.Option.SYMMETRIC, True)
+    M.setOption(PETSc.Mat.Option.SYMMETRY_ETERNAL, True)
+    M.setOption(PETSc.Mat.Option.IGNORE_ZERO_ENTRIES, True)
+    dolfinx.fem.petsc.assemble_matrix(M, mass_form)
+    M.assemble()
+    M.setOption(PETSc.Mat.Option.NEW_NONZERO_LOCATIONS, False)
+
+    # Stiffness matrix
+    K = dolfinx.fem.petsc.create_matrix(stiffness_form)
+    K.setOption(PETSc.Mat.Option.SYMMETRIC, True)
+    K.setOption(PETSc.Mat.Option.SYMMETRY_ETERNAL, True)
+    K.setOption(PETSc.Mat.Option.IGNORE_ZERO_ENTRIES, True)
+    dolfinx.fem.petsc.assemble_matrix(K, stiffness_form)
+    K.assemble()
+    K.setOption(PETSc.Mat.Option.NEW_NONZERO_LOCATIONS, False)
+
+    # RHS vectors
+    b = dolfinx.fem.Function(V)
+    bx = dolfinx.fem.Function(V)
+
+    # Timing vectors
+    oasis_lhs = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+    oasis_rhs = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+    new_lhs = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+    new_rhs = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+    new_total = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+    oasis_total = np.zeros((repeats, mesh.comm.size), dtype=np.float64)
+
+    A_sp = dolfinx.fem.create_sparsity_pattern(mass_form)
+    A_sp.assemble()
+
+    A = dolfinx.cpp.la.petsc.create_matrix(mesh.comm, A_sp)
+    Ax = dolfinx.cpp.la.petsc.create_matrix(mesh.comm, A_sp)
+    D = dolfinx.cpp.la.petsc.create_matrix(mesh.comm, A_sp)
+    D.assemble()
+    for i in range(repeats):
+        mesh.comm.Barrier()
+        # --------------Oasis approach-------------------------
+        # Zero out time-dependent matrix
+        start_mat = time.perf_counter()
+        A.zeroEntries()
+        A.setOption(PETSc.Mat.Option.KEEP_NONZERO_PATTERN, True)
+        A.setOption(PETSc.Mat.Option.IGNORE_ZERO_ENTRIES, False)
+        end_mat = time.perf_counter()
+
+        # Add convection term
+        start_lhs = time.perf_counter()
+        dolfinx.fem.petsc.assemble_matrix(A, convection_form)
+        A.assemble()
+        A.scale(-0.5)
+        A.axpy(1./dt, M, PETSc.Mat.Structure.SUBSET_NONZERO_PATTERN)
+        A.axpy(-0.5*nu, K, PETSc.Mat.Structure.SUBSET_NONZERO_PATTERN)
+        end_lhs = time.perf_counter()
+
+        # Do mat-vec operations
+        b.x.array[:] = 0
+        start_rhs = time.perf_counter()
+        A.mult(u_1.vector, b.vector)
+        b.x.scatter_reverse(dolfinx.la.ScatterMode.add)
+        dolfinx.fem.petsc.set_bc(b.vector, bcs)
+        b.x.scatter_forward()
+        end_rhs = time.perf_counter()
+        t_matvec = end_rhs - start_rhs
+
+        mesh.comm.Barrier()
+        # Rescale matrix and apply bc
+        start_rescale = time.perf_counter()
+        A.scale(-1)
+        A.axpy(2/dt, M, PETSc.Mat.Structure.SUBSET_NONZERO_PATTERN)
+        for bc in bcs:
+            A.zeroRowsLocal(bc.dof_indices()[0], 1.)  # type: ignore
+        end_rescale = time.perf_counter()
+        t_matrix = end_rescale - start_rescale + end_lhs - start_lhs
+
+        mesh.comm.Barrier()
+
+        # Gather results
+        oasis_lhs[i, :] = mesh.comm.allgather(t_matrix)
+        oasis_rhs[i, :] = mesh.comm.allgather(t_matvec)
+        oasis_total[i, :] = mesh.comm.allgather(t_matrix + t_matvec)
+        # ---------------------------------------------------------
+        # Zero out time-dependent matrix
+        Ax.zeroEntries()
+        Ax.setOption(PETSc.Mat.Option.KEEP_NONZERO_PATTERN, True)
+        Ax.setOption(PETSc.Mat.Option.IGNORE_ZERO_ENTRIES, False)
+
+        mesh.comm.Barrier()
+
+        # Add convection term
+        start_lhs_new = time.perf_counter()
+        dolfinx.fem.petsc.assemble_matrix(Ax, convection_form)
+        Ax.assemble()
+        Ax.scale(0.5)
+        Ax.axpy(1./dt, M, PETSc.Mat.Structure.SUBSET_NONZERO_PATTERN)
+        Ax.axpy(0.5*nu, K, PETSc.Mat.Structure.SUBSET_NONZERO_PATTERN)
+        for bc in bcs:
+            Ax.zeroRowsLocal(bc.dof_indices()[0], 1.)  # type: ignore
+        end_lhs_new = time.perf_counter()
+
+        mesh.comm.Barrier()
+
+        # Compute the vector without using pre-generated matrices
+        bx.x.array[:] = 0
+        start_rhs_new = time.perf_counter()
+        dolfinx.fem.petsc.assemble_vector(bx.vector, rhs_form)
+        bx.x.scatter_reverse(dolfinx.la.ScatterMode.add)
+        dolfinx.fem.petsc.set_bc(bx.vector, bcs)
+        bx.x.scatter_forward()
+        end_rhs_new = time.perf_counter()
+
+        # Gather results
+        new_total[i, :] = mesh.comm.allgather(end_lhs_new - start_lhs_new
+                                              + end_rhs_new - start_rhs_new)
+        new_lhs[i, :] = mesh.comm.allgather(end_lhs_new - start_lhs_new)
+        new_rhs[i, :] = mesh.comm.allgather(end_rhs_new - start_rhs_new)
+
+        matrix_total = mesh.comm.allgather(end_mat-start_mat)
+        if mesh.comm.rank == 0:
+            print("Oasis Total", oasis_total[i],  "\nNew Total", new_total[i],
+                  "\nMatrix total", matrix_total, flush=True)
+        # Check that vectors are the same
+        if not np.allclose(bx.x.array, b.x.array):
+            print(np.max(np.abs(bx.x.array[:]-b.x.array[:])))
+            raise RuntimeError("Vectors are not equal after assembly")
+
+        # Check that matrices are the same
+        D.zeroEntries()
+        A.copy(D, PETSc.Mat.Structure.DIFFERENT_NONZERO_PATTERN)
+        D.axpy(-1, Ax, PETSc.Mat.Structure.DIFFERENT_NONZERO_PATTERN)
+        if not np.allclose(D.getValuesCSR()[2], 0):
+            print(np.max(np.abs(D.getValuesCSR()[2])))
+            raise RuntimeError("Matrices are not equal after assembly")
+    num_dofs_global = V.dofmap.index_map_bs * V.dofmap.index_map.size_global
+    return num_dofs_global, new_lhs, new_rhs, oasis_lhs, oasis_rhs, oasis_total, new_total
+
+
+# We solve the problem on a unit cube that is split into tetrahedras with `Nx`,`Ny` and `Nx`
+# tetrahera in the x, y and z-direction respectively.
+
+def run_parameter_sweep(Nx: int, Ny: int, Nz: int, repeats: int, min_degree: int,
+                        max_degree: int) -> dict:
+    # Information regarding optimization flags can be found at:
+    # https://gcc.gnu.org/onlinedocs/gcc/Optimize-Options.html
+    jit_options = {"cffi_extra_compile_args": ["-march=native", "-O3"]}
+
+    mesh = dolfinx.mesh.create_unit_cube(MPI.COMM_WORLD, Nx, Ny, Nz)
+    Ps = np.arange(min_degree, max_degree+1, dtype=np.int32)
+    j = 0
+    results = {}
+    for i, P in enumerate(Ps):
+        if mesh.comm.rank == 0:
+            print(i, P, flush=True)
+        dof, new_lhs, new_rhs, oasis_lhs, oasis_rhs, oasis_total, new_total = assembly(
+            mesh, P, repeats=repeats, jit_options=jit_options)
+        if mesh.comm.rank == 0:
+            print("Writing to dict")
+        for row in new_lhs:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "new", "side":
+                              "lhs", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+        for row in new_rhs:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "new", "side":
+                              "rhs", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+
+        for row in oasis_lhs:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "oasis", "side":
+                              "lhs", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+        for row in oasis_rhs:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "oasis", "side":
+                              "rhs", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+        for row in oasis_total:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "oasis", "side":
+                              "total", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+        for row in new_total:
+            for process in row:
+                results[j] = {"P": P, "num_dofs": dof, "method": "new", "side":
+                              "total", "time (s)": process, "procs": MPI.COMM_WORLD.size}
+                j += 1
+    return results
+
+
+# We use `pandas` and `seaborn` to visualize the results
+
+# +
+
+
+def create_plot(results: dict, outfile: str):
+    if MPI.COMM_WORLD.rank == 0:
+        df = pandas.DataFrame.from_dict(results, orient="index")
+        df["label"] = "P" + df["P"].astype(str) + " " + \
+            df["num_dofs"].astype(str) + " \n Comms: " + df["procs"].astype(str)
+        plt.figure()
+        df_rhs = df[df["side"] == "rhs"]
+        plot = seaborn.catplot(data=df_rhs, kind="swarm",  x="label",
+                               y="time (s)", hue="method")
+        plot.set(yscale="log")
+        plt.grid()
+        plt.savefig(f"{outfile}_rhs.png")
+        plt.figure()
+        df_lhs = df[df["side"] == "lhs"]
+        plot = seaborn.catplot(data=df_lhs, kind="swarm",  x="label",
+                               y="time (s)", hue="method")
+        plot.set(yscale="log")
+        plt.grid()
+        plt.savefig(f"{outfile}_lhs.png")
+        plt.figure()
+        df_total = df[df["side"] == "total"]
+        plot = seaborn.catplot(data=df_total, kind="swarm",  x="label",
+                               y="time (s)", hue="method")
+        plot.set(yscale="log")
+        plt.grid()
+        plt.savefig(f"{outfile}_total.png")
+
+# -
+
+
+# We start by running the comparison for an increasing number of degrees of freedom on a fixed grid.
+if __name__ == "__main__":
+    N = 100
+    results_p = run_parameter_sweep(N, N, N, repeats=3, min_degree=1, max_degree=3)
+    create_plot(results_p, "results")