Skip to content

Instantly share code, notes, and snippets.

@w1th0utnam3
Created June 4, 2018 21:33
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save w1th0utnam3/3f0700bcecdf9d29cabd44e86b1dcab5 to your computer and use it in GitHub Desktop.
Save w1th0utnam3/3f0700bcecdf9d29cabd44e86b1dcab5 to your computer and use it in GitHub Desktop.
FEniCS Poisson example with C/CFFI kernel
import dolfin
import dolfin.cpp
from dolfin import *
from dolfin.la import PETScMatrix, PETScVector, PETScKrylovSolver
from dolfin.jit.jit import ffc_jit
import numba as nb
import numpy as np
import cffi
import importlib
import time
# C code for Poisson tensor tabulation
TABULATE_C = """
void tabulate_tensor_A(double* A_mat, double** w, double* coords, int cell_orientation)
{
typedef double CoordsMat[4][3];
CoordsMat* coordinate_dofs = (CoordsMat*)coords;
const double* x0 = &((*coordinate_dofs)[0][0]);
const double* x1 = &((*coordinate_dofs)[1][0]);
const double* x2 = &((*coordinate_dofs)[2][0]);
const double* x3 = &((*coordinate_dofs)[3][0]);
// Entries of transformation matrix B
const double a = x1[0] - x0[0];
const double b = x2[0] - x0[0];
const double c = x3[0] - x0[0];
const double d = x1[1] - x0[1];
const double e = x2[1] - x0[1];
const double f = x3[1] - x0[1];
const double g = x1[2] - x0[2];
const double h = x2[2] - x0[2];
const double i = x3[2] - x0[2];
// Invert B
// Computation according to https://en.wikipedia.org/wiki/Invertible_matrix#Inversion_of_3_%C3%97_3_matrices
const double A = (e*i - f*h);
const double B = -(d*i - f*g);
const double C = (d*h - e*g);
const double D = -(b*i - c*h);
const double E = (a*i - c*g);
const double F = -(a*h - b*g);
const double G = (b*f - c*e);
const double H = -(a*f - c*d);
const double I = (a*e - b*d);
const double detB = a*A + b*B + c*C;
const double detB_inv = 1.0/detB;
const double Binv[3][3] = {{detB_inv*A, detB_inv*D, detB_inv*G},
{detB_inv*B, detB_inv*E, detB_inv*H},
{detB_inv*C, detB_inv*F, detB_inv*I}};
static const double gradPhi[4][3] = {{-1, -1, -1},
{ 1, 0, 0},
{ 0, 1, 0},
{ 0, 0, 1}};
// Bphi = G*B^-1
double Bphi[4][3];
for (int i = 0; i < 4; ++i) {
for (int j = 0; j < 3; ++j) {
Bphi[i][j] = 0;
for (int k = 0; k < 3; ++k) {
Bphi[i][j] += gradPhi[i][k]*Binv[k][j];
}
}
}
// A = vol*Bphi*Bphi^T
const double vol = (fabs(detB)/6.0);
for (int i = 0; i < 4; ++i) {
for (int j = 0; j < 4; ++j) {
A_mat[4*i + j] = 0;
for (int k = 0; k < 3; ++k) {
A_mat[4*i + j] += vol*Bphi[i][k]*Bphi[j][k];
}
}
}
return;
}
"""
# C header for Poisson tensor tabulation
TABULATE_H = """
void tabulate_tensor_A(double* A, double** w, double* coords, int cell_orientation);
"""
def tabulate_tensor_A(A_, w_, coords_, cell_orientation):
'''Computes the Laplace cell tensor for linear 3D Lagrange elements'''
A = nb.carray(A_, (4, 4), dtype=np.double)
coordinate_dofs = nb.carray(coords_, (4, 3), dtype=np.double)
# Coordinates of tet vertices
x0 = coordinate_dofs[0, :]
x1 = coordinate_dofs[1, :]
x2 = coordinate_dofs[2, :]
x3 = coordinate_dofs[3, :]
# Reference to global transformation matrix
B = np.zeros((3,3), dtype=np.double)
B[:, 0] = x1 - x0
B[:, 1] = x2 - x0
B[:, 2] = x3 - x0
Binv = np.linalg.inv(B)
detB = np.linalg.det(B)
# Matrix of basis function gradients
gradPhi = np.zeros((4,3), dtype=np.double)
gradPhi[0, :] = [-1, -1, -1]
gradPhi[1, :] = [1, 0, 0]
gradPhi[2, :] = [0, 1, 0]
gradPhi[3, :] = [0, 0, 1]
# Compute cell tensor
Bphi = gradPhi @ Binv
A[:,:] = np.abs(detB)/6.0*(Bphi @ Bphi.transpose())
def tabulate_tensor_L(b_, w_, coords_, cell_orientation):
'''Computes the rhs for the Poisson problem with f=1 for linear 3D Lagrange elements'''
b = nb.carray(b_, (4), dtype=np.float64)
coordinate_dofs = nb.carray(coords_, (4, 3), dtype=np.double)
# Coordinates of tet vertices
x0 = coordinate_dofs[0, :]
x1 = coordinate_dofs[1, :]
x2 = coordinate_dofs[2, :]
x3 = coordinate_dofs[3, :]
# Reference to global transformation matrix
B = np.zeros((3, 3), dtype=np.double)
B[:, 0] = x1 - x0
B[:, 1] = x2 - x0
B[:, 2] = x3 - x0
detB = np.linalg.det(B)
vol = np.abs(detB)/6.0
f = 2.0
b[:] = f * (vol / 4.0)
def solve():
# Whether to use custom Numba kernels instead of FFC
useCustomKernels = True
# Generate a unit cube with (n+1)^3 vertices
n = 22
mesh = UnitCubeMesh(MPI.comm_world, n, n, n)
Q = FunctionSpace(mesh, "Lagrange", 1)
u = TrialFunction(Q)
v = TestFunction(Q)
# Define the boundary: vertices where any component is in machine precision accuracy 0 or 1
def boundary(x):
return np.sum(np.logical_or(x < DOLFIN_EPS, x > 1.0 - DOLFIN_EPS), axis=1) > 0
u0 = Constant(0.0)
bc = DirichletBC(Q, u0, boundary)
# Initialize bilinear form and rhs
a = dolfin.cpp.fem.Form([Q._cpp_object, Q._cpp_object])
L = dolfin.cpp.fem.Form([Q._cpp_object])
# Signature of tabulate_tensor functions
sig = nb.types.void(nb.types.CPointer(nb.types.double),
nb.types.CPointer(nb.types.CPointer(nb.types.double)),
nb.types.CPointer(nb.types.double), nb.types.intc)
# Compile the python functions using Numba
fnA = nb.cfunc(sig, cache=True, nopython=True)(tabulate_tensor_A)
fnL = nb.cfunc(sig, cache=True, nopython=True)(tabulate_tensor_L)
module_name = "_laplace_kernel"
# Build the kernel
ffi = cffi.FFI()
ffi.set_source(module_name, TABULATE_C)
ffi.cdef(TABULATE_H)
ffi.compile()
# Import the compiled kernel
kernel_mod = importlib.import_module(module_name)
ffi, lib = kernel_mod.ffi, kernel_mod.lib
# Get pointer to the compiled function
fnA_ptr = ffi.cast("uintptr_t", ffi.addressof(lib, "tabulate_tensor_A"))
# Get pointers to Numba functions
#fnA_ptr = fnA.address
fnL_ptr = fnL.address
if useCustomKernels:
# Configure Forms to use own tabulate functions
a.set_cell_tabulate(0, fnA_ptr)
L.set_cell_tabulate(0, fnL_ptr)
else:
# Use FFC
# Bilinear form
jit_result = ffc_jit(dot(grad(u), grad(v)) * dx)
ufc_form = dolfin.cpp.fem.make_ufc_form(jit_result[0])
a = dolfin.cpp.fem.Form(ufc_form, [Q._cpp_object, Q._cpp_object])
# Rhs
f = Expression("2.0", element=Q.ufl_element())
jit_result = ffc_jit(f*v * dx)
ufc_form = dolfin.cpp.fem.make_ufc_form(jit_result[0])
L = dolfin.cpp.fem.Form(ufc_form, [Q._cpp_object])
# Attach rhs expression as coefficient
L.set_coefficient(0, f._cpp_object)
assembler = dolfin.cpp.fem.Assembler([[a]], [L], [bc])
A = PETScMatrix()
b = PETScVector()
# Perform assembly
start = time.time()
assembler.assemble(A, dolfin.cpp.fem.Assembler.BlockType.monolithic)
end = time.time()
# We don't care about the RHS
assembler.assemble(b, dolfin.cpp.fem.Assembler.BlockType.monolithic)
print(f"Time for assembly: {(end-start)*1000.0}ms")
Anorm = A.norm(dolfin.cpp.la.Norm.frobenius)
bnorm = b.norm(dolfin.cpp.la.Norm.l2)
print(Anorm, bnorm)
# Norms obtained with FFC and n=13
assert (np.isclose(Anorm, 60.86192203436385))
assert (np.isclose(bnorm, 0.018075523965828778))
comm = L.mesh().mpi_comm()
solver = PETScKrylovSolver(comm)
u = Function(Q)
solver.set_operator(A)
solver.solve(u.vector(), b)
# Export result
file = XDMFFile(MPI.comm_world, "poisson_3d.xdmf")
file.write(u, XDMFFile.Encoding.HDF5)
def run_example():
solve()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment