xref: /libCEED/examples/petsc/qfunctions/bps/bp3.h (revision d4d455536df293f3f9ba6a974c8a4079393bc3b8)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3cb32e2e7SValeria Barra //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5cb32e2e7SValeria Barra //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7cb32e2e7SValeria Barra 
8cb32e2e7SValeria Barra /// @file
9cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc
10cb32e2e7SValeria Barra 
1113921685Svaleriabarra #ifndef bp3_h
1213921685Svaleriabarra #define bp3_h
1313921685Svaleriabarra 
14c9c2c079SJeremy L Thompson #include <ceed.h>
1513921685Svaleriabarra #include <math.h>
1613921685Svaleriabarra 
17e83e87a5Sjeremylt // -----------------------------------------------------------------------------
18ed264d09SValeria Barra // This QFunction sets up the geometric factors required to apply the
19ed264d09SValeria Barra //   diffusion operator
20ed264d09SValeria Barra //
21ed264d09SValeria Barra // We require the product of the inverse of the Jacobian and its transpose to
22ed264d09SValeria Barra //   properly compute integrals of the form: int( gradv gradu)
23ed264d09SValeria Barra //
24ed264d09SValeria Barra // Determinant of Jacobian:
25ed264d09SValeria Barra //   detJ = J11*A11 + J21*A12 + J31*A13
26ed264d09SValeria Barra //     Jij = Jacobian entry ij
27ed264d09SValeria Barra //     Aij = Adjoint ij
28ed264d09SValeria Barra //
29ed264d09SValeria Barra // Inverse of Jacobian:
30ed264d09SValeria Barra //   Bij = Aij / detJ
31ed264d09SValeria Barra //
32ed264d09SValeria Barra // Product of Inverse and Transpose:
33ed264d09SValeria Barra //   BBij = sum( Bik Bkj )
34ed264d09SValeria Barra //
35ed264d09SValeria Barra // Stored: w B^T B detJ = w A^T A / detJ
36ed264d09SValeria Barra //   Note: This matrix is symmetric, so we only store 6 distinct entries
37ed264d09SValeria Barra //     qd: 0 3 6
38ed264d09SValeria Barra //         1 4 7
39ed264d09SValeria Barra //         2 5 8
40cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
41cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q,
42cb32e2e7SValeria Barra                              const CeedScalar *const *in,
43cb32e2e7SValeria Barra                              CeedScalar *const *out) {
44*d4d45553Srezgarshakeri   // Inputs
45*d4d45553Srezgarshakeri   const CeedScalar(*J)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1];
46*d4d45553Srezgarshakeri   const CeedScalar(*w)                = in[2]; // Note: *X = in[0]
47*d4d45553Srezgarshakeri   // Outputs
48*d4d45553Srezgarshakeri   CeedScalar(*qd) = out[0];
49cb32e2e7SValeria Barra 
50*d4d45553Srezgarshakeri   const CeedInt dim = 3;
51cb32e2e7SValeria Barra   // Quadrature Point Loop
52cb32e2e7SValeria Barra   CeedPragmaSIMD
53cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
54*d4d45553Srezgarshakeri     // Setup
55*d4d45553Srezgarshakeri     CeedScalar A[3][3];
56*d4d45553Srezgarshakeri     for (CeedInt j = 0; j < dim; j++) {
57*d4d45553Srezgarshakeri       for (CeedInt k = 0; k < dim; k++) {
58*d4d45553Srezgarshakeri         // Equivalent code with no mod operations:
59*d4d45553Srezgarshakeri         // A[k][j] = J[k+1][j+1]*J[k+2][j+2] - J[k+1][j+2]*J[k+2][j+1]
60*d4d45553Srezgarshakeri         A[k][j] = J[(k + 1) % dim][(j + 1) % dim][i] * J[(k + 2) % dim][(j + 2) % dim][i] -
61*d4d45553Srezgarshakeri                   J[(k + 1) % dim][(j + 2) % dim][i] * J[(k + 2) % dim][(j + 1) % dim][i];
62*d4d45553Srezgarshakeri       }
63*d4d45553Srezgarshakeri     }
64*d4d45553Srezgarshakeri     const CeedScalar detJ = J[0][0][i] * A[0][0] + J[0][1][i] * A[0][1] + J[0][2][i] * A[0][2];
65*d4d45553Srezgarshakeri 
66*d4d45553Srezgarshakeri     const CeedScalar qw = w[i] / detJ;
67*d4d45553Srezgarshakeri     qd[i+Q*0] = qw * (A[0][0]*A[0][0] + A[0][1]*A[0][1] + A[0][2]*A[0][2]);
68*d4d45553Srezgarshakeri     qd[i+Q*1] = qw * (A[0][0]*A[1][0] + A[0][1]*A[1][1] + A[0][2]*A[1][2]);
69*d4d45553Srezgarshakeri     qd[i+Q*2] = qw * (A[0][0]*A[2][0] + A[0][1]*A[2][1] + A[0][2]*A[2][2]);
70*d4d45553Srezgarshakeri     qd[i+Q*3] = qw * (A[1][0]*A[1][0] + A[1][1]*A[1][1] + A[1][2]*A[1][2]);
71*d4d45553Srezgarshakeri     qd[i+Q*4] = qw * (A[1][0]*A[2][0] + A[1][1]*A[2][1] + A[1][2]*A[2][2]);
72*d4d45553Srezgarshakeri     qd[i+Q*5] = qw * (A[2][0]*A[2][0] + A[2][1]*A[2][1] + A[2][2]*A[2][2]);
73*d4d45553Srezgarshakeri     qd[i+Q*6] = w[i] * detJ;
74cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
75cb32e2e7SValeria Barra 
76cb32e2e7SValeria Barra   return 0;
77cb32e2e7SValeria Barra }
78cb32e2e7SValeria Barra 
79e83e87a5Sjeremylt // -----------------------------------------------------------------------------
80ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem
81cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
82cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q,
83cb32e2e7SValeria Barra                              const CeedScalar *const *in,
84cb32e2e7SValeria Barra                              CeedScalar *const *out) {
85cb32e2e7SValeria Barra #ifndef M_PI
86cb32e2e7SValeria Barra #  define M_PI    3.14159265358979323846
87cb32e2e7SValeria Barra #endif
88e83e87a5Sjeremylt   const CeedScalar *x = in[0], *w = in[1];
89cb32e2e7SValeria Barra   CeedScalar *true_soln = out[0], *rhs = out[1];
90cb32e2e7SValeria Barra 
91cb32e2e7SValeria Barra   // Quadrature Point Loop
92cb32e2e7SValeria Barra   CeedPragmaSIMD
93cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
94cb32e2e7SValeria Barra     const CeedScalar c[3] = { 0, 1., 2. };
95cb32e2e7SValeria Barra     const CeedScalar k[3] = { 1., 2., 3. };
96cb32e2e7SValeria Barra 
97cb32e2e7SValeria Barra     true_soln[i] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) *
98cb32e2e7SValeria Barra                    sin(M_PI*(c[1] + k[1]*x[i+Q*1])) *
99cb32e2e7SValeria Barra                    sin(M_PI*(c[2] + k[2]*x[i+Q*2]));
100cb32e2e7SValeria Barra 
101e83e87a5Sjeremylt     rhs[i] = w[i+Q*6] * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) *
102cb32e2e7SValeria Barra              true_soln[i];
103cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
104cb32e2e7SValeria Barra 
105cb32e2e7SValeria Barra   return 0;
106cb32e2e7SValeria Barra }
107cb32e2e7SValeria Barra 
108e83e87a5Sjeremylt // -----------------------------------------------------------------------------
109ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field.
110ed264d09SValeria Barra //
111ed264d09SValeria Barra // Inputs:
112ed264d09SValeria Barra //   ug     - Input vector gradient at quadrature points
1139b072555Sjeremylt //   q_data  - Geometric factors
114ed264d09SValeria Barra //
115ed264d09SValeria Barra // Output:
116ed264d09SValeria Barra //   vg     - Output vector (test functions) gradient at quadrature points
117ed264d09SValeria Barra //
118cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
119cb32e2e7SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q,
120cb32e2e7SValeria Barra                      const CeedScalar *const *in, CeedScalar *const *out) {
1219b072555Sjeremylt   const CeedScalar *ug = in[0], *q_data = in[1];
122cb32e2e7SValeria Barra   CeedScalar *vg = out[0];
123cb32e2e7SValeria Barra 
124cb32e2e7SValeria Barra   // Quadrature Point Loop
125cb32e2e7SValeria Barra   CeedPragmaSIMD
126cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
127cb32e2e7SValeria Barra     // Read spatial derivatives of u
128cb32e2e7SValeria Barra     const CeedScalar du[3]            =  {ug[i+Q*0],
129cb32e2e7SValeria Barra                                           ug[i+Q*1],
130cb32e2e7SValeria Barra                                           ug[i+Q*2]
131cb32e2e7SValeria Barra                                          };
1329b072555Sjeremylt     // Read q_data (dXdxdXdx_T symmetric matrix)
1339b072555Sjeremylt     const CeedScalar dXdxdXdx_T[3][3] = {{q_data[i+0*Q],
1349b072555Sjeremylt                                           q_data[i+1*Q],
1359b072555Sjeremylt                                           q_data[i+2*Q]},
1369b072555Sjeremylt                                          {q_data[i+1*Q],
1379b072555Sjeremylt                                           q_data[i+3*Q],
1389b072555Sjeremylt                                           q_data[i+4*Q]},
1399b072555Sjeremylt                                          {q_data[i+2*Q],
1409b072555Sjeremylt                                           q_data[i+4*Q],
1419b072555Sjeremylt                                           q_data[i+5*Q]}
142cb32e2e7SValeria Barra                                         };
143cb32e2e7SValeria Barra 
144cb32e2e7SValeria Barra     for (int j=0; j<3; j++) // j = direction of vg
1459b072555Sjeremylt       vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] +
1469b072555Sjeremylt                    du[1] * dXdxdXdx_T[1][j] +
1479b072555Sjeremylt                    du[2] * dXdxdXdx_T[2][j]);
148cb32e2e7SValeria Barra 
149cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
150cb32e2e7SValeria Barra   return 0;
151cb32e2e7SValeria Barra }
152cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
153f6b55d2cSvaleriabarra 
154f6b55d2cSvaleriabarra #endif // bp3_h
155