xref: /libCEED/examples/petsc/qfunctions/bps/bp3.h (revision 5aed82e4fa97acf4ba24a7f10a35f5303a6798e0) !
1*5aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3cb32e2e7SValeria Barra //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5cb32e2e7SValeria Barra //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7cb32e2e7SValeria Barra 
8cb32e2e7SValeria Barra /// @file
9cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc
10cb32e2e7SValeria Barra 
1113921685Svaleriabarra #ifndef bp3_h
1213921685Svaleriabarra #define bp3_h
1313921685Svaleriabarra 
14c9c2c079SJeremy L Thompson #include <ceed.h>
1513921685Svaleriabarra #include <math.h>
1613921685Svaleriabarra 
17e83e87a5Sjeremylt // -----------------------------------------------------------------------------
18ea61e9acSJeremy L Thompson // This QFunction sets up the geometric factors required to apply the diffusion operator
19ed264d09SValeria Barra //
20ea61e9acSJeremy L Thompson // We require the product of the inverse of the Jacobian and its transpose to properly compute integrals of the form: int( gradv gradu)
21ed264d09SValeria Barra //
22ed264d09SValeria Barra // Determinant of Jacobian:
23ed264d09SValeria Barra //   detJ = J11*A11 + J21*A12 + J31*A13
24ed264d09SValeria Barra //     Jij = Jacobian entry ij
25ed264d09SValeria Barra //     Aij = Adjoint ij
26ed264d09SValeria Barra //
27ed264d09SValeria Barra // Inverse of Jacobian:
28ed264d09SValeria Barra //   Bij = Aij / detJ
29ed264d09SValeria Barra //
30ed264d09SValeria Barra // Product of Inverse and Transpose:
31ed264d09SValeria Barra //   BBij = sum( Bik Bkj )
32ed264d09SValeria Barra //
33ed264d09SValeria Barra // Stored: w B^T B detJ = w A^T A / detJ
34ed264d09SValeria Barra //   Note: This matrix is symmetric, so we only store 6 distinct entries
350a8fc04aSrezgarshakeri //     qd: 1 4 7
36ed264d09SValeria Barra //         2 5 8
370a8fc04aSrezgarshakeri //         3 6 9
38cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
392b730f8bSJeremy L Thompson CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
40d4d45553Srezgarshakeri   // Inputs
41d4d45553Srezgarshakeri   const CeedScalar(*J)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1];
42d4d45553Srezgarshakeri   const CeedScalar(*w)                = in[2];  // Note: *X = in[0]
43d4d45553Srezgarshakeri   // Outputs
44d4d45553Srezgarshakeri   CeedScalar(*qd) = out[0];
45cb32e2e7SValeria Barra 
46d4d45553Srezgarshakeri   const CeedInt dim = 3;
47cb32e2e7SValeria Barra   // Quadrature Point Loop
482b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
49d4d45553Srezgarshakeri     // Setup
50d4d45553Srezgarshakeri     CeedScalar A[3][3];
51d4d45553Srezgarshakeri     for (CeedInt j = 0; j < dim; j++) {
52d4d45553Srezgarshakeri       for (CeedInt k = 0; k < dim; k++) {
53d4d45553Srezgarshakeri         // Equivalent code with no mod operations:
54d4d45553Srezgarshakeri         // A[k][j] = J[k+1][j+1]*J[k+2][j+2] - J[k+1][j+2]*J[k+2][j+1]
55d4d45553Srezgarshakeri         A[k][j] = J[(k + 1) % dim][(j + 1) % dim][i] * J[(k + 2) % dim][(j + 2) % dim][i] -
56d4d45553Srezgarshakeri                   J[(k + 1) % dim][(j + 2) % dim][i] * J[(k + 2) % dim][(j + 1) % dim][i];
57d4d45553Srezgarshakeri       }
58d4d45553Srezgarshakeri     }
59d4d45553Srezgarshakeri     const CeedScalar detJ = J[0][0][i] * A[0][0] + J[0][1][i] * A[0][1] + J[0][2][i] * A[0][2];
60d4d45553Srezgarshakeri 
61d4d45553Srezgarshakeri     const CeedScalar qw = w[i] / detJ;
620a8fc04aSrezgarshakeri     qd[i + Q * 0]       = w[i] * detJ;
630a8fc04aSrezgarshakeri     qd[i + Q * 1]       = qw * (A[0][0] * A[0][0] + A[0][1] * A[0][1] + A[0][2] * A[0][2]);
640a8fc04aSrezgarshakeri     qd[i + Q * 2]       = qw * (A[0][0] * A[1][0] + A[0][1] * A[1][1] + A[0][2] * A[1][2]);
650a8fc04aSrezgarshakeri     qd[i + Q * 3]       = qw * (A[0][0] * A[2][0] + A[0][1] * A[2][1] + A[0][2] * A[2][2]);
660a8fc04aSrezgarshakeri     qd[i + Q * 4]       = qw * (A[1][0] * A[1][0] + A[1][1] * A[1][1] + A[1][2] * A[1][2]);
670a8fc04aSrezgarshakeri     qd[i + Q * 5]       = qw * (A[1][0] * A[2][0] + A[1][1] * A[2][1] + A[1][2] * A[2][2]);
680a8fc04aSrezgarshakeri     qd[i + Q * 6]       = qw * (A[2][0] * A[2][0] + A[2][1] * A[2][1] + A[2][2] * A[2][2]);
69cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
70cb32e2e7SValeria Barra 
71cb32e2e7SValeria Barra   return 0;
72cb32e2e7SValeria Barra }
73cb32e2e7SValeria Barra 
74e83e87a5Sjeremylt // -----------------------------------------------------------------------------
75ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem
76cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
772b730f8bSJeremy L Thompson CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
78cb32e2e7SValeria Barra #ifndef M_PI
79cb32e2e7SValeria Barra #define M_PI 3.14159265358979323846
80cb32e2e7SValeria Barra #endif
81e83e87a5Sjeremylt   const CeedScalar *x = in[0], *w = in[1];
82cb32e2e7SValeria Barra   CeedScalar       *true_soln = out[0], *rhs = out[1];
83cb32e2e7SValeria Barra 
84cb32e2e7SValeria Barra   // Quadrature Point Loop
852b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
86cb32e2e7SValeria Barra     const CeedScalar c[3] = {0, 1., 2.};
87cb32e2e7SValeria Barra     const CeedScalar k[3] = {1., 2., 3.};
88cb32e2e7SValeria Barra 
892b730f8bSJeremy L Thompson     true_soln[i] = sin(M_PI * (c[0] + k[0] * x[i + Q * 0])) * sin(M_PI * (c[1] + k[1] * x[i + Q * 1])) * sin(M_PI * (c[2] + k[2] * x[i + Q * 2]));
90cb32e2e7SValeria Barra 
912b730f8bSJeremy L Thompson     rhs[i] = w[i + Q * 0] * M_PI * M_PI * (k[0] * k[0] + k[1] * k[1] + k[2] * k[2]) * true_soln[i];
92cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
93cb32e2e7SValeria Barra 
94cb32e2e7SValeria Barra   return 0;
95cb32e2e7SValeria Barra }
96cb32e2e7SValeria Barra 
97e83e87a5Sjeremylt // -----------------------------------------------------------------------------
98ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field.
99ed264d09SValeria Barra //
100ed264d09SValeria Barra // Inputs:
101ed264d09SValeria Barra //   ug      - Input vector gradient at quadrature points
1029b072555Sjeremylt //   q_data  - Geometric factors
103ed264d09SValeria Barra //
104ed264d09SValeria Barra // Output:
105ed264d09SValeria Barra //   vg     - Output vector (test functions) gradient at quadrature points
106cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
1072b730f8bSJeremy L Thompson CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
1089b072555Sjeremylt   const CeedScalar *ug = in[0], *q_data = in[1];
109cb32e2e7SValeria Barra   CeedScalar       *vg = out[0];
110cb32e2e7SValeria Barra 
111cb32e2e7SValeria Barra   // Quadrature Point Loop
1122b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
113cb32e2e7SValeria Barra     // Read spatial derivatives of u
1142b730f8bSJeremy L Thompson     const CeedScalar du[3] = {ug[i + Q * 0], ug[i + Q * 1], ug[i + Q * 2]};
1159b072555Sjeremylt     // Read q_data (dXdxdXdx_T symmetric matrix)
1162b730f8bSJeremy L Thompson     const CeedScalar dXdxdXdx_T[3][3] = {
1172b730f8bSJeremy L Thompson         {q_data[i + 1 * Q], q_data[i + 2 * Q], q_data[i + 3 * Q]},
1182b730f8bSJeremy L Thompson         {q_data[i + 2 * Q], q_data[i + 4 * Q], q_data[i + 5 * Q]},
1192b730f8bSJeremy L Thompson         {q_data[i + 3 * Q], q_data[i + 5 * Q], q_data[i + 6 * Q]}
120cb32e2e7SValeria Barra     };
121cb32e2e7SValeria Barra 
1222b730f8bSJeremy L Thompson     for (int j = 0; j < 3; j++) {  // j = direction of vg
1232b730f8bSJeremy L Thompson       vg[i + j * Q] = (du[0] * dXdxdXdx_T[0][j] + du[1] * dXdxdXdx_T[1][j] + du[2] * dXdxdXdx_T[2][j]);
1242b730f8bSJeremy L Thompson     }
125cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
126cb32e2e7SValeria Barra   return 0;
127cb32e2e7SValeria Barra }
128cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
129f6b55d2cSvaleriabarra 
130f6b55d2cSvaleriabarra #endif  // bp3_h
131