xref: /libCEED/examples/petsc/qfunctions/bps/bp3.h (revision 13921685346cfad96119dcd8a0eb3be08260e4ff)
1cb32e2e7SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
2cb32e2e7SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
3cb32e2e7SValeria Barra // reserved. See files LICENSE and NOTICE for details.
4cb32e2e7SValeria Barra //
5cb32e2e7SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software
6cb32e2e7SValeria Barra // libraries and APIs for efficient high-order finite element and spectral
7cb32e2e7SValeria Barra // element discretizations for exascale applications. For more information and
8cb32e2e7SValeria Barra // source code availability see http://github.com/ceed.
9cb32e2e7SValeria Barra //
10cb32e2e7SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11cb32e2e7SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office
12cb32e2e7SValeria Barra // of Science and the National Nuclear Security Administration) responsible for
13cb32e2e7SValeria Barra // the planning and preparation of a capable exascale ecosystem, including
14cb32e2e7SValeria Barra // software, applications, hardware, advanced system engineering and early
15cb32e2e7SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative.
16cb32e2e7SValeria Barra 
17cb32e2e7SValeria Barra /// @file
18cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc
19cb32e2e7SValeria Barra 
20*13921685Svaleriabarra #ifndef bp3_h
21*13921685Svaleriabarra #define bp3_h
22*13921685Svaleriabarra 
23*13921685Svaleriabarra #ifndef __CUDACC__
24*13921685Svaleriabarra #  include <math.h>
25*13921685Svaleriabarra #endif
26*13921685Svaleriabarra 
27ed264d09SValeria Barra // *****************************************************************************
28ed264d09SValeria Barra // This QFunction sets up the geometric factors required to apply the
29ed264d09SValeria Barra //   diffusion operator
30ed264d09SValeria Barra //
31ed264d09SValeria Barra // We require the product of the inverse of the Jacobian and its transpose to
32ed264d09SValeria Barra //   properly compute integrals of the form: int( gradv gradu)
33ed264d09SValeria Barra //
34ed264d09SValeria Barra // Determinant of Jacobian:
35ed264d09SValeria Barra //   detJ = J11*A11 + J21*A12 + J31*A13
36ed264d09SValeria Barra //     Jij = Jacobian entry ij
37ed264d09SValeria Barra //     Aij = Adjoint ij
38ed264d09SValeria Barra //
39ed264d09SValeria Barra // Inverse of Jacobian:
40ed264d09SValeria Barra //   Bij = Aij / detJ
41ed264d09SValeria Barra //
// Product of Inverse and its Transpose:
//   BBij = sum_k( Bik Bjk )
//
// Stored: w B B^T detJ = w A A^T / detJ
//   Note: This matrix is symmetric, so we only store 6 distinct entries
//     qd: 0 1 2
//         1 3 4
//         2 4 5
50ed264d09SValeria Barra // *****************************************************************************
51ed264d09SValeria Barra 
52cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
53cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q,
54cb32e2e7SValeria Barra                              const CeedScalar *const *in,
55cb32e2e7SValeria Barra                              CeedScalar *const *out) {
56cb32e2e7SValeria Barra   const CeedScalar *J = in[0], *w = in[1];
57cb32e2e7SValeria Barra   CeedScalar *qd = out[0];
58cb32e2e7SValeria Barra 
59cb32e2e7SValeria Barra   // Quadrature Point Loop
60cb32e2e7SValeria Barra   CeedPragmaSIMD
61cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
62cb32e2e7SValeria Barra     const CeedScalar J11 = J[i+Q*0];
63cb32e2e7SValeria Barra     const CeedScalar J21 = J[i+Q*1];
64cb32e2e7SValeria Barra     const CeedScalar J31 = J[i+Q*2];
65cb32e2e7SValeria Barra     const CeedScalar J12 = J[i+Q*3];
66cb32e2e7SValeria Barra     const CeedScalar J22 = J[i+Q*4];
67cb32e2e7SValeria Barra     const CeedScalar J32 = J[i+Q*5];
68cb32e2e7SValeria Barra     const CeedScalar J13 = J[i+Q*6];
69cb32e2e7SValeria Barra     const CeedScalar J23 = J[i+Q*7];
70cb32e2e7SValeria Barra     const CeedScalar J33 = J[i+Q*8];
71cb32e2e7SValeria Barra     const CeedScalar A11 = J22*J33 - J23*J32;
72cb32e2e7SValeria Barra     const CeedScalar A12 = J13*J32 - J12*J33;
73cb32e2e7SValeria Barra     const CeedScalar A13 = J12*J23 - J13*J22;
74cb32e2e7SValeria Barra     const CeedScalar A21 = J23*J31 - J21*J33;
75cb32e2e7SValeria Barra     const CeedScalar A22 = J11*J33 - J13*J31;
76cb32e2e7SValeria Barra     const CeedScalar A23 = J13*J21 - J11*J23;
77cb32e2e7SValeria Barra     const CeedScalar A31 = J21*J32 - J22*J31;
78cb32e2e7SValeria Barra     const CeedScalar A32 = J12*J31 - J11*J32;
79cb32e2e7SValeria Barra     const CeedScalar A33 = J11*J22 - J12*J21;
80cb32e2e7SValeria Barra     const CeedScalar qw = w[i] / (J11*A11 + J21*A12 + J31*A13);
81cb32e2e7SValeria Barra     qd[i+Q*0] = qw * (A11*A11 + A12*A12 + A13*A13);
82cb32e2e7SValeria Barra     qd[i+Q*1] = qw * (A11*A21 + A12*A22 + A13*A23);
83cb32e2e7SValeria Barra     qd[i+Q*2] = qw * (A11*A31 + A12*A32 + A13*A33);
84cb32e2e7SValeria Barra     qd[i+Q*3] = qw * (A21*A21 + A22*A22 + A23*A23);
85cb32e2e7SValeria Barra     qd[i+Q*4] = qw * (A21*A31 + A22*A32 + A23*A33);
86cb32e2e7SValeria Barra     qd[i+Q*5] = qw * (A31*A31 + A32*A32 + A33*A33);
87cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
88cb32e2e7SValeria Barra 
89cb32e2e7SValeria Barra   return 0;
90cb32e2e7SValeria Barra }
91cb32e2e7SValeria Barra 
92ed264d09SValeria Barra // *****************************************************************************
93ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem
94ed264d09SValeria Barra // *****************************************************************************
95ed264d09SValeria Barra 
96cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
97cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q,
98cb32e2e7SValeria Barra                              const CeedScalar *const *in,
99cb32e2e7SValeria Barra                              CeedScalar *const *out) {
100cb32e2e7SValeria Barra #ifndef M_PI
101cb32e2e7SValeria Barra #  define M_PI    3.14159265358979323846
102cb32e2e7SValeria Barra #endif
103cb32e2e7SValeria Barra   const CeedScalar *x = in[0], *J = in[1], *w = in[2];
104cb32e2e7SValeria Barra   CeedScalar *true_soln = out[0], *rhs = out[1];
105cb32e2e7SValeria Barra 
106cb32e2e7SValeria Barra   // Quadrature Point Loop
107cb32e2e7SValeria Barra   CeedPragmaSIMD
108cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
109cb32e2e7SValeria Barra     const CeedScalar J11 = J[i+Q*0];
110cb32e2e7SValeria Barra     const CeedScalar J21 = J[i+Q*1];
111cb32e2e7SValeria Barra     const CeedScalar J31 = J[i+Q*2];
112cb32e2e7SValeria Barra     const CeedScalar J12 = J[i+Q*3];
113cb32e2e7SValeria Barra     const CeedScalar J22 = J[i+Q*4];
114cb32e2e7SValeria Barra     const CeedScalar J32 = J[i+Q*5];
115cb32e2e7SValeria Barra     const CeedScalar J13 = J[i+Q*6];
116cb32e2e7SValeria Barra     const CeedScalar J23 = J[i+Q*7];
117cb32e2e7SValeria Barra     const CeedScalar J33 = J[i+Q*8];
118cb32e2e7SValeria Barra     const CeedScalar A11 = J22*J33 - J23*J32;
119cb32e2e7SValeria Barra     const CeedScalar A12 = J13*J32 - J12*J33;
120cb32e2e7SValeria Barra     const CeedScalar A13 = J12*J23 - J13*J22;
121cb32e2e7SValeria Barra 
122cb32e2e7SValeria Barra     const CeedScalar c[3] = { 0, 1., 2. };
123cb32e2e7SValeria Barra     const CeedScalar k[3] = { 1., 2., 3. };
124cb32e2e7SValeria Barra 
125cb32e2e7SValeria Barra     true_soln[i] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) *
126cb32e2e7SValeria Barra                    sin(M_PI*(c[1] + k[1]*x[i+Q*1])) *
127cb32e2e7SValeria Barra                    sin(M_PI*(c[2] + k[2]*x[i+Q*2]));
128cb32e2e7SValeria Barra 
129cb32e2e7SValeria Barra     const CeedScalar rho = w[i] * (J11*A11 + J21*A12 + J31*A13);
130cb32e2e7SValeria Barra     rhs[i] = rho * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) *
131cb32e2e7SValeria Barra              true_soln[i];
132cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
133cb32e2e7SValeria Barra 
134cb32e2e7SValeria Barra   return 0;
135cb32e2e7SValeria Barra }
136cb32e2e7SValeria Barra 
137ed264d09SValeria Barra // *****************************************************************************
138ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field.
139ed264d09SValeria Barra //
140ed264d09SValeria Barra // Inputs:
141ed264d09SValeria Barra //   ug     - Input vector gradient at quadrature points
142ed264d09SValeria Barra //   qdata  - Geometric factors
143ed264d09SValeria Barra //
144ed264d09SValeria Barra // Output:
145ed264d09SValeria Barra //   vg     - Output vector (test functions) gradient at quadrature points
146ed264d09SValeria Barra //
147ed264d09SValeria Barra // *****************************************************************************
148ed264d09SValeria Barra 
149cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
150cb32e2e7SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q,
151cb32e2e7SValeria Barra                      const CeedScalar *const *in, CeedScalar *const *out) {
152ed264d09SValeria Barra   const CeedScalar *ug = in[0], *qdata = in[1];
153cb32e2e7SValeria Barra   CeedScalar *vg = out[0];
154cb32e2e7SValeria Barra 
155cb32e2e7SValeria Barra   // Quadrature Point Loop
156cb32e2e7SValeria Barra   CeedPragmaSIMD
157cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
158cb32e2e7SValeria Barra     // Read spatial derivatives of u
159cb32e2e7SValeria Barra     const CeedScalar du[3]        =  {ug[i+Q*0],
160cb32e2e7SValeria Barra                                       ug[i+Q*1],
161cb32e2e7SValeria Barra                                       ug[i+Q*2]
162cb32e2e7SValeria Barra                                      };
163cb32e2e7SValeria Barra     // Read qdata (dXdxdXdxT symmetric matrix)
164ed264d09SValeria Barra     const CeedScalar dXdxdXdxT[3][3] = {{qdata[i+0*Q],
165ed264d09SValeria Barra                                          qdata[i+1*Q],
166ed264d09SValeria Barra                                          qdata[i+2*Q]},
167ed264d09SValeria Barra                                         {qdata[i+1*Q],
168ed264d09SValeria Barra                                          qdata[i+3*Q],
169ed264d09SValeria Barra                                          qdata[i+4*Q]},
170ed264d09SValeria Barra                                         {qdata[i+2*Q],
171ed264d09SValeria Barra                                          qdata[i+4*Q],
172ed264d09SValeria Barra                                          qdata[i+5*Q]}
173cb32e2e7SValeria Barra                                        };
174cb32e2e7SValeria Barra 
175cb32e2e7SValeria Barra     for (int j=0; j<3; j++) // j = direction of vg
176cb32e2e7SValeria Barra       vg[i+j*Q] = (du[0] * dXdxdXdxT[0][j] +
177cb32e2e7SValeria Barra                    du[1] * dXdxdXdxT[1][j] +
178cb32e2e7SValeria Barra                    du[2] * dXdxdXdxT[2][j]);
179cb32e2e7SValeria Barra 
180cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
181cb32e2e7SValeria Barra   return 0;
182cb32e2e7SValeria Barra }
183cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
184f6b55d2cSvaleriabarra 
185f6b55d2cSvaleriabarra #endif // bp3_h
186