xref: /libCEED/examples/ceed/ex2-surface.h (revision d1d35e2f02dc969aee8debf3fd943dd784aa847a)
// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1666087c08SValeria Barra 
17e3bad73bSvaleriabarra #ifndef ex2_surface_h
18e3bad73bSvaleriabarra #define ex2_surface_h
19e3bad73bSvaleriabarra 
2066087c08SValeria Barra /// A structure used to pass additional data to f_build_diff
2166087c08SValeria Barra struct BuildContext { CeedInt dim, space_dim; };
2266087c08SValeria Barra 
2366087c08SValeria Barra /// libCEED Q-function for building quadrature data for a diffusion operator
2466087c08SValeria Barra CEED_QFUNCTION(f_build_diff)(void *ctx, const CeedInt Q,
2566087c08SValeria Barra                              const CeedScalar *const *in, CeedScalar *const *out) {
2666087c08SValeria Barra   struct BuildContext *bc = (struct BuildContext *)ctx;
2766087c08SValeria Barra   // in[0] is Jacobians with shape [dim, nc=dim, Q]
2866087c08SValeria Barra   // in[1] is quadrature weights, size (Q)
2966087c08SValeria Barra   //
3066087c08SValeria Barra   // At every quadrature point, compute w/det(J).adj(J).adj(J)^T and store
3166087c08SValeria Barra   // the symmetric part of the result.
3266087c08SValeria Barra   const CeedScalar *J = in[0], *w = in[1];
33*d1d35e2fSjeremylt   CeedScalar *q_data = out[0];
3466087c08SValeria Barra 
3566087c08SValeria Barra   switch (bc->dim + 10*bc->space_dim) {
3666087c08SValeria Barra   case 11:
3766087c08SValeria Barra     CeedPragmaSIMD
3866087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
39*d1d35e2fSjeremylt       q_data[i] = w[i] / J[i];
4066087c08SValeria Barra     } // End of Quadrature Point Loop
4166087c08SValeria Barra     break;
4266087c08SValeria Barra   case 22:
4366087c08SValeria Barra     CeedPragmaSIMD
4466087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
45*d1d35e2fSjeremylt       // J: 0 2   q_data: 0 2   adj(J):  J22 -J12
4666087c08SValeria Barra       //    1 3          2 1           -J21  J11
4766087c08SValeria Barra       const CeedScalar J11 = J[i+Q*0];
4866087c08SValeria Barra       const CeedScalar J21 = J[i+Q*1];
4966087c08SValeria Barra       const CeedScalar J12 = J[i+Q*2];
5066087c08SValeria Barra       const CeedScalar J22 = J[i+Q*3];
5166087c08SValeria Barra       const CeedScalar qw = w[i] / (J11*J22 - J21*J12);
52*d1d35e2fSjeremylt       q_data[i+Q*0] =   qw * (J12*J12 + J22*J22);
53*d1d35e2fSjeremylt       q_data[i+Q*1] =   qw * (J11*J11 + J21*J21);
54*d1d35e2fSjeremylt       q_data[i+Q*2] = - qw * (J11*J12 + J21*J22);
5566087c08SValeria Barra     } // End of Quadrature Point Loop
5666087c08SValeria Barra     break;
5766087c08SValeria Barra   case 33:
5866087c08SValeria Barra     CeedPragmaSIMD
5966087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
6066087c08SValeria Barra       // Compute the adjoint
6166087c08SValeria Barra       CeedScalar A[3][3];
6266087c08SValeria Barra       for (CeedInt j=0; j<3; j++)
6366087c08SValeria Barra         for (CeedInt k=0; k<3; k++)
6466087c08SValeria Barra           // Equivalent code with J as a VLA and no mod operations:
6566087c08SValeria Barra           // A[k][j] = J[j+1][k+1]*J[j+2][k+2] - J[j+1][k+2]*J[j+2][k+1]
6666087c08SValeria Barra           A[k][j] = J[i+Q*((j+1)%3+3*((k+1)%3))]*J[i+Q*((j+2)%3+3*((k+2)%3))] -
6766087c08SValeria Barra                     J[i+Q*((j+1)%3+3*((k+2)%3))]*J[i+Q*((j+2)%3+3*((k+1)%3))];
6866087c08SValeria Barra 
6966087c08SValeria Barra       // Compute quadrature weight / det(J)
7066087c08SValeria Barra       const CeedScalar qw = w[i] / (J[i+Q*0]*A[0][0] + J[i+Q*1]*A[1][1] +
7166087c08SValeria Barra                                     J[i+Q*2]*A[2][2]);
7266087c08SValeria Barra 
7366087c08SValeria Barra       // Compute geometric factors
7466087c08SValeria Barra       // Stored in Voigt convention
7566087c08SValeria Barra       // 0 5 4
7666087c08SValeria Barra       // 5 1 3
7766087c08SValeria Barra       // 4 3 2
78*d1d35e2fSjeremylt       q_data[i+Q*0] = qw * (A[0][0]*A[0][0] + A[0][1]*A[0][1] + A[0][2]*A[0][2]);
79*d1d35e2fSjeremylt       q_data[i+Q*1] = qw * (A[1][0]*A[1][0] + A[1][1]*A[1][1] + A[1][2]*A[1][2]);
80*d1d35e2fSjeremylt       q_data[i+Q*2] = qw * (A[2][0]*A[2][0] + A[2][1]*A[2][1] + A[2][2]*A[2][2]);
81*d1d35e2fSjeremylt       q_data[i+Q*3] = qw * (A[1][0]*A[2][0] + A[1][1]*A[2][1] + A[1][2]*A[2][2]);
82*d1d35e2fSjeremylt       q_data[i+Q*4] = qw * (A[0][0]*A[2][0] + A[0][1]*A[2][1] + A[0][2]*A[2][2]);
83*d1d35e2fSjeremylt       q_data[i+Q*5] = qw * (A[0][0]*A[1][0] + A[0][1]*A[1][1] + A[0][2]*A[1][2]);
8466087c08SValeria Barra     } // End of Quadrature Point Loop
8566087c08SValeria Barra     break;
8666087c08SValeria Barra   }
8766087c08SValeria Barra   return 0;
8866087c08SValeria Barra }
8966087c08SValeria Barra 
9066087c08SValeria Barra /// libCEED Q-function for applying a diff operator
9166087c08SValeria Barra CEED_QFUNCTION(f_apply_diff)(void *ctx, const CeedInt Q,
9266087c08SValeria Barra                              const CeedScalar *const *in, CeedScalar *const *out) {
9366087c08SValeria Barra   struct BuildContext *bc = (struct BuildContext *)ctx;
9466087c08SValeria Barra   // in[0], out[0] have shape [dim, nc=1, Q]
95*d1d35e2fSjeremylt   const CeedScalar *ug = in[0], *q_data = in[1];
9666087c08SValeria Barra   CeedScalar *vg = out[0];
9766087c08SValeria Barra 
9866087c08SValeria Barra   switch (bc->dim) {
9966087c08SValeria Barra   case 1:
10066087c08SValeria Barra     CeedPragmaSIMD
10166087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
102*d1d35e2fSjeremylt       vg[i] = ug[i] * q_data[i];
10366087c08SValeria Barra     } // End of Quadrature Point Loop
10466087c08SValeria Barra     break;
10566087c08SValeria Barra   case 2:
10666087c08SValeria Barra     CeedPragmaSIMD
10766087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
10866087c08SValeria Barra       // Read spatial derivatives of u
10966087c08SValeria Barra       const CeedScalar du[2]        =  {ug[i+Q*0],
11066087c08SValeria Barra                                         ug[i+Q*1]
11166087c08SValeria Barra                                        };
11266087c08SValeria Barra 
113*d1d35e2fSjeremylt       // Read q_data (dXdxdXdx_T symmetric matrix)
11466087c08SValeria Barra       // Stored in Voigt convention
11566087c08SValeria Barra       // 0 2
11666087c08SValeria Barra       // 2 1
11766087c08SValeria Barra       // *INDENT-OFF*
118*d1d35e2fSjeremylt       const CeedScalar dXdxdXdx_T[2][2] = {{q_data[i+0*Q],
119*d1d35e2fSjeremylt                                             q_data[i+2*Q]},
120*d1d35e2fSjeremylt                                            {q_data[i+2*Q],
121*d1d35e2fSjeremylt                                             q_data[i+1*Q]}};
12266087c08SValeria Barra       // *INDENT-ON*
12366087c08SValeria Barra       // j = direction of vg
12466087c08SValeria Barra       for (int j=0; j<2; j++)
125*d1d35e2fSjeremylt         vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] +
126*d1d35e2fSjeremylt                      du[1] * dXdxdXdx_T[1][j]);
12766087c08SValeria Barra     } // End of Quadrature Point Loop
12866087c08SValeria Barra     break;
12966087c08SValeria Barra   case 3:
13066087c08SValeria Barra     CeedPragmaSIMD
13166087c08SValeria Barra     for (CeedInt i=0; i<Q; i++) {
13266087c08SValeria Barra       // Read spatial derivatives of u
13366087c08SValeria Barra       const CeedScalar du[3]        =  {ug[i+Q*0],
13466087c08SValeria Barra                                         ug[i+Q*1],
13566087c08SValeria Barra                                         ug[i+Q*2]
13666087c08SValeria Barra                                        };
13766087c08SValeria Barra 
138*d1d35e2fSjeremylt       // Read q_data (dXdxdXdx_T symmetric matrix)
13966087c08SValeria Barra       // Stored in Voigt convention
14066087c08SValeria Barra       // 0 5 4
14166087c08SValeria Barra       // 5 1 3
14266087c08SValeria Barra       // 4 3 2
14366087c08SValeria Barra       // *INDENT-OFF*
144*d1d35e2fSjeremylt       const CeedScalar dXdxdXdx_T[3][3] = {{q_data[i+0*Q],
145*d1d35e2fSjeremylt                                             q_data[i+5*Q],
146*d1d35e2fSjeremylt                                             q_data[i+4*Q]},
147*d1d35e2fSjeremylt                                            {q_data[i+5*Q],
148*d1d35e2fSjeremylt                                             q_data[i+1*Q],
149*d1d35e2fSjeremylt                                             q_data[i+3*Q]},
150*d1d35e2fSjeremylt                                            {q_data[i+4*Q],
151*d1d35e2fSjeremylt                                             q_data[i+3*Q],
152*d1d35e2fSjeremylt                                             q_data[i+2*Q]}
15366087c08SValeria Barra                                           };
15466087c08SValeria Barra       // *INDENT-ON*
15566087c08SValeria Barra       // j = direction of vg
15666087c08SValeria Barra       for (int j=0; j<3; j++)
157*d1d35e2fSjeremylt         vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] +
158*d1d35e2fSjeremylt                      du[1] * dXdxdXdx_T[1][j] +
159*d1d35e2fSjeremylt                      du[2] * dXdxdXdx_T[2][j]);
16066087c08SValeria Barra     } // End of Quadrature Point Loop
16166087c08SValeria Barra     break;
16266087c08SValeria Barra   }
16366087c08SValeria Barra   return 0;
16466087c08SValeria Barra }
165e3bad73bSvaleriabarra 
166e3bad73bSvaleriabarra #endif // ex2_surface_h
167