// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1666087c08SValeria Barra 17e3bad73bSvaleriabarra #ifndef ex2_surface_h 18e3bad73bSvaleriabarra #define ex2_surface_h 19e3bad73bSvaleriabarra 2066087c08SValeria Barra /// A structure used to pass additional data to f_build_diff 2166087c08SValeria Barra struct BuildContext { CeedInt dim, space_dim; }; 2266087c08SValeria Barra 2366087c08SValeria Barra /// libCEED Q-function for building quadrature data for a diffusion operator 2466087c08SValeria Barra CEED_QFUNCTION(f_build_diff)(void *ctx, const CeedInt Q, 2566087c08SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 2666087c08SValeria Barra struct BuildContext *bc = (struct BuildContext *)ctx; 2766087c08SValeria Barra // in[0] is Jacobians with shape [dim, nc=dim, Q] 2866087c08SValeria Barra // in[1] is quadrature weights, size (Q) 2966087c08SValeria Barra // 3066087c08SValeria Barra // At every quadrature point, compute w/det(J).adj(J).adj(J)^T and store 3166087c08SValeria Barra // the symmetric part of the result. 3266087c08SValeria Barra const CeedScalar *J = in[0], *w = in[1]; 33*d1d35e2fSjeremylt CeedScalar *q_data = out[0]; 3466087c08SValeria Barra 3566087c08SValeria Barra switch (bc->dim + 10*bc->space_dim) { 3666087c08SValeria Barra case 11: 3766087c08SValeria Barra CeedPragmaSIMD 3866087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 39*d1d35e2fSjeremylt q_data[i] = w[i] / J[i]; 4066087c08SValeria Barra } // End of Quadrature Point Loop 4166087c08SValeria Barra break; 4266087c08SValeria Barra case 22: 4366087c08SValeria Barra CeedPragmaSIMD 4466087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 45*d1d35e2fSjeremylt // J: 0 2 q_data: 0 2 adj(J): J22 -J12 4666087c08SValeria Barra // 1 3 2 1 -J21 J11 4766087c08SValeria Barra const CeedScalar J11 = J[i+Q*0]; 4866087c08SValeria Barra const CeedScalar J21 = J[i+Q*1]; 4966087c08SValeria Barra const CeedScalar J12 = J[i+Q*2]; 5066087c08SValeria Barra const CeedScalar J22 = J[i+Q*3]; 5166087c08SValeria Barra const CeedScalar qw = w[i] / (J11*J22 - 
J21*J12); 52*d1d35e2fSjeremylt q_data[i+Q*0] = qw * (J12*J12 + J22*J22); 53*d1d35e2fSjeremylt q_data[i+Q*1] = qw * (J11*J11 + J21*J21); 54*d1d35e2fSjeremylt q_data[i+Q*2] = - qw * (J11*J12 + J21*J22); 5566087c08SValeria Barra } // End of Quadrature Point Loop 5666087c08SValeria Barra break; 5766087c08SValeria Barra case 33: 5866087c08SValeria Barra CeedPragmaSIMD 5966087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 6066087c08SValeria Barra // Compute the adjoint 6166087c08SValeria Barra CeedScalar A[3][3]; 6266087c08SValeria Barra for (CeedInt j=0; j<3; j++) 6366087c08SValeria Barra for (CeedInt k=0; k<3; k++) 6466087c08SValeria Barra // Equivalent code with J as a VLA and no mod operations: 6566087c08SValeria Barra // A[k][j] = J[j+1][k+1]*J[j+2][k+2] - J[j+1][k+2]*J[j+2][k+1] 6666087c08SValeria Barra A[k][j] = J[i+Q*((j+1)%3+3*((k+1)%3))]*J[i+Q*((j+2)%3+3*((k+2)%3))] - 6766087c08SValeria Barra J[i+Q*((j+1)%3+3*((k+2)%3))]*J[i+Q*((j+2)%3+3*((k+1)%3))]; 6866087c08SValeria Barra 6966087c08SValeria Barra // Compute quadrature weight / det(J) 7066087c08SValeria Barra const CeedScalar qw = w[i] / (J[i+Q*0]*A[0][0] + J[i+Q*1]*A[1][1] + 7166087c08SValeria Barra J[i+Q*2]*A[2][2]); 7266087c08SValeria Barra 7366087c08SValeria Barra // Compute geometric factors 7466087c08SValeria Barra // Stored in Voigt convention 7566087c08SValeria Barra // 0 5 4 7666087c08SValeria Barra // 5 1 3 7766087c08SValeria Barra // 4 3 2 78*d1d35e2fSjeremylt q_data[i+Q*0] = qw * (A[0][0]*A[0][0] + A[0][1]*A[0][1] + A[0][2]*A[0][2]); 79*d1d35e2fSjeremylt q_data[i+Q*1] = qw * (A[1][0]*A[1][0] + A[1][1]*A[1][1] + A[1][2]*A[1][2]); 80*d1d35e2fSjeremylt q_data[i+Q*2] = qw * (A[2][0]*A[2][0] + A[2][1]*A[2][1] + A[2][2]*A[2][2]); 81*d1d35e2fSjeremylt q_data[i+Q*3] = qw * (A[1][0]*A[2][0] + A[1][1]*A[2][1] + A[1][2]*A[2][2]); 82*d1d35e2fSjeremylt q_data[i+Q*4] = qw * (A[0][0]*A[2][0] + A[0][1]*A[2][1] + A[0][2]*A[2][2]); 83*d1d35e2fSjeremylt q_data[i+Q*5] = qw * (A[0][0]*A[1][0] + A[0][1]*A[1][1] + 
A[0][2]*A[1][2]); 8466087c08SValeria Barra } // End of Quadrature Point Loop 8566087c08SValeria Barra break; 8666087c08SValeria Barra } 8766087c08SValeria Barra return 0; 8866087c08SValeria Barra } 8966087c08SValeria Barra 9066087c08SValeria Barra /// libCEED Q-function for applying a diff operator 9166087c08SValeria Barra CEED_QFUNCTION(f_apply_diff)(void *ctx, const CeedInt Q, 9266087c08SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 9366087c08SValeria Barra struct BuildContext *bc = (struct BuildContext *)ctx; 9466087c08SValeria Barra // in[0], out[0] have shape [dim, nc=1, Q] 95*d1d35e2fSjeremylt const CeedScalar *ug = in[0], *q_data = in[1]; 9666087c08SValeria Barra CeedScalar *vg = out[0]; 9766087c08SValeria Barra 9866087c08SValeria Barra switch (bc->dim) { 9966087c08SValeria Barra case 1: 10066087c08SValeria Barra CeedPragmaSIMD 10166087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 102*d1d35e2fSjeremylt vg[i] = ug[i] * q_data[i]; 10366087c08SValeria Barra } // End of Quadrature Point Loop 10466087c08SValeria Barra break; 10566087c08SValeria Barra case 2: 10666087c08SValeria Barra CeedPragmaSIMD 10766087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 10866087c08SValeria Barra // Read spatial derivatives of u 10966087c08SValeria Barra const CeedScalar du[2] = {ug[i+Q*0], 11066087c08SValeria Barra ug[i+Q*1] 11166087c08SValeria Barra }; 11266087c08SValeria Barra 113*d1d35e2fSjeremylt // Read q_data (dXdxdXdx_T symmetric matrix) 11466087c08SValeria Barra // Stored in Voigt convention 11566087c08SValeria Barra // 0 2 11666087c08SValeria Barra // 2 1 11766087c08SValeria Barra // *INDENT-OFF* 118*d1d35e2fSjeremylt const CeedScalar dXdxdXdx_T[2][2] = {{q_data[i+0*Q], 119*d1d35e2fSjeremylt q_data[i+2*Q]}, 120*d1d35e2fSjeremylt {q_data[i+2*Q], 121*d1d35e2fSjeremylt q_data[i+1*Q]}}; 12266087c08SValeria Barra // *INDENT-ON* 12366087c08SValeria Barra // j = direction of vg 12466087c08SValeria Barra for (int j=0; j<2; j++) 125*d1d35e2fSjeremylt 
vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] + 126*d1d35e2fSjeremylt du[1] * dXdxdXdx_T[1][j]); 12766087c08SValeria Barra } // End of Quadrature Point Loop 12866087c08SValeria Barra break; 12966087c08SValeria Barra case 3: 13066087c08SValeria Barra CeedPragmaSIMD 13166087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 13266087c08SValeria Barra // Read spatial derivatives of u 13366087c08SValeria Barra const CeedScalar du[3] = {ug[i+Q*0], 13466087c08SValeria Barra ug[i+Q*1], 13566087c08SValeria Barra ug[i+Q*2] 13666087c08SValeria Barra }; 13766087c08SValeria Barra 138*d1d35e2fSjeremylt // Read q_data (dXdxdXdx_T symmetric matrix) 13966087c08SValeria Barra // Stored in Voigt convention 14066087c08SValeria Barra // 0 5 4 14166087c08SValeria Barra // 5 1 3 14266087c08SValeria Barra // 4 3 2 14366087c08SValeria Barra // *INDENT-OFF* 144*d1d35e2fSjeremylt const CeedScalar dXdxdXdx_T[3][3] = {{q_data[i+0*Q], 145*d1d35e2fSjeremylt q_data[i+5*Q], 146*d1d35e2fSjeremylt q_data[i+4*Q]}, 147*d1d35e2fSjeremylt {q_data[i+5*Q], 148*d1d35e2fSjeremylt q_data[i+1*Q], 149*d1d35e2fSjeremylt q_data[i+3*Q]}, 150*d1d35e2fSjeremylt {q_data[i+4*Q], 151*d1d35e2fSjeremylt q_data[i+3*Q], 152*d1d35e2fSjeremylt q_data[i+2*Q]} 15366087c08SValeria Barra }; 15466087c08SValeria Barra // *INDENT-ON* 15566087c08SValeria Barra // j = direction of vg 15666087c08SValeria Barra for (int j=0; j<3; j++) 157*d1d35e2fSjeremylt vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] + 158*d1d35e2fSjeremylt du[1] * dXdxdXdx_T[1][j] + 159*d1d35e2fSjeremylt du[2] * dXdxdXdx_T[2][j]); 16066087c08SValeria Barra } // End of Quadrature Point Loop 16166087c08SValeria Barra break; 16266087c08SValeria Barra } 16366087c08SValeria Barra return 0; 16466087c08SValeria Barra } 165e3bad73bSvaleriabarra 166e3bad73bSvaleriabarra #endif // ex2_surface_h 167