// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1666087c08SValeria Barra 17*e3bad73bSvaleriabarra #ifndef ex2_surface_h 18*e3bad73bSvaleriabarra #define ex2_surface_h 19*e3bad73bSvaleriabarra #include <ceed.h> 20*e3bad73bSvaleriabarra 2166087c08SValeria Barra /// A structure used to pass additional data to f_build_diff 2266087c08SValeria Barra struct BuildContext { CeedInt dim, space_dim; }; 2366087c08SValeria Barra 2466087c08SValeria Barra /// libCEED Q-function for building quadrature data for a diffusion operator 2566087c08SValeria Barra CEED_QFUNCTION(f_build_diff)(void *ctx, const CeedInt Q, 2666087c08SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 2766087c08SValeria Barra struct BuildContext *bc = (struct BuildContext *)ctx; 2866087c08SValeria Barra // in[0] is Jacobians with shape [dim, nc=dim, Q] 2966087c08SValeria Barra // in[1] is quadrature weights, size (Q) 3066087c08SValeria Barra // 3166087c08SValeria Barra // At every quadrature point, compute w/det(J).adj(J).adj(J)^T and store 3266087c08SValeria Barra // the symmetric part of the result. 
3366087c08SValeria Barra const CeedScalar *J = in[0], *w = in[1]; 3466087c08SValeria Barra CeedScalar *qdata = out[0]; 3566087c08SValeria Barra 3666087c08SValeria Barra switch (bc->dim + 10*bc->space_dim) { 3766087c08SValeria Barra case 11: 3866087c08SValeria Barra CeedPragmaSIMD 3966087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 4066087c08SValeria Barra qdata[i] = w[i] / J[i]; 4166087c08SValeria Barra } // End of Quadrature Point Loop 4266087c08SValeria Barra break; 4366087c08SValeria Barra case 22: 4466087c08SValeria Barra CeedPragmaSIMD 4566087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 4666087c08SValeria Barra // J: 0 2 qdata: 0 2 adj(J): J22 -J12 4766087c08SValeria Barra // 1 3 2 1 -J21 J11 4866087c08SValeria Barra const CeedScalar J11 = J[i+Q*0]; 4966087c08SValeria Barra const CeedScalar J21 = J[i+Q*1]; 5066087c08SValeria Barra const CeedScalar J12 = J[i+Q*2]; 5166087c08SValeria Barra const CeedScalar J22 = J[i+Q*3]; 5266087c08SValeria Barra const CeedScalar qw = w[i] / (J11*J22 - J21*J12); 5366087c08SValeria Barra qdata[i+Q*0] = qw * (J12*J12 + J22*J22); 5466087c08SValeria Barra qdata[i+Q*1] = qw * (J11*J11 + J21*J21); 5566087c08SValeria Barra qdata[i+Q*2] = - qw * (J11*J12 + J21*J22); 5666087c08SValeria Barra } // End of Quadrature Point Loop 5766087c08SValeria Barra break; 5866087c08SValeria Barra case 33: 5966087c08SValeria Barra CeedPragmaSIMD 6066087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 6166087c08SValeria Barra // Compute the adjoint 6266087c08SValeria Barra CeedScalar A[3][3]; 6366087c08SValeria Barra for (CeedInt j=0; j<3; j++) 6466087c08SValeria Barra for (CeedInt k=0; k<3; k++) 6566087c08SValeria Barra // Equivalent code with J as a VLA and no mod operations: 6666087c08SValeria Barra // A[k][j] = J[j+1][k+1]*J[j+2][k+2] - J[j+1][k+2]*J[j+2][k+1] 6766087c08SValeria Barra A[k][j] = J[i+Q*((j+1)%3+3*((k+1)%3))]*J[i+Q*((j+2)%3+3*((k+2)%3))] - 6866087c08SValeria Barra J[i+Q*((j+1)%3+3*((k+2)%3))]*J[i+Q*((j+2)%3+3*((k+1)%3))]; 
6966087c08SValeria Barra 7066087c08SValeria Barra // Compute quadrature weight / det(J) 7166087c08SValeria Barra const CeedScalar qw = w[i] / (J[i+Q*0]*A[0][0] + J[i+Q*1]*A[1][1] + 7266087c08SValeria Barra J[i+Q*2]*A[2][2]); 7366087c08SValeria Barra 7466087c08SValeria Barra // Compute geometric factors 7566087c08SValeria Barra // Stored in Voigt convention 7666087c08SValeria Barra // 0 5 4 7766087c08SValeria Barra // 5 1 3 7866087c08SValeria Barra // 4 3 2 7966087c08SValeria Barra qdata[i+Q*0] = qw * (A[0][0]*A[0][0] + A[0][1]*A[0][1] + A[0][2]*A[0][2]); 8066087c08SValeria Barra qdata[i+Q*1] = qw * (A[1][0]*A[1][0] + A[1][1]*A[1][1] + A[1][2]*A[1][2]); 8166087c08SValeria Barra qdata[i+Q*2] = qw * (A[2][0]*A[2][0] + A[2][1]*A[2][1] + A[2][2]*A[2][2]); 8266087c08SValeria Barra qdata[i+Q*3] = qw * (A[1][0]*A[2][0] + A[1][1]*A[2][1] + A[1][2]*A[2][2]); 8366087c08SValeria Barra qdata[i+Q*4] = qw * (A[0][0]*A[2][0] + A[0][1]*A[2][1] + A[0][2]*A[2][2]); 8466087c08SValeria Barra qdata[i+Q*5] = qw * (A[0][0]*A[1][0] + A[0][1]*A[1][1] + A[0][2]*A[1][2]); 8566087c08SValeria Barra } // End of Quadrature Point Loop 8666087c08SValeria Barra break; 8766087c08SValeria Barra } 8866087c08SValeria Barra return 0; 8966087c08SValeria Barra } 9066087c08SValeria Barra 9166087c08SValeria Barra /// libCEED Q-function for applying a diff operator 9266087c08SValeria Barra CEED_QFUNCTION(f_apply_diff)(void *ctx, const CeedInt Q, 9366087c08SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 9466087c08SValeria Barra struct BuildContext *bc = (struct BuildContext *)ctx; 9566087c08SValeria Barra // in[0], out[0] have shape [dim, nc=1, Q] 9666087c08SValeria Barra const CeedScalar *ug = in[0], *qdata = in[1]; 9766087c08SValeria Barra CeedScalar *vg = out[0]; 9866087c08SValeria Barra 9966087c08SValeria Barra switch (bc->dim) { 10066087c08SValeria Barra case 1: 10166087c08SValeria Barra CeedPragmaSIMD 10266087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 10366087c08SValeria Barra 
vg[i] = ug[i] * qdata[i]; 10466087c08SValeria Barra } // End of Quadrature Point Loop 10566087c08SValeria Barra break; 10666087c08SValeria Barra case 2: 10766087c08SValeria Barra CeedPragmaSIMD 10866087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 10966087c08SValeria Barra // Read spatial derivatives of u 11066087c08SValeria Barra const CeedScalar du[2] = {ug[i+Q*0], 11166087c08SValeria Barra ug[i+Q*1] 11266087c08SValeria Barra }; 11366087c08SValeria Barra 11466087c08SValeria Barra // Read qdata (dXdxdXdxT symmetric matrix) 11566087c08SValeria Barra // Stored in Voigt convention 11666087c08SValeria Barra // 0 2 11766087c08SValeria Barra // 2 1 11866087c08SValeria Barra // *INDENT-OFF* 11966087c08SValeria Barra const CeedScalar dXdxdXdxT[2][2] = {{qdata[i+0*Q], 12066087c08SValeria Barra qdata[i+2*Q]}, 12166087c08SValeria Barra {qdata[i+2*Q], 12266087c08SValeria Barra qdata[i+1*Q]}}; 12366087c08SValeria Barra // *INDENT-ON* 12466087c08SValeria Barra // j = direction of vg 12566087c08SValeria Barra for (int j=0; j<2; j++) 12666087c08SValeria Barra vg[i+j*Q] = (du[0] * dXdxdXdxT[0][j] + 12766087c08SValeria Barra du[1] * dXdxdXdxT[1][j]); 12866087c08SValeria Barra } // End of Quadrature Point Loop 12966087c08SValeria Barra break; 13066087c08SValeria Barra case 3: 13166087c08SValeria Barra CeedPragmaSIMD 13266087c08SValeria Barra for (CeedInt i=0; i<Q; i++) { 13366087c08SValeria Barra // Read spatial derivatives of u 13466087c08SValeria Barra const CeedScalar du[3] = {ug[i+Q*0], 13566087c08SValeria Barra ug[i+Q*1], 13666087c08SValeria Barra ug[i+Q*2] 13766087c08SValeria Barra }; 13866087c08SValeria Barra 13966087c08SValeria Barra // Read qdata (dXdxdXdxT symmetric matrix) 14066087c08SValeria Barra // Stored in Voigt convention 14166087c08SValeria Barra // 0 5 4 14266087c08SValeria Barra // 5 1 3 14366087c08SValeria Barra // 4 3 2 14466087c08SValeria Barra // *INDENT-OFF* 14566087c08SValeria Barra const CeedScalar dXdxdXdxT[3][3] = {{qdata[i+0*Q], 14666087c08SValeria 
Barra qdata[i+5*Q], 14766087c08SValeria Barra qdata[i+4*Q]}, 14866087c08SValeria Barra {qdata[i+5*Q], 14966087c08SValeria Barra qdata[i+1*Q], 15066087c08SValeria Barra qdata[i+3*Q]}, 15166087c08SValeria Barra {qdata[i+4*Q], 15266087c08SValeria Barra qdata[i+3*Q], 15366087c08SValeria Barra qdata[i+2*Q]} 15466087c08SValeria Barra }; 15566087c08SValeria Barra // *INDENT-ON* 15666087c08SValeria Barra // j = direction of vg 15766087c08SValeria Barra for (int j=0; j<3; j++) 15866087c08SValeria Barra vg[i+j*Q] = (du[0] * dXdxdXdxT[0][j] + 15966087c08SValeria Barra du[1] * dXdxdXdxT[1][j] + 16066087c08SValeria Barra du[2] * dXdxdXdxT[2][j]); 16166087c08SValeria Barra } // End of Quadrature Point Loop 16266087c08SValeria Barra break; 16366087c08SValeria Barra } 16466087c08SValeria Barra return 0; 16566087c08SValeria Barra } 166*e3bad73bSvaleriabarra 167*e3bad73bSvaleriabarra #endif // ex2_surface_h 168