// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16cb32e2e7SValeria Barra 17cb32e2e7SValeria Barra /// @file 18cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc 19cb32e2e7SValeria Barra 20ed264d09SValeria Barra // ***************************************************************************** 21ed264d09SValeria Barra // This QFunction sets up the geometric factors required to apply the 22ed264d09SValeria Barra // diffusion operator 23ed264d09SValeria Barra // 24ed264d09SValeria Barra // We require the product of the inverse of the Jacobian and its transpose to 25ed264d09SValeria Barra // properly compute integrals of the form: int( gradv gradu) 26ed264d09SValeria Barra // 27ed264d09SValeria Barra // Determinant of Jacobian: 28ed264d09SValeria Barra // detJ = J11*A11 + J21*A12 + J31*A13 29ed264d09SValeria Barra // Jij = Jacobian entry ij 30ed264d09SValeria Barra // Aij = Adjoint ij 31ed264d09SValeria Barra // 32ed264d09SValeria Barra // Inverse of Jacobian: 33ed264d09SValeria Barra // Bij = Aij / detJ 34ed264d09SValeria Barra // 35ed264d09SValeria Barra // Product of Inverse and Transpose: 36ed264d09SValeria Barra // BBij = sum( Bik Bkj ) 37ed264d09SValeria Barra // 38ed264d09SValeria Barra // Stored: w B^T B detJ = w A^T A / detJ 39ed264d09SValeria Barra // Note: This matrix is symmetric, so we only store 6 distinct entries 40ed264d09SValeria Barra // qd: 0 3 6 41ed264d09SValeria Barra // 1 4 7 42ed264d09SValeria Barra // 2 5 8 43ed264d09SValeria Barra // ***************************************************************************** 44ed264d09SValeria Barra 45*f6b55d2cSvaleriabarra #ifndef bp3_h 46*f6b55d2cSvaleriabarra #define bp3_h 47*f6b55d2cSvaleriabarra #include <ceed.h> 48*f6b55d2cSvaleriabarra 49*f6b55d2cSvaleriabarra #ifndef __CUDACC__ 50*f6b55d2cSvaleriabarra # include <math.h> 51*f6b55d2cSvaleriabarra #endif 52*f6b55d2cSvaleriabarra 53cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 54cb32e2e7SValeria Barra 
CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q, 55cb32e2e7SValeria Barra const CeedScalar *const *in, 56cb32e2e7SValeria Barra CeedScalar *const *out) { 57cb32e2e7SValeria Barra const CeedScalar *J = in[0], *w = in[1]; 58cb32e2e7SValeria Barra CeedScalar *qd = out[0]; 59cb32e2e7SValeria Barra 60cb32e2e7SValeria Barra // Quadrature Point Loop 61cb32e2e7SValeria Barra CeedPragmaSIMD 62cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 63cb32e2e7SValeria Barra const CeedScalar J11 = J[i+Q*0]; 64cb32e2e7SValeria Barra const CeedScalar J21 = J[i+Q*1]; 65cb32e2e7SValeria Barra const CeedScalar J31 = J[i+Q*2]; 66cb32e2e7SValeria Barra const CeedScalar J12 = J[i+Q*3]; 67cb32e2e7SValeria Barra const CeedScalar J22 = J[i+Q*4]; 68cb32e2e7SValeria Barra const CeedScalar J32 = J[i+Q*5]; 69cb32e2e7SValeria Barra const CeedScalar J13 = J[i+Q*6]; 70cb32e2e7SValeria Barra const CeedScalar J23 = J[i+Q*7]; 71cb32e2e7SValeria Barra const CeedScalar J33 = J[i+Q*8]; 72cb32e2e7SValeria Barra const CeedScalar A11 = J22*J33 - J23*J32; 73cb32e2e7SValeria Barra const CeedScalar A12 = J13*J32 - J12*J33; 74cb32e2e7SValeria Barra const CeedScalar A13 = J12*J23 - J13*J22; 75cb32e2e7SValeria Barra const CeedScalar A21 = J23*J31 - J21*J33; 76cb32e2e7SValeria Barra const CeedScalar A22 = J11*J33 - J13*J31; 77cb32e2e7SValeria Barra const CeedScalar A23 = J13*J21 - J11*J23; 78cb32e2e7SValeria Barra const CeedScalar A31 = J21*J32 - J22*J31; 79cb32e2e7SValeria Barra const CeedScalar A32 = J12*J31 - J11*J32; 80cb32e2e7SValeria Barra const CeedScalar A33 = J11*J22 - J12*J21; 81cb32e2e7SValeria Barra const CeedScalar qw = w[i] / (J11*A11 + J21*A12 + J31*A13); 82cb32e2e7SValeria Barra qd[i+Q*0] = qw * (A11*A11 + A12*A12 + A13*A13); 83cb32e2e7SValeria Barra qd[i+Q*1] = qw * (A11*A21 + A12*A22 + A13*A23); 84cb32e2e7SValeria Barra qd[i+Q*2] = qw * (A11*A31 + A12*A32 + A13*A33); 85cb32e2e7SValeria Barra qd[i+Q*3] = qw * (A21*A21 + A22*A22 + A23*A23); 86cb32e2e7SValeria Barra qd[i+Q*4] = qw * (A21*A31 + 
A22*A32 + A23*A33); 87cb32e2e7SValeria Barra qd[i+Q*5] = qw * (A31*A31 + A32*A32 + A33*A33); 88cb32e2e7SValeria Barra } // End of Quadrature Point Loop 89cb32e2e7SValeria Barra 90cb32e2e7SValeria Barra return 0; 91cb32e2e7SValeria Barra } 92cb32e2e7SValeria Barra 93ed264d09SValeria Barra // ***************************************************************************** 94ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem 95ed264d09SValeria Barra // ***************************************************************************** 96ed264d09SValeria Barra 97cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 98cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q, 99cb32e2e7SValeria Barra const CeedScalar *const *in, 100cb32e2e7SValeria Barra CeedScalar *const *out) { 101cb32e2e7SValeria Barra #ifndef M_PI 102cb32e2e7SValeria Barra # define M_PI 3.14159265358979323846 103cb32e2e7SValeria Barra #endif 104cb32e2e7SValeria Barra const CeedScalar *x = in[0], *J = in[1], *w = in[2]; 105cb32e2e7SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 106cb32e2e7SValeria Barra 107cb32e2e7SValeria Barra // Quadrature Point Loop 108cb32e2e7SValeria Barra CeedPragmaSIMD 109cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 110cb32e2e7SValeria Barra const CeedScalar J11 = J[i+Q*0]; 111cb32e2e7SValeria Barra const CeedScalar J21 = J[i+Q*1]; 112cb32e2e7SValeria Barra const CeedScalar J31 = J[i+Q*2]; 113cb32e2e7SValeria Barra const CeedScalar J12 = J[i+Q*3]; 114cb32e2e7SValeria Barra const CeedScalar J22 = J[i+Q*4]; 115cb32e2e7SValeria Barra const CeedScalar J32 = J[i+Q*5]; 116cb32e2e7SValeria Barra const CeedScalar J13 = J[i+Q*6]; 117cb32e2e7SValeria Barra const CeedScalar J23 = J[i+Q*7]; 118cb32e2e7SValeria Barra const CeedScalar J33 = J[i+Q*8]; 119cb32e2e7SValeria Barra const CeedScalar A11 = J22*J33 - J23*J32; 120cb32e2e7SValeria Barra const CeedScalar A12 = J13*J32 
- J12*J33; 121cb32e2e7SValeria Barra const CeedScalar A13 = J12*J23 - J13*J22; 122cb32e2e7SValeria Barra 123cb32e2e7SValeria Barra const CeedScalar c[3] = { 0, 1., 2. }; 124cb32e2e7SValeria Barra const CeedScalar k[3] = { 1., 2., 3. }; 125cb32e2e7SValeria Barra 126cb32e2e7SValeria Barra true_soln[i] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) * 127cb32e2e7SValeria Barra sin(M_PI*(c[1] + k[1]*x[i+Q*1])) * 128cb32e2e7SValeria Barra sin(M_PI*(c[2] + k[2]*x[i+Q*2])); 129cb32e2e7SValeria Barra 130cb32e2e7SValeria Barra const CeedScalar rho = w[i] * (J11*A11 + J21*A12 + J31*A13); 131cb32e2e7SValeria Barra rhs[i] = rho * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) * 132cb32e2e7SValeria Barra true_soln[i]; 133cb32e2e7SValeria Barra } // End of Quadrature Point Loop 134cb32e2e7SValeria Barra 135cb32e2e7SValeria Barra return 0; 136cb32e2e7SValeria Barra } 137cb32e2e7SValeria Barra 138ed264d09SValeria Barra // ***************************************************************************** 139ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field. 
140ed264d09SValeria Barra // 141ed264d09SValeria Barra // Inputs: 142ed264d09SValeria Barra // ug - Input vector gradient at quadrature points 143ed264d09SValeria Barra // qdata - Geometric factors 144ed264d09SValeria Barra // 145ed264d09SValeria Barra // Output: 146ed264d09SValeria Barra // vg - Output vector (test functions) gradient at quadrature points 147ed264d09SValeria Barra // 148ed264d09SValeria Barra // ***************************************************************************** 149ed264d09SValeria Barra 150cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 151cb32e2e7SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q, 152cb32e2e7SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 153ed264d09SValeria Barra const CeedScalar *ug = in[0], *qdata = in[1]; 154cb32e2e7SValeria Barra CeedScalar *vg = out[0]; 155cb32e2e7SValeria Barra 156cb32e2e7SValeria Barra // Quadrature Point Loop 157cb32e2e7SValeria Barra CeedPragmaSIMD 158cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 159cb32e2e7SValeria Barra // Read spatial derivatives of u 160cb32e2e7SValeria Barra const CeedScalar du[3] = {ug[i+Q*0], 161cb32e2e7SValeria Barra ug[i+Q*1], 162cb32e2e7SValeria Barra ug[i+Q*2] 163cb32e2e7SValeria Barra }; 164cb32e2e7SValeria Barra // Read qdata (dXdxdXdxT symmetric matrix) 165ed264d09SValeria Barra const CeedScalar dXdxdXdxT[3][3] = {{qdata[i+0*Q], 166ed264d09SValeria Barra qdata[i+1*Q], 167ed264d09SValeria Barra qdata[i+2*Q]}, 168ed264d09SValeria Barra {qdata[i+1*Q], 169ed264d09SValeria Barra qdata[i+3*Q], 170ed264d09SValeria Barra qdata[i+4*Q]}, 171ed264d09SValeria Barra {qdata[i+2*Q], 172ed264d09SValeria Barra qdata[i+4*Q], 173ed264d09SValeria Barra qdata[i+5*Q]} 174cb32e2e7SValeria Barra }; 175cb32e2e7SValeria Barra 176cb32e2e7SValeria Barra for (int j=0; j<3; j++) // j = direction of vg 177cb32e2e7SValeria Barra vg[i+j*Q] = (du[0] * dXdxdXdxT[0][j] + 178cb32e2e7SValeria Barra du[1] * 
dXdxdXdxT[1][j] + 179cb32e2e7SValeria Barra du[2] * dXdxdXdxT[2][j]); 180cb32e2e7SValeria Barra 181cb32e2e7SValeria Barra } // End of Quadrature Point Loop 182cb32e2e7SValeria Barra return 0; 183cb32e2e7SValeria Barra } 184cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 185*f6b55d2cSvaleriabarra 186*f6b55d2cSvaleriabarra #endif // bp3_h 187