13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3cb32e2e7SValeria Barra // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5cb32e2e7SValeria Barra // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7cb32e2e7SValeria Barra 8cb32e2e7SValeria Barra /// @file 9cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc 10cb32e2e7SValeria Barra 1113921685Svaleriabarra #ifndef bp3_h 1213921685Svaleriabarra #define bp3_h 1313921685Svaleriabarra 14c9c2c079SJeremy L Thompson #include <ceed.h> 1513921685Svaleriabarra #include <math.h> 1613921685Svaleriabarra 17e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 18ed264d09SValeria Barra // This QFunction sets up the geometric factors required to apply the 19ed264d09SValeria Barra // diffusion operator 20ed264d09SValeria Barra // 21ed264d09SValeria Barra // We require the product of the inverse of the Jacobian and its transpose to 22ed264d09SValeria Barra // properly compute integrals of the form: int( gradv gradu) 23ed264d09SValeria Barra // 24ed264d09SValeria Barra // Determinant of Jacobian: 25ed264d09SValeria Barra // detJ = J11*A11 + J21*A12 + J31*A13 26ed264d09SValeria Barra // Jij = Jacobian entry ij 27ed264d09SValeria Barra // Aij = Adjoint ij 28ed264d09SValeria Barra // 29ed264d09SValeria Barra // Inverse of Jacobian: 30ed264d09SValeria Barra // Bij = Aij / detJ 31ed264d09SValeria Barra // 32ed264d09SValeria Barra // Product of Inverse and Transpose: 33ed264d09SValeria Barra // BBij = sum( Bik Bkj ) 34ed264d09SValeria Barra // 35ed264d09SValeria Barra // Stored: w B^T B detJ = w A^T A / detJ 36ed264d09SValeria Barra // Note: This matrix is symmetric, so we only store 6 distinct entries 37*0a8fc04aSrezgarshakeri // qd: 1 4 7 38ed264d09SValeria Barra // 2 5 8 39*0a8fc04aSrezgarshakeri // 3 6 9 40cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 41cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q, 42cb32e2e7SValeria Barra const CeedScalar *const *in, 43cb32e2e7SValeria Barra CeedScalar *const *out) { 44d4d45553Srezgarshakeri // Inputs 45d4d45553Srezgarshakeri const CeedScalar(*J)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1]; 46d4d45553Srezgarshakeri const CeedScalar(*w) = in[2]; // Note: *X = in[0] 47d4d45553Srezgarshakeri // Outputs 48d4d45553Srezgarshakeri CeedScalar(*qd) = out[0]; 49cb32e2e7SValeria Barra 50d4d45553Srezgarshakeri const CeedInt dim = 3; 51cb32e2e7SValeria Barra // Quadrature Point Loop 52cb32e2e7SValeria Barra CeedPragmaSIMD 53cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 54d4d45553Srezgarshakeri // Setup 55d4d45553Srezgarshakeri CeedScalar A[3][3]; 56d4d45553Srezgarshakeri for (CeedInt j = 0; j < dim; j++) { 57d4d45553Srezgarshakeri for (CeedInt k = 0; k < dim; k++) { 58d4d45553Srezgarshakeri // Equivalent code with no mod operations: 59d4d45553Srezgarshakeri // A[k][j] = J[k+1][j+1]*J[k+2][j+2] - J[k+1][j+2]*J[k+2][j+1] 60d4d45553Srezgarshakeri A[k][j] = J[(k + 1) % dim][(j + 1) % dim][i] * J[(k + 2) % dim][(j + 2) % dim][i] - 61d4d45553Srezgarshakeri J[(k + 1) % dim][(j + 2) % dim][i] * J[(k + 2) % dim][(j + 1) % dim][i]; 62d4d45553Srezgarshakeri } 63d4d45553Srezgarshakeri } 64d4d45553Srezgarshakeri const CeedScalar detJ = J[0][0][i] * A[0][0] + J[0][1][i] * A[0][1] + J[0][2][i] * A[0][2]; 65d4d45553Srezgarshakeri 66d4d45553Srezgarshakeri const CeedScalar qw = w[i] / detJ; 67*0a8fc04aSrezgarshakeri qd[i+Q*0] = w[i] * detJ; 68*0a8fc04aSrezgarshakeri qd[i+Q*1] = qw * (A[0][0]*A[0][0] + A[0][1]*A[0][1] + A[0][2]*A[0][2]); 69*0a8fc04aSrezgarshakeri qd[i+Q*2] = qw * (A[0][0]*A[1][0] + A[0][1]*A[1][1] + A[0][2]*A[1][2]); 70*0a8fc04aSrezgarshakeri qd[i+Q*3] = qw * (A[0][0]*A[2][0] + A[0][1]*A[2][1] + A[0][2]*A[2][2]); 71*0a8fc04aSrezgarshakeri qd[i+Q*4] = qw * (A[1][0]*A[1][0] + A[1][1]*A[1][1] + A[1][2]*A[1][2]); 72*0a8fc04aSrezgarshakeri qd[i+Q*5] = qw * (A[1][0]*A[2][0] + A[1][1]*A[2][1] + A[1][2]*A[2][2]); 73*0a8fc04aSrezgarshakeri qd[i+Q*6] = qw * (A[2][0]*A[2][0] + A[2][1]*A[2][1] + A[2][2]*A[2][2]); 74cb32e2e7SValeria Barra } // End of Quadrature Point Loop 75cb32e2e7SValeria Barra 76cb32e2e7SValeria Barra return 0; 77cb32e2e7SValeria Barra } 78cb32e2e7SValeria Barra 79e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 80ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem 81cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 82cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q, 83cb32e2e7SValeria Barra const CeedScalar *const *in, 84cb32e2e7SValeria Barra CeedScalar *const *out) { 85cb32e2e7SValeria Barra #ifndef M_PI 86cb32e2e7SValeria Barra # define M_PI 3.14159265358979323846 87cb32e2e7SValeria Barra #endif 88e83e87a5Sjeremylt const CeedScalar *x = in[0], *w = in[1]; 89cb32e2e7SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 90cb32e2e7SValeria Barra 91cb32e2e7SValeria Barra // Quadrature Point Loop 92cb32e2e7SValeria Barra CeedPragmaSIMD 93cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 94cb32e2e7SValeria Barra const CeedScalar c[3] = { 0, 1., 2. }; 95cb32e2e7SValeria Barra const CeedScalar k[3] = { 1., 2., 3. }; 96cb32e2e7SValeria Barra 97cb32e2e7SValeria Barra true_soln[i] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) * 98cb32e2e7SValeria Barra sin(M_PI*(c[1] + k[1]*x[i+Q*1])) * 99cb32e2e7SValeria Barra sin(M_PI*(c[2] + k[2]*x[i+Q*2])); 100cb32e2e7SValeria Barra 101*0a8fc04aSrezgarshakeri rhs[i] = w[i+Q*0] * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) * 102cb32e2e7SValeria Barra true_soln[i]; 103cb32e2e7SValeria Barra } // End of Quadrature Point Loop 104cb32e2e7SValeria Barra 105cb32e2e7SValeria Barra return 0; 106cb32e2e7SValeria Barra } 107cb32e2e7SValeria Barra 108e83e87a5Sjeremylt // ----------------------------------------------------------------------------- 109ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field. 110ed264d09SValeria Barra // 111ed264d09SValeria Barra // Inputs: 112ed264d09SValeria Barra // ug - Input vector gradient at quadrature points 1139b072555Sjeremylt // q_data - Geometric factors 114ed264d09SValeria Barra // 115ed264d09SValeria Barra // Output: 116ed264d09SValeria Barra // vg - Output vector (test functions) gradient at quadrature points 117ed264d09SValeria Barra // 118cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 119cb32e2e7SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q, 120cb32e2e7SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 1219b072555Sjeremylt const CeedScalar *ug = in[0], *q_data = in[1]; 122cb32e2e7SValeria Barra CeedScalar *vg = out[0]; 123cb32e2e7SValeria Barra 124cb32e2e7SValeria Barra // Quadrature Point Loop 125cb32e2e7SValeria Barra CeedPragmaSIMD 126cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 127cb32e2e7SValeria Barra // Read spatial derivatives of u 128cb32e2e7SValeria Barra const CeedScalar du[3] = {ug[i+Q*0], 129cb32e2e7SValeria Barra ug[i+Q*1], 130cb32e2e7SValeria Barra ug[i+Q*2] 131cb32e2e7SValeria Barra }; 1329b072555Sjeremylt // Read q_data (dXdxdXdx_T symmetric matrix) 133*0a8fc04aSrezgarshakeri const CeedScalar dXdxdXdx_T[3][3] = {{q_data[i+1*Q], 134*0a8fc04aSrezgarshakeri q_data[i+2*Q], 135*0a8fc04aSrezgarshakeri q_data[i+3*Q]}, 1369b072555Sjeremylt {q_data[i+2*Q], 1379b072555Sjeremylt q_data[i+4*Q], 138*0a8fc04aSrezgarshakeri q_data[i+5*Q]}, 139*0a8fc04aSrezgarshakeri {q_data[i+3*Q], 140*0a8fc04aSrezgarshakeri q_data[i+5*Q], 141*0a8fc04aSrezgarshakeri q_data[i+6*Q]} 142cb32e2e7SValeria Barra }; 143cb32e2e7SValeria Barra 144cb32e2e7SValeria Barra for (int j=0; j<3; j++) // j = direction of vg 1459b072555Sjeremylt vg[i+j*Q] = (du[0] * dXdxdXdx_T[0][j] + 1469b072555Sjeremylt du[1] * dXdxdXdx_T[1][j] + 1479b072555Sjeremylt du[2] * dXdxdXdx_T[2][j]); 148cb32e2e7SValeria Barra 149cb32e2e7SValeria Barra } // End of Quadrature Point Loop 150cb32e2e7SValeria Barra return 0; 151cb32e2e7SValeria Barra } 152cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 153f6b55d2cSvaleriabarra 154f6b55d2cSvaleriabarra #endif // bp3_h 155