1ed264d09SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at 2ed264d09SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights 3ed264d09SValeria Barra // reserved. See files LICENSE and NOTICE for details. 4ed264d09SValeria Barra // 5ed264d09SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software 6ed264d09SValeria Barra // libraries and APIs for efficient high-order finite element and spectral 7ed264d09SValeria Barra // element discretizations for exascale applications. For more information and 8ed264d09SValeria Barra // source code availability see http://github.com/ceed. 9ed264d09SValeria Barra // 10ed264d09SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, 11ed264d09SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office 12ed264d09SValeria Barra // of Science and the National Nuclear Security Administration) responsible for 13ed264d09SValeria Barra // the planning and preparation of a capable exascale ecosystem, including 14ed264d09SValeria Barra // software, applications, hardware, advanced system engineering and early 15ed264d09SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative. 16ed264d09SValeria Barra 17ed264d09SValeria Barra /// @file 18ed264d09SValeria Barra /// libCEED QFunctions for diffusion operator example for a scalar field on the sphere using PETSc 19ed264d09SValeria Barra 20*f6b55d2cSvaleriabarra #ifndef bp3sphere_h 21*f6b55d2cSvaleriabarra #define bp3sphere_h 22*f6b55d2cSvaleriabarra #include <ceed.h> 23*f6b55d2cSvaleriabarra 24ed264d09SValeria Barra #ifndef __CUDACC__ 25ed264d09SValeria Barra # include <math.h> 26ed264d09SValeria Barra #endif 27ed264d09SValeria Barra 28ed264d09SValeria Barra // ***************************************************************************** 29ed264d09SValeria Barra // This QFunction sets up the geometric factors required for integration and 30ed264d09SValeria Barra // coordinate transformations when reference coordinates have a different 31ed264d09SValeria Barra // dimension than the one of physical coordinates 32ed264d09SValeria Barra // 33ed264d09SValeria Barra // Reference (parent) 2D coordinates: X \in [-1, 1]^2 34ed264d09SValeria Barra // 35ed264d09SValeria Barra // Global 3D physical coordinates given by the mesh: xx \in [-R, R]^3 36ed264d09SValeria Barra // with R radius of the sphere 37ed264d09SValeria Barra // 38ed264d09SValeria Barra // Local 3D physical coordinates on the 2D manifold: x \in [-l, l]^3 39ed264d09SValeria Barra // with l half edge of the cube inscribed in the sphere 40ed264d09SValeria Barra // 41ed264d09SValeria Barra // Change of coordinates matrix computed by the library: 42ed264d09SValeria Barra // (physical 3D coords relative to reference 2D coords) 43ed264d09SValeria Barra // dxx_j/dX_i (indicial notation) [3 * 2] 44ed264d09SValeria Barra // 45ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to xx (phyisical 3D): 46ed264d09SValeria Barra // dx_i/dxx_j (indicial notation) [3 * 3] 47ed264d09SValeria Barra // 48ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to X (reference 2D): 49ed264d09SValeria Barra // (by chain rule) 50ed264d09SValeria Barra // dx_i/dX_j [3 * 2] = dx_i/dxx_k [3 * 3] * dxx_k/dX_j [3 * 2] 51ed264d09SValeria Barra // 52ed264d09SValeria Barra // modJ is given by the magnitude of the cross product of the columns of dx_i/dX_j 53ed264d09SValeria Barra // 54ed264d09SValeria Barra // The quadrature data is stored in the array qdata. 55ed264d09SValeria Barra // 56ed264d09SValeria Barra // We require the determinant of the Jacobian to properly compute integrals of 57ed264d09SValeria Barra // the form: int( u v ) 58ed264d09SValeria Barra // 59ed264d09SValeria Barra // qdata[0]: modJ * w 60ed264d09SValeria Barra // 61ed264d09SValeria Barra // We use the Moore–Penrose (left) pseudoinverse of dx_i/dX_j, to compute dX_i/dx_j (and its transpose), 62ed264d09SValeria Barra // needed to properly compute integrals of the form: int( gradv gradu ) 63ed264d09SValeria Barra // 64ed264d09SValeria Barra // dX_i/dx_j [2 * 3] = (dx_i/dX_j)+ = (dxdX^T dxdX)^(-1) dxdX 65ed264d09SValeria Barra // 66ac4340cfSJed Brown // and the product simplifies to yield the contravariant metric tensor 67ac4340cfSJed Brown // 68ac4340cfSJed Brown // g^{ij} = dX_i/dx_k dX_j/dx_k = (dxdX^T dxdX)^{-1} 69ac4340cfSJed Brown // 7008fade8cSvaleriabarra // Stored: g^{ij} (in Voigt convention) in 7108fade8cSvaleriabarra // 7208fade8cSvaleriabarra // qdata[1:3]: [dXdxdXdxT00 dXdxdXdxT01] 7308fade8cSvaleriabarra // [dXdxdXdxT01 dXdxdXdxT11] 74ed264d09SValeria Barra // ***************************************************************************** 75ed264d09SValeria Barra 76ed264d09SValeria Barra // ----------------------------------------------------------------------------- 77ed264d09SValeria Barra CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q, 78ed264d09SValeria Barra const CeedScalar *const *in, 79ed264d09SValeria Barra CeedScalar *const *out) { 80ed264d09SValeria Barra const CeedScalar *X = in[0], *J = in[1], *w = in[2]; 81ed264d09SValeria Barra CeedScalar *qdata = out[0]; 82ed264d09SValeria Barra 83ed264d09SValeria Barra // Quadrature Point Loop 84ed264d09SValeria Barra CeedPragmaSIMD 85ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 86ed264d09SValeria Barra // Read global Cartesian coordinates 87ed264d09SValeria Barra const CeedScalar xx[3] = {X[i+0*Q], 88ed264d09SValeria Barra X[i+1*Q], 89ed264d09SValeria Barra X[i+2*Q] 90ed264d09SValeria Barra }; 91ed264d09SValeria Barra 92ed264d09SValeria Barra // Read dxxdX Jacobian entries, stored as 93ed264d09SValeria Barra // 0 3 94ed264d09SValeria Barra // 1 4 95ed264d09SValeria Barra // 2 5 96ed264d09SValeria Barra const CeedScalar dxxdX[3][2] = {{J[i+Q*0], 97ed264d09SValeria Barra J[i+Q*3]}, 98ed264d09SValeria Barra {J[i+Q*1], 99ed264d09SValeria Barra J[i+Q*4]}, 100ed264d09SValeria Barra {J[i+Q*2], 101ed264d09SValeria Barra J[i+Q*5]} 102ed264d09SValeria Barra }; 103ed264d09SValeria Barra 104ed264d09SValeria Barra // Setup 105ed264d09SValeria Barra // x = xx (xx^T xx)^{-1/2} 106ed264d09SValeria Barra // dx/dxx = I (xx^T xx)^{-1/2} - xx xx^T (xx^T xx)^{-3/2} 107ed264d09SValeria Barra const CeedScalar modxxsq = xx[0]*xx[0]+xx[1]*xx[1]+xx[2]*xx[2]; 108ed264d09SValeria Barra CeedScalar xxsq[3][3]; 109ed264d09SValeria Barra for (int j=0; j<3; j++) 110ed264d09SValeria Barra for (int k=0; k<3; k++) 111ed264d09SValeria Barra xxsq[j][k] = xx[j]*xx[k] / (sqrt(modxxsq) * modxxsq); 112ed264d09SValeria Barra 113ed264d09SValeria Barra const CeedScalar dxdxx[3][3] = {{1./sqrt(modxxsq) - xxsq[0][0], 114ed264d09SValeria Barra -xxsq[0][1], 115ed264d09SValeria Barra -xxsq[0][2]}, 116ed264d09SValeria Barra {-xxsq[1][0], 117ed264d09SValeria Barra 1./sqrt(modxxsq) - xxsq[1][1], 118ed264d09SValeria Barra -xxsq[1][2]}, 119ed264d09SValeria Barra {-xxsq[2][0], 120ed264d09SValeria Barra -xxsq[2][1], 121ed264d09SValeria Barra 1./sqrt(modxxsq) - xxsq[2][2]} 122ed264d09SValeria Barra }; 123ed264d09SValeria Barra 124ed264d09SValeria Barra CeedScalar dxdX[3][2]; 125ed264d09SValeria Barra for (int j=0; j<3; j++) 126ed264d09SValeria Barra for (int k=0; k<2; k++) { 127ed264d09SValeria Barra dxdX[j][k] = 0; 128ed264d09SValeria Barra for (int l=0; l<3; l++) 129ed264d09SValeria Barra dxdX[j][k] += dxdxx[j][l]*dxxdX[l][k]; 130ed264d09SValeria Barra } 131ed264d09SValeria Barra 132ed264d09SValeria Barra // J is given by the cross product of the columns of dxdX 133ed264d09SValeria Barra const CeedScalar J[3]= {dxdX[1][0]*dxdX[2][1] - dxdX[2][0]*dxdX[1][1], 134ed264d09SValeria Barra dxdX[2][0]*dxdX[0][1] - dxdX[0][0]*dxdX[2][1], 135ed264d09SValeria Barra dxdX[0][0]*dxdX[1][1] - dxdX[1][0]*dxdX[0][1] 136ed264d09SValeria Barra }; 137ed264d09SValeria Barra 138ed264d09SValeria Barra // Use the magnitude of J as our detJ (volume scaling factor) 139ed264d09SValeria Barra const CeedScalar modJ = sqrt(J[0]*J[0]+J[1]*J[1]+J[2]*J[2]); 140ed264d09SValeria Barra 141ed264d09SValeria Barra // Interp-to-Interp qdata 142ed264d09SValeria Barra qdata[i+Q*0] = modJ * w[i]; 143ed264d09SValeria Barra 14408fade8cSvaleriabarra // dxdX_k,j * dxdX_j,k 145ed264d09SValeria Barra CeedScalar dxdXTdxdX[2][2]; 146ed264d09SValeria Barra for (int j=0; j<2; j++) 147ed264d09SValeria Barra for (int k=0; k<2; k++) { 148ed264d09SValeria Barra dxdXTdxdX[j][k] = 0; 149ed264d09SValeria Barra for (int l=0; l<3; l++) 150ed264d09SValeria Barra dxdXTdxdX[j][k] += dxdX[l][j]*dxdX[l][k]; 151ed264d09SValeria Barra } 152ed264d09SValeria Barra 153ed264d09SValeria Barra const CeedScalar detdxdXTdxdX = dxdXTdxdX[0][0] * dxdXTdxdX[1][1] 154ed264d09SValeria Barra -dxdXTdxdX[1][0] * dxdXTdxdX[0][1]; 155ed264d09SValeria Barra 15608fade8cSvaleriabarra // Compute inverse of dxdXTdxdX, which is the 2x2 contravariant metric tensor g^{ij} 157ed264d09SValeria Barra CeedScalar dxdXTdxdXinv[2][2]; 158ed264d09SValeria Barra dxdXTdxdXinv[0][0] = dxdXTdxdX[1][1] / detdxdXTdxdX; 159ed264d09SValeria Barra dxdXTdxdXinv[0][1] = -dxdXTdxdX[0][1] / detdxdXTdxdX; 160ed264d09SValeria Barra dxdXTdxdXinv[1][0] = -dxdXTdxdX[1][0] / detdxdXTdxdX; 161ed264d09SValeria Barra dxdXTdxdXinv[1][1] = dxdXTdxdX[0][0] / detdxdXTdxdX; 162ed264d09SValeria Barra 163ed264d09SValeria Barra // Stored in Voigt convention 164ac4340cfSJed Brown qdata[i+Q*1] = dxdXTdxdXinv[0][0]; 165ac4340cfSJed Brown qdata[i+Q*2] = dxdXTdxdXinv[1][1]; 166ac4340cfSJed Brown qdata[i+Q*3] = dxdXTdxdXinv[0][1]; 167ed264d09SValeria Barra } // End of Quadrature Point Loop 168ed264d09SValeria Barra 169ed264d09SValeria Barra // Return 170ed264d09SValeria Barra return 0; 171ed264d09SValeria Barra } 172ed264d09SValeria Barra 173ed264d09SValeria Barra // ***************************************************************************** 174ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem 175ed264d09SValeria Barra // ***************************************************************************** 176ed264d09SValeria Barra 177ed264d09SValeria Barra // ----------------------------------------------------------------------------- 178ed264d09SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q, 179ed264d09SValeria Barra const CeedScalar *const *in, 180ed264d09SValeria Barra CeedScalar *const *out) { 181ed264d09SValeria Barra // Inputs 182ed264d09SValeria Barra const CeedScalar *X = in[0], *qdata = in[1]; 183ed264d09SValeria Barra // Outputs 184ed264d09SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 185ed264d09SValeria Barra 186ed264d09SValeria Barra // Context 187ed264d09SValeria Barra const CeedScalar *context = (const CeedScalar*)ctx; 188ed264d09SValeria Barra const CeedScalar R = context[0]; 189ed264d09SValeria Barra 190ed264d09SValeria Barra // Quadrature Point Loop 191ed264d09SValeria Barra CeedPragmaSIMD 192ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 193ed264d09SValeria Barra // Read global Cartesian coordinates 194ed264d09SValeria Barra CeedScalar x = X[i+Q*0], y = X[i+Q*1], z = X[i+Q*2]; 195ed264d09SValeria Barra // Normalize quadrature point coordinates to sphere 196ed264d09SValeria Barra CeedScalar rad = sqrt(x*x + y*y + z*z); 197ed264d09SValeria Barra x *= R / rad; 198ed264d09SValeria Barra y *= R / rad; 199ed264d09SValeria Barra z *= R / rad; 200ed264d09SValeria Barra // Compute latitude and longitude 201ed264d09SValeria Barra const CeedScalar theta = asin(z / R); // latitude 202ed264d09SValeria Barra const CeedScalar lambda = atan2(y, x); // longitude 203ed264d09SValeria Barra 204ed264d09SValeria Barra true_soln[i+Q*0] = sin(lambda) * cos(theta); 205ed264d09SValeria Barra 206ed264d09SValeria Barra rhs[i+Q*0] = qdata[i+Q*0] * 2 * sin(lambda)*cos(theta) / (R*R); 207ed264d09SValeria Barra 208ed264d09SValeria Barra } // End of Quadrature Point Loop 209ed264d09SValeria Barra 210ed264d09SValeria Barra return 0; 211ed264d09SValeria Barra } 212ed264d09SValeria Barra 213ed264d09SValeria Barra // ***************************************************************************** 214ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field. 215ed264d09SValeria Barra // 216ed264d09SValeria Barra // Inputs: 217ed264d09SValeria Barra // ug - Input vector gradient at quadrature points 218ed264d09SValeria Barra // qdata - Geometric factors 219ed264d09SValeria Barra // 220ed264d09SValeria Barra // Output: 221ed264d09SValeria Barra // vg - Output vector (test functions) gradient at quadrature points 222ed264d09SValeria Barra // 223ed264d09SValeria Barra // ***************************************************************************** 224ed264d09SValeria Barra 225ed264d09SValeria Barra // ----------------------------------------------------------------------------- 226ed264d09SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q, 227ed264d09SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 228ed264d09SValeria Barra // Inputs 229ed264d09SValeria Barra const CeedScalar *ug = in[0], *qdata = in[1]; 230ed264d09SValeria Barra // Outputs 231ed264d09SValeria Barra CeedScalar *vg = out[0]; 232ed264d09SValeria Barra 233ed264d09SValeria Barra // Quadrature Point Loop 234ed264d09SValeria Barra CeedPragmaSIMD 235ed264d09SValeria Barra for (CeedInt i=0; i<Q; i++) { 236ed264d09SValeria Barra // Read spatial derivatives of u 237ed264d09SValeria Barra const CeedScalar du[2] = {ug[i+Q*0], 238ed264d09SValeria Barra ug[i+Q*1] 239ed264d09SValeria Barra }; 240ed264d09SValeria Barra // Read qdata 241ed264d09SValeria Barra const CeedScalar wJ = qdata[i+Q*0]; 242ed264d09SValeria Barra // -- Grad-to-Grad qdata 243ed264d09SValeria Barra // ---- dXdx_j,k * dXdx_k,j 244ed264d09SValeria Barra const CeedScalar dXdxdXdxT[2][2] = {{qdata[i+Q*1], 245ed264d09SValeria Barra qdata[i+Q*3]}, 246ed264d09SValeria Barra {qdata[i+Q*3], 247ed264d09SValeria Barra qdata[i+Q*2]} 248ed264d09SValeria Barra }; 249ed264d09SValeria Barra 250ed264d09SValeria Barra for (int j=0; j<2; j++) // j = direction of vg 251ed264d09SValeria Barra vg[i+j*Q] = wJ * (du[0] * dXdxdXdxT[0][j] + 252ed264d09SValeria Barra du[1] * dXdxdXdxT[1][j]); 253ed264d09SValeria Barra 254ed264d09SValeria Barra } // End of Quadrature Point Loop 255ed264d09SValeria Barra 256ed264d09SValeria Barra return 0; 257ed264d09SValeria Barra } 258ed264d09SValeria Barra // ----------------------------------------------------------------------------- 259*f6b55d2cSvaleriabarra 260*f6b55d2cSvaleriabarra #endif // bp3sphere_h 261