xref: /libCEED/examples/petsc/qfunctions/bps/bp3sphere.h (revision f6b55d2cd51f3d398370612efe4c4d20233baf37)
1ed264d09SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
2ed264d09SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
3ed264d09SValeria Barra // reserved. See files LICENSE and NOTICE for details.
4ed264d09SValeria Barra //
5ed264d09SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software
6ed264d09SValeria Barra // libraries and APIs for efficient high-order finite element and spectral
7ed264d09SValeria Barra // element discretizations for exascale applications. For more information and
8ed264d09SValeria Barra // source code availability see http://github.com/ceed.
9ed264d09SValeria Barra //
10ed264d09SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11ed264d09SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office
12ed264d09SValeria Barra // of Science and the National Nuclear Security Administration) responsible for
13ed264d09SValeria Barra // the planning and preparation of a capable exascale ecosystem, including
14ed264d09SValeria Barra // software, applications, hardware, advanced system engineering and early
15ed264d09SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative.
16ed264d09SValeria Barra 
17ed264d09SValeria Barra /// @file
18ed264d09SValeria Barra /// libCEED QFunctions for diffusion operator example for a scalar field on the sphere using PETSc
19ed264d09SValeria Barra 
20*f6b55d2cSvaleriabarra #ifndef bp3sphere_h
21*f6b55d2cSvaleriabarra #define bp3sphere_h
22*f6b55d2cSvaleriabarra #include <ceed.h>
23*f6b55d2cSvaleriabarra 
24ed264d09SValeria Barra #ifndef __CUDACC__
25ed264d09SValeria Barra #  include <math.h>
26ed264d09SValeria Barra #endif
27ed264d09SValeria Barra 
28ed264d09SValeria Barra // *****************************************************************************
29ed264d09SValeria Barra // This QFunction sets up the geometric factors required for integration and
30ed264d09SValeria Barra //   coordinate transformations when reference coordinates have a different
31ed264d09SValeria Barra //   dimension than the one of physical coordinates
32ed264d09SValeria Barra //
33ed264d09SValeria Barra // Reference (parent) 2D coordinates: X \in [-1, 1]^2
34ed264d09SValeria Barra //
35ed264d09SValeria Barra // Global 3D physical coordinates given by the mesh: xx \in [-R, R]^3
36ed264d09SValeria Barra //   with R radius of the sphere
37ed264d09SValeria Barra //
38ed264d09SValeria Barra // Local 3D physical coordinates on the 2D manifold: x \in [-l, l]^3
39ed264d09SValeria Barra //   with l half edge of the cube inscribed in the sphere
40ed264d09SValeria Barra //
41ed264d09SValeria Barra // Change of coordinates matrix computed by the library:
42ed264d09SValeria Barra //   (physical 3D coords relative to reference 2D coords)
43ed264d09SValeria Barra //   dxx_j/dX_i (indicial notation) [3 * 2]
44ed264d09SValeria Barra //
45ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to xx (physical 3D):
46ed264d09SValeria Barra //   dx_i/dxx_j (indicial notation) [3 * 3]
47ed264d09SValeria Barra //
48ed264d09SValeria Barra // Change of coordinates x (on the 2D manifold) relative to X (reference 2D):
49ed264d09SValeria Barra //   (by chain rule)
50ed264d09SValeria Barra //   dx_i/dX_j [3 * 2] = dx_i/dxx_k [3 * 3] * dxx_k/dX_j [3 * 2]
51ed264d09SValeria Barra //
52ed264d09SValeria Barra // modJ is given by the magnitude of the cross product of the columns of dx_i/dX_j
53ed264d09SValeria Barra //
54ed264d09SValeria Barra // The quadrature data is stored in the array qdata.
55ed264d09SValeria Barra //
56ed264d09SValeria Barra // We require the determinant of the Jacobian to properly compute integrals of
57ed264d09SValeria Barra //   the form: int( u v )
58ed264d09SValeria Barra //
59ed264d09SValeria Barra // qdata[0]: modJ * w
60ed264d09SValeria Barra //
61ed264d09SValeria Barra // We use the Moore–Penrose (left) pseudoinverse of dx_i/dX_j, to compute dX_i/dx_j (and its transpose),
62ed264d09SValeria Barra //   needed to properly compute integrals of the form: int( gradv gradu )
63ed264d09SValeria Barra //
64ed264d09SValeria Barra // dX_i/dx_j [2 * 3] = (dx_i/dX_j)+ = (dxdX^T dxdX)^(-1) dxdX^T
65ed264d09SValeria Barra //
66ac4340cfSJed Brown // and the product simplifies to yield the contravariant metric tensor
67ac4340cfSJed Brown //
68ac4340cfSJed Brown // g^{ij} = dX_i/dx_k dX_j/dx_k = (dxdX^T dxdX)^{-1}
69ac4340cfSJed Brown //
7008fade8cSvaleriabarra // Stored: g^{ij} (in Voigt convention) in
7108fade8cSvaleriabarra //
7208fade8cSvaleriabarra //   qdata[1:3]: [dXdxdXdxT00 dXdxdXdxT01]
7308fade8cSvaleriabarra //               [dXdxdXdxT01 dXdxdXdxT11]
74ed264d09SValeria Barra // *****************************************************************************
75ed264d09SValeria Barra 
76ed264d09SValeria Barra // -----------------------------------------------------------------------------
77ed264d09SValeria Barra CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q,
78ed264d09SValeria Barra                              const CeedScalar *const *in,
79ed264d09SValeria Barra                              CeedScalar *const *out) {
80ed264d09SValeria Barra   const CeedScalar *X = in[0], *J = in[1], *w = in[2];
81ed264d09SValeria Barra   CeedScalar *qdata = out[0];
82ed264d09SValeria Barra 
83ed264d09SValeria Barra   // Quadrature Point Loop
84ed264d09SValeria Barra   CeedPragmaSIMD
85ed264d09SValeria Barra   for (CeedInt i=0; i<Q; i++) {
86ed264d09SValeria Barra     // Read global Cartesian coordinates
87ed264d09SValeria Barra     const CeedScalar xx[3] = {X[i+0*Q],
88ed264d09SValeria Barra                               X[i+1*Q],
89ed264d09SValeria Barra                               X[i+2*Q]
90ed264d09SValeria Barra                              };
91ed264d09SValeria Barra 
92ed264d09SValeria Barra     // Read dxxdX Jacobian entries, stored as
93ed264d09SValeria Barra     // 0 3
94ed264d09SValeria Barra     // 1 4
95ed264d09SValeria Barra     // 2 5
96ed264d09SValeria Barra     const CeedScalar dxxdX[3][2] = {{J[i+Q*0],
97ed264d09SValeria Barra                                      J[i+Q*3]},
98ed264d09SValeria Barra                                     {J[i+Q*1],
99ed264d09SValeria Barra                                      J[i+Q*4]},
100ed264d09SValeria Barra                                     {J[i+Q*2],
101ed264d09SValeria Barra                                      J[i+Q*5]}
102ed264d09SValeria Barra                                    };
103ed264d09SValeria Barra 
104ed264d09SValeria Barra     // Setup
105ed264d09SValeria Barra     // x = xx (xx^T xx)^{-1/2}
106ed264d09SValeria Barra     // dx/dxx = I (xx^T xx)^{-1/2} - xx xx^T (xx^T xx)^{-3/2}
107ed264d09SValeria Barra     const CeedScalar modxxsq = xx[0]*xx[0]+xx[1]*xx[1]+xx[2]*xx[2];
108ed264d09SValeria Barra     CeedScalar xxsq[3][3];
109ed264d09SValeria Barra     for (int j=0; j<3; j++)
110ed264d09SValeria Barra       for (int k=0; k<3; k++)
111ed264d09SValeria Barra         xxsq[j][k] = xx[j]*xx[k] / (sqrt(modxxsq) * modxxsq);
112ed264d09SValeria Barra 
113ed264d09SValeria Barra     const CeedScalar dxdxx[3][3] = {{1./sqrt(modxxsq) - xxsq[0][0],
114ed264d09SValeria Barra                                      -xxsq[0][1],
115ed264d09SValeria Barra                                      -xxsq[0][2]},
116ed264d09SValeria Barra                                     {-xxsq[1][0],
117ed264d09SValeria Barra                                      1./sqrt(modxxsq) - xxsq[1][1],
118ed264d09SValeria Barra                                      -xxsq[1][2]},
119ed264d09SValeria Barra                                     {-xxsq[2][0],
120ed264d09SValeria Barra                                      -xxsq[2][1],
121ed264d09SValeria Barra                                      1./sqrt(modxxsq) - xxsq[2][2]}
122ed264d09SValeria Barra                                    };
123ed264d09SValeria Barra 
124ed264d09SValeria Barra     CeedScalar dxdX[3][2];
125ed264d09SValeria Barra     for (int j=0; j<3; j++)
126ed264d09SValeria Barra       for (int k=0; k<2; k++) {
127ed264d09SValeria Barra         dxdX[j][k] = 0;
128ed264d09SValeria Barra         for (int l=0; l<3; l++)
129ed264d09SValeria Barra           dxdX[j][k] += dxdxx[j][l]*dxxdX[l][k];
130ed264d09SValeria Barra       }
131ed264d09SValeria Barra 
132ed264d09SValeria Barra     // J is given by the cross product of the columns of dxdX
133ed264d09SValeria Barra     const CeedScalar J[3]= {dxdX[1][0]*dxdX[2][1] - dxdX[2][0]*dxdX[1][1],
134ed264d09SValeria Barra                             dxdX[2][0]*dxdX[0][1] - dxdX[0][0]*dxdX[2][1],
135ed264d09SValeria Barra                             dxdX[0][0]*dxdX[1][1] - dxdX[1][0]*dxdX[0][1]
136ed264d09SValeria Barra                            };
137ed264d09SValeria Barra 
138ed264d09SValeria Barra     // Use the magnitude of J as our detJ (volume scaling factor)
139ed264d09SValeria Barra     const CeedScalar modJ = sqrt(J[0]*J[0]+J[1]*J[1]+J[2]*J[2]);
140ed264d09SValeria Barra 
141ed264d09SValeria Barra     // Interp-to-Interp qdata
142ed264d09SValeria Barra     qdata[i+Q*0] = modJ * w[i];
143ed264d09SValeria Barra 
14408fade8cSvaleriabarra     // dxdX_k,j * dxdX_j,k
145ed264d09SValeria Barra     CeedScalar dxdXTdxdX[2][2];
146ed264d09SValeria Barra     for (int j=0; j<2; j++)
147ed264d09SValeria Barra       for (int k=0; k<2; k++) {
148ed264d09SValeria Barra         dxdXTdxdX[j][k] = 0;
149ed264d09SValeria Barra         for (int l=0; l<3; l++)
150ed264d09SValeria Barra           dxdXTdxdX[j][k] += dxdX[l][j]*dxdX[l][k];
151ed264d09SValeria Barra       }
152ed264d09SValeria Barra 
153ed264d09SValeria Barra     const CeedScalar detdxdXTdxdX =  dxdXTdxdX[0][0] * dxdXTdxdX[1][1]
154ed264d09SValeria Barra                                     -dxdXTdxdX[1][0] * dxdXTdxdX[0][1];
155ed264d09SValeria Barra 
15608fade8cSvaleriabarra     // Compute inverse of dxdXTdxdX, which is the 2x2 contravariant metric tensor g^{ij}
157ed264d09SValeria Barra     CeedScalar dxdXTdxdXinv[2][2];
158ed264d09SValeria Barra     dxdXTdxdXinv[0][0] =  dxdXTdxdX[1][1] / detdxdXTdxdX;
159ed264d09SValeria Barra     dxdXTdxdXinv[0][1] = -dxdXTdxdX[0][1] / detdxdXTdxdX;
160ed264d09SValeria Barra     dxdXTdxdXinv[1][0] = -dxdXTdxdX[1][0] / detdxdXTdxdX;
161ed264d09SValeria Barra     dxdXTdxdXinv[1][1] =  dxdXTdxdX[0][0] / detdxdXTdxdX;
162ed264d09SValeria Barra 
163ed264d09SValeria Barra     // Stored in Voigt convention
164ac4340cfSJed Brown     qdata[i+Q*1] = dxdXTdxdXinv[0][0];
165ac4340cfSJed Brown     qdata[i+Q*2] = dxdXTdxdXinv[1][1];
166ac4340cfSJed Brown     qdata[i+Q*3] = dxdXTdxdXinv[0][1];
167ed264d09SValeria Barra   } // End of Quadrature Point Loop
168ed264d09SValeria Barra 
169ed264d09SValeria Barra   // Return
170ed264d09SValeria Barra   return 0;
171ed264d09SValeria Barra }
172ed264d09SValeria Barra 
173ed264d09SValeria Barra // *****************************************************************************
174ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem
175ed264d09SValeria Barra // *****************************************************************************
176ed264d09SValeria Barra 
177ed264d09SValeria Barra // -----------------------------------------------------------------------------
178ed264d09SValeria Barra CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q,
179ed264d09SValeria Barra                              const CeedScalar *const *in,
180ed264d09SValeria Barra                              CeedScalar *const *out) {
181ed264d09SValeria Barra   // Inputs
182ed264d09SValeria Barra   const CeedScalar *X = in[0], *qdata = in[1];
183ed264d09SValeria Barra   // Outputs
184ed264d09SValeria Barra   CeedScalar *true_soln = out[0], *rhs = out[1];
185ed264d09SValeria Barra 
186ed264d09SValeria Barra   // Context
187ed264d09SValeria Barra   const CeedScalar *context = (const CeedScalar*)ctx;
188ed264d09SValeria Barra   const CeedScalar R        = context[0];
189ed264d09SValeria Barra 
190ed264d09SValeria Barra   // Quadrature Point Loop
191ed264d09SValeria Barra   CeedPragmaSIMD
192ed264d09SValeria Barra   for (CeedInt i=0; i<Q; i++) {
193ed264d09SValeria Barra     // Read global Cartesian coordinates
194ed264d09SValeria Barra     CeedScalar x = X[i+Q*0], y = X[i+Q*1], z = X[i+Q*2];
195ed264d09SValeria Barra     // Normalize quadrature point coordinates to sphere
196ed264d09SValeria Barra     CeedScalar rad = sqrt(x*x + y*y + z*z);
197ed264d09SValeria Barra     x *= R / rad;
198ed264d09SValeria Barra     y *= R / rad;
199ed264d09SValeria Barra     z *= R / rad;
200ed264d09SValeria Barra     // Compute latitude and longitude
201ed264d09SValeria Barra     const CeedScalar theta  = asin(z / R); // latitude
202ed264d09SValeria Barra     const CeedScalar lambda = atan2(y, x); // longitude
203ed264d09SValeria Barra 
204ed264d09SValeria Barra     true_soln[i+Q*0] = sin(lambda) * cos(theta);
205ed264d09SValeria Barra 
206ed264d09SValeria Barra     rhs[i+Q*0] = qdata[i+Q*0] * 2 * sin(lambda)*cos(theta) / (R*R);
207ed264d09SValeria Barra 
208ed264d09SValeria Barra   } // End of Quadrature Point Loop
209ed264d09SValeria Barra 
210ed264d09SValeria Barra   return 0;
211ed264d09SValeria Barra }
212ed264d09SValeria Barra 
213ed264d09SValeria Barra // *****************************************************************************
214ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field.
215ed264d09SValeria Barra //
216ed264d09SValeria Barra // Inputs:
217ed264d09SValeria Barra //   ug     - Input vector gradient at quadrature points
218ed264d09SValeria Barra //   qdata  - Geometric factors
219ed264d09SValeria Barra //
220ed264d09SValeria Barra // Output:
221ed264d09SValeria Barra //   vg     - Output vector (test functions) gradient at quadrature points
222ed264d09SValeria Barra //
223ed264d09SValeria Barra // *****************************************************************************
224ed264d09SValeria Barra 
225ed264d09SValeria Barra // -----------------------------------------------------------------------------
226ed264d09SValeria Barra CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q,
227ed264d09SValeria Barra                      const CeedScalar *const *in, CeedScalar *const *out) {
228ed264d09SValeria Barra   // Inputs
229ed264d09SValeria Barra   const CeedScalar *ug = in[0], *qdata = in[1];
230ed264d09SValeria Barra   // Outputs
231ed264d09SValeria Barra   CeedScalar *vg = out[0];
232ed264d09SValeria Barra 
233ed264d09SValeria Barra   // Quadrature Point Loop
234ed264d09SValeria Barra   CeedPragmaSIMD
235ed264d09SValeria Barra   for (CeedInt i=0; i<Q; i++) {
236ed264d09SValeria Barra     // Read spatial derivatives of u
237ed264d09SValeria Barra     const CeedScalar du[2]           =  {ug[i+Q*0],
238ed264d09SValeria Barra                                          ug[i+Q*1]
239ed264d09SValeria Barra                                         };
240ed264d09SValeria Barra     // Read qdata
241ed264d09SValeria Barra     const CeedScalar wJ              =   qdata[i+Q*0];
242ed264d09SValeria Barra     // -- Grad-to-Grad qdata
243ed264d09SValeria Barra     // ---- dXdx_j,k * dXdx_k,j
244ed264d09SValeria Barra     const CeedScalar dXdxdXdxT[2][2] = {{qdata[i+Q*1],
245ed264d09SValeria Barra                                          qdata[i+Q*3]},
246ed264d09SValeria Barra                                         {qdata[i+Q*3],
247ed264d09SValeria Barra                                          qdata[i+Q*2]}
248ed264d09SValeria Barra                                        };
249ed264d09SValeria Barra 
250ed264d09SValeria Barra     for (int j=0; j<2; j++) // j = direction of vg
251ed264d09SValeria Barra       vg[i+j*Q] = wJ * (du[0] * dXdxdXdxT[0][j] +
252ed264d09SValeria Barra                         du[1] * dXdxdXdxT[1][j]);
253ed264d09SValeria Barra 
254ed264d09SValeria Barra   } // End of Quadrature Point Loop
255ed264d09SValeria Barra 
256ed264d09SValeria Barra   return 0;
257ed264d09SValeria Barra }
258ed264d09SValeria Barra // -----------------------------------------------------------------------------
259*f6b55d2cSvaleriabarra 
260*f6b55d2cSvaleriabarra #endif // bp3sphere_h
261