xref: /libCEED/examples/petsc/qfunctions/bps/bp2.h (revision cb32e2e7f026784d97a57f1901677e9727def907)
1*cb32e2e7SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
2*cb32e2e7SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
3*cb32e2e7SValeria Barra // reserved. See files LICENSE and NOTICE for details.
4*cb32e2e7SValeria Barra //
5*cb32e2e7SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software
6*cb32e2e7SValeria Barra // libraries and APIs for efficient high-order finite element and spectral
7*cb32e2e7SValeria Barra // element discretizations for exascale applications. For more information and
8*cb32e2e7SValeria Barra // source code availability see http://github.com/ceed.
9*cb32e2e7SValeria Barra //
10*cb32e2e7SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11*cb32e2e7SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office
12*cb32e2e7SValeria Barra // of Science and the National Nuclear Security Administration) responsible for
13*cb32e2e7SValeria Barra // the planning and preparation of a capable exascale ecosystem, including
14*cb32e2e7SValeria Barra // software, applications, hardware, advanced system engineering and early
15*cb32e2e7SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative.
16*cb32e2e7SValeria Barra 
17*cb32e2e7SValeria Barra /// @file
18*cb32e2e7SValeria Barra /// libCEED QFunctions for mass operator example using PETSc
19*cb32e2e7SValeria Barra 
20*cb32e2e7SValeria Barra #ifndef __CUDACC__
21*cb32e2e7SValeria Barra #  include <math.h>
22*cb32e2e7SValeria Barra #endif
23*cb32e2e7SValeria Barra 
24*cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
25*cb32e2e7SValeria Barra CEED_QFUNCTION(SetupMassRhs3)(void *ctx, const CeedInt Q,
26*cb32e2e7SValeria Barra                               const CeedScalar *const *in,
27*cb32e2e7SValeria Barra                               CeedScalar *const *out) {
28*cb32e2e7SValeria Barra   const CeedScalar *x = in[0], *J = in[1], *w = in[2];
29*cb32e2e7SValeria Barra   CeedScalar *true_soln = out[0], *rhs = out[1];
30*cb32e2e7SValeria Barra 
31*cb32e2e7SValeria Barra   // Quadrature Point Loop
32*cb32e2e7SValeria Barra   CeedPragmaSIMD
33*cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
34*cb32e2e7SValeria Barra     const CeedScalar det = (J[i+Q*0]*(J[i+Q*4]*J[i+Q*8] - J[i+Q*5]*J[i+Q*7]) -
35*cb32e2e7SValeria Barra                             J[i+Q*1]*(J[i+Q*3]*J[i+Q*8] - J[i+Q*5]*J[i+Q*6]) +
36*cb32e2e7SValeria Barra                             J[i+Q*2]*(J[i+Q*3]*J[i+Q*7] - J[i+Q*4]*J[i+Q*6]));
37*cb32e2e7SValeria Barra 
38*cb32e2e7SValeria Barra     // Component 1
39*cb32e2e7SValeria Barra     true_soln[i+0*Q] =  sqrt(x[i]*x[i] + x[i+Q]*x[i+Q] + x[i+2*Q]*x[i+2*Q]);
40*cb32e2e7SValeria Barra     // Component 2
41*cb32e2e7SValeria Barra     true_soln[i+1*Q] = true_soln[i+0*Q];
42*cb32e2e7SValeria Barra     // Component 3
43*cb32e2e7SValeria Barra     true_soln[i+2*Q] = true_soln[i+0*Q];
44*cb32e2e7SValeria Barra 
45*cb32e2e7SValeria Barra     // Component 1
46*cb32e2e7SValeria Barra     rhs[i+0*Q] = det * w[i] * true_soln[i+0*Q];
47*cb32e2e7SValeria Barra     // Component 2
48*cb32e2e7SValeria Barra     rhs[i+1*Q] = rhs[i+0*Q];
49*cb32e2e7SValeria Barra     // Component 3
50*cb32e2e7SValeria Barra     rhs[i+2*Q] = rhs[i+0*Q];
51*cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
52*cb32e2e7SValeria Barra   return 0;
53*cb32e2e7SValeria Barra }
54*cb32e2e7SValeria Barra 
55*cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
56*cb32e2e7SValeria Barra CEED_QFUNCTION(Mass3)(void *ctx, const CeedInt Q,
57*cb32e2e7SValeria Barra                       const CeedScalar *const *in, CeedScalar *const *out) {
58*cb32e2e7SValeria Barra   const CeedScalar *u = in[0], *qdata = in[1];
59*cb32e2e7SValeria Barra   CeedScalar *v = out[0];
60*cb32e2e7SValeria Barra 
61*cb32e2e7SValeria Barra   // Quadrature Point Loop
62*cb32e2e7SValeria Barra   CeedPragmaSIMD
63*cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
64*cb32e2e7SValeria Barra     const CeedScalar r = qdata[i];
65*cb32e2e7SValeria Barra     // Component 1
66*cb32e2e7SValeria Barra     v[i+0*Q] = r * u[i+0*Q];
67*cb32e2e7SValeria Barra     // Component 2
68*cb32e2e7SValeria Barra     v[i+1*Q] = r * u[i+1*Q];
69*cb32e2e7SValeria Barra     // Component 3
70*cb32e2e7SValeria Barra     v[i+2*Q] = r * u[i+2*Q];
71*cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
72*cb32e2e7SValeria Barra   return 0;
73*cb32e2e7SValeria Barra }
74*cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
75