// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16*cb32e2e7SValeria Barra 17*cb32e2e7SValeria Barra /// @file 18*cb32e2e7SValeria Barra /// libCEED QFunctions for mass operator example using PETSc 19*cb32e2e7SValeria Barra 20*cb32e2e7SValeria Barra #ifndef __CUDACC__ 21*cb32e2e7SValeria Barra # include <math.h> 22*cb32e2e7SValeria Barra #endif 23*cb32e2e7SValeria Barra 24*cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 25*cb32e2e7SValeria Barra CEED_QFUNCTION(SetupMassRhs3)(void *ctx, const CeedInt Q, 26*cb32e2e7SValeria Barra const CeedScalar *const *in, 27*cb32e2e7SValeria Barra CeedScalar *const *out) { 28*cb32e2e7SValeria Barra const CeedScalar *x = in[0], *J = in[1], *w = in[2]; 29*cb32e2e7SValeria Barra CeedScalar *true_soln = out[0], *rhs = out[1]; 30*cb32e2e7SValeria Barra 31*cb32e2e7SValeria Barra // Quadrature Point Loop 32*cb32e2e7SValeria Barra CeedPragmaSIMD 33*cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 34*cb32e2e7SValeria Barra const CeedScalar det = (J[i+Q*0]*(J[i+Q*4]*J[i+Q*8] - J[i+Q*5]*J[i+Q*7]) - 35*cb32e2e7SValeria Barra J[i+Q*1]*(J[i+Q*3]*J[i+Q*8] - J[i+Q*5]*J[i+Q*6]) + 36*cb32e2e7SValeria Barra J[i+Q*2]*(J[i+Q*3]*J[i+Q*7] - J[i+Q*4]*J[i+Q*6])); 37*cb32e2e7SValeria Barra 38*cb32e2e7SValeria Barra // Component 1 39*cb32e2e7SValeria Barra true_soln[i+0*Q] = sqrt(x[i]*x[i] + x[i+Q]*x[i+Q] + x[i+2*Q]*x[i+2*Q]); 40*cb32e2e7SValeria Barra // Component 2 41*cb32e2e7SValeria Barra true_soln[i+1*Q] = true_soln[i+0*Q]; 42*cb32e2e7SValeria Barra // Component 3 43*cb32e2e7SValeria Barra true_soln[i+2*Q] = true_soln[i+0*Q]; 44*cb32e2e7SValeria Barra 45*cb32e2e7SValeria Barra // Component 1 46*cb32e2e7SValeria Barra rhs[i+0*Q] = det * w[i] * true_soln[i+0*Q]; 47*cb32e2e7SValeria Barra // Component 2 48*cb32e2e7SValeria Barra rhs[i+1*Q] = rhs[i+0*Q]; 49*cb32e2e7SValeria Barra // Component 3 50*cb32e2e7SValeria Barra rhs[i+2*Q] = rhs[i+0*Q]; 51*cb32e2e7SValeria Barra } // End of Quadrature Point Loop 52*cb32e2e7SValeria Barra return 0; 
53*cb32e2e7SValeria Barra } 54*cb32e2e7SValeria Barra 55*cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 56*cb32e2e7SValeria Barra CEED_QFUNCTION(Mass3)(void *ctx, const CeedInt Q, 57*cb32e2e7SValeria Barra const CeedScalar *const *in, CeedScalar *const *out) { 58*cb32e2e7SValeria Barra const CeedScalar *u = in[0], *qdata = in[1]; 59*cb32e2e7SValeria Barra CeedScalar *v = out[0]; 60*cb32e2e7SValeria Barra 61*cb32e2e7SValeria Barra // Quadrature Point Loop 62*cb32e2e7SValeria Barra CeedPragmaSIMD 63*cb32e2e7SValeria Barra for (CeedInt i=0; i<Q; i++) { 64*cb32e2e7SValeria Barra const CeedScalar r = qdata[i]; 65*cb32e2e7SValeria Barra // Component 1 66*cb32e2e7SValeria Barra v[i+0*Q] = r * u[i+0*Q]; 67*cb32e2e7SValeria Barra // Component 2 68*cb32e2e7SValeria Barra v[i+1*Q] = r * u[i+1*Q]; 69*cb32e2e7SValeria Barra // Component 3 70*cb32e2e7SValeria Barra v[i+2*Q] = r * u[i+2*Q]; 71*cb32e2e7SValeria Barra } // End of Quadrature Point Loop 72*cb32e2e7SValeria Barra return 0; 73*cb32e2e7SValeria Barra } 74*cb32e2e7SValeria Barra // ----------------------------------------------------------------------------- 75