// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
166ea7c6c1SJed Brown 175d6bafb2Sjeremylt /// @file 185d6bafb2Sjeremylt /// Private header for frontend components of libCEED 196ea7c6c1SJed Brown #ifndef _ceed_impl_h 206ea7c6c1SJed Brown #define _ceed_impl_h 216ea7c6c1SJed Brown 226ea7c6c1SJed Brown #include <ceed.h> 232f86a920SJeremy L Thompson #include <ceed-backend.h> 24ff8ca64bSJed Brown #include <stdbool.h> 256ea7c6c1SJed Brown 260e4d4210Sjeremylt #define CEED_EPSILON 1E-16 276ea7c6c1SJed Brown 28fe2413ffSjeremylt // Lookup table field for backend functions 29fe2413ffSjeremylt typedef struct { 30fe2413ffSjeremylt const char *fname; 31fe2413ffSjeremylt size_t offset; 32fe2413ffSjeremylt } foffset; 33fe2413ffSjeremylt 34aefd8378Sjeremylt // Lookup table field for object delegates 35aefd8378Sjeremylt typedef struct { 36aefd8378Sjeremylt char *objname; 37aefd8378Sjeremylt Ceed delegate; 38aefd8378Sjeremylt } objdelegate; 39aefd8378Sjeremylt 406ea7c6c1SJed Brown struct Ceed_private { 41e07206deSjeremylt const char *resource; 425fe0d4faSjeremylt Ceed delegate; 432f86a920SJeremy L Thompson Ceed parent; 44aefd8378Sjeremylt objdelegate *objdelegates; 45aefd8378Sjeremylt int objdelegatecount; 465107b09fSJeremy L Thompson Ceed opfallbackceed, opfallbackparent; 475107b09fSJeremy L Thompson const char *opfallbackresource; 482f86a920SJeremy L Thompson int (*Error)(Ceed, const char *, int, const char *, int, const char *, 492f86a920SJeremy L Thompson va_list); 50c907536fSjeremylt int (*GetPreferredMemType)(CeedMemType *); 516ea7c6c1SJed Brown int (*Destroy)(Ceed); 52f8902d9eSjeremylt int (*VectorCreate)(CeedInt, CeedVector); 53667bc5fcSjeremylt int (*ElemRestrictionCreate)(CeedMemType, CeedCopyMode, 54667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 55667bc5fcSjeremylt int (*ElemRestrictionCreateBlocked)(CeedMemType, CeedCopyMode, 56667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 57667bc5fcSjeremylt int (*BasisCreateTensorH1)(CeedInt, CeedInt, CeedInt, const CeedScalar *, 582f86a920SJeremy L Thompson const 
CeedScalar *, const CeedScalar *, 592f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 60667bc5fcSjeremylt int (*BasisCreateH1)(CeedElemTopology, CeedInt, CeedInt, CeedInt, 61a8de75f0Sjeremylt const CeedScalar *, 622f86a920SJeremy L Thompson const CeedScalar *, const CeedScalar *, 632f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 64c71e1dcdSjeremylt int (*TensorContractCreate)(CeedBasis, CeedTensorContract); 656ea7c6c1SJed Brown int (*QFunctionCreate)(CeedQFunction); 666ea7c6c1SJed Brown int (*OperatorCreate)(CeedOperator); 6752d6035fSJeremy L Thompson int (*CompositeOperatorCreate)(CeedOperator); 6880061934SJed Brown int refcount; 696ea7c6c1SJed Brown void *data; 706e79d475Sjeremylt foffset *foffsets; 716ea7c6c1SJed Brown }; 726ea7c6c1SJed Brown 736ea7c6c1SJed Brown struct CeedVector_private { 746ea7c6c1SJed Brown Ceed ceed; 756ea7c6c1SJed Brown int (*SetArray)(CeedVector, CeedMemType, CeedCopyMode, CeedScalar *); 762a1ab385Sjeremylt int (*SetValue)(CeedVector, CeedScalar); 7754540941SJeremy L Thompson int (*SyncArray)(CeedVector, CeedMemType); 786ea7c6c1SJed Brown int (*GetArray)(CeedVector, CeedMemType, CeedScalar **); 796ea7c6c1SJed Brown int (*GetArrayRead)(CeedVector, CeedMemType, const CeedScalar **); 80f05116b9SJeremy L Thompson int (*RestoreArray)(CeedVector); 81f05116b9SJeremy L Thompson int (*RestoreArrayRead)(CeedVector); 826ea7c6c1SJed Brown int (*Destroy)(CeedVector); 83540765feSJed Brown int refcount; 846ea7c6c1SJed Brown CeedInt length; 8536ac90ebSjeremylt uint64_t state; 862cd729eeSjeremylt uint64_t numreaders; 876ea7c6c1SJed Brown void *data; 886ea7c6c1SJed Brown }; 896ea7c6c1SJed Brown 906ea7c6c1SJed Brown struct CeedElemRestriction_private { 916ea7c6c1SJed Brown Ceed ceed; 92ff8ca64bSJed Brown int (*Apply)(CeedElemRestriction, CeedTransposeMode, CeedTransposeMode, 936ea7c6c1SJed Brown CeedVector, CeedVector, CeedRequest *); 94be9261b7Sjeremylt int (*ApplyBlock)(CeedElemRestriction, CeedInt, CeedTransposeMode, 
95be9261b7Sjeremylt CeedTransposeMode, CeedVector, CeedVector, CeedRequest *); 966ea7c6c1SJed Brown int (*Destroy)(CeedElemRestriction); 97675ef50dSJed Brown int refcount; 986ea7c6c1SJed Brown CeedInt nelem; /* number of elements */ 998795c945Sjeremylt CeedInt elemsize; /* number of nodes per element */ 1008795c945Sjeremylt CeedInt nnodes; /* size of the L-vector, can be used for checking for 1016ea7c6c1SJed Brown correct vector sizes */ 102ff8ca64bSJed Brown CeedInt ncomp; /* number of components */ 1034e35ef05Sjeremylt CeedInt blksize; /* number of elements in a batch */ 1044e35ef05Sjeremylt CeedInt nblk; /* number of blocks of elements */ 1056ea7c6c1SJed Brown void *data; /* place for the backend to store any data */ 1066ea7c6c1SJed Brown }; 1076ea7c6c1SJed Brown 1086ea7c6c1SJed Brown struct CeedBasis_private { 1096ea7c6c1SJed Brown Ceed ceed; 1104b8bea3bSJed Brown int (*Apply)(CeedBasis, CeedInt, CeedTransposeMode, CeedEvalMode, 111aedaa0e5Sjeremylt CeedVector, CeedVector); 1126ea7c6c1SJed Brown int (*Destroy)(CeedBasis); 113c3725256SJed Brown int refcount; 114a8de75f0Sjeremylt bool tensorbasis; /* flag for tensor basis */ 1150f5de9e9Sjeremylt CeedInt dim; /* topological dimension */ 1160f5de9e9Sjeremylt CeedInt ncomp; /* number of field components (1 for scalar fields) */ 1170f5de9e9Sjeremylt CeedInt P1d; /* number of nodes in one dimension */ 1180f5de9e9Sjeremylt CeedInt Q1d; /* number of quadrature points in one dimension */ 119a8de75f0Sjeremylt CeedInt P; /* total number of nodes */ 120a8de75f0Sjeremylt CeedInt Q; /* total number of quadrature points */ 1210f5de9e9Sjeremylt CeedScalar *qref1d; /* Array of length Q1d holding the locations of 1220f5de9e9Sjeremylt quadrature points on the 1D reference element [-1, 1] */ 1230f5de9e9Sjeremylt CeedScalar *qweight1d; /* array of length Q1d holding the quadrature weights on 1240f5de9e9Sjeremylt the reference element */ 1254b8bea3bSJed Brown CeedScalar 126*00f91b2bSjeremylt *interp; /* row-major matrix of shape [Q, 
P] expressing the values of 127*00f91b2bSjeremylt nodal basis functions at quadrature points */ 128*00f91b2bSjeremylt CeedScalar 1294b8bea3bSJed Brown *interp1d; /* row-major matrix of shape [Q1d, P1d] expressing the values of 1300f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1314b8bea3bSJed Brown CeedScalar 132*00f91b2bSjeremylt *grad; /* row-major matrix of shape [dim*Q, P] matrix expressing derivatives of 133*00f91b2bSjeremylt nodal basis functions at quadrature points */ 134*00f91b2bSjeremylt CeedScalar 1354b8bea3bSJed Brown *grad1d; /* row-major matrix of shape [Q1d, P1d] matrix expressing derivatives of 1360f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1372f86a920SJeremy L Thompson CeedTensorContract contract; /* tensor contraction object */ 138c01dd730Scamierjs void *data; /* place for the backend to store any data */ 1396ea7c6c1SJed Brown }; 1406ea7c6c1SJed Brown 1412f86a920SJeremy L Thompson struct CeedTensorContract_private { 1422f86a920SJeremy L Thompson Ceed ceed; 1432f86a920SJeremy L Thompson int (*Apply)(CeedTensorContract, CeedInt, CeedInt, CeedInt, CeedInt, 1442f86a920SJeremy L Thompson const CeedScalar *restrict, CeedTransposeMode, const CeedInt, 1452f86a920SJeremy L Thompson const CeedScalar *restrict, CeedScalar *restrict); 1462f86a920SJeremy L Thompson int (*Destroy)(CeedTensorContract); 1472f86a920SJeremy L Thompson int refcount; 1482f86a920SJeremy L Thompson void *data; 1492f86a920SJeremy L Thompson }; 1502f86a920SJeremy L Thompson 151d1bcdac9Sjeremylt struct CeedQFunctionField_private { 152ff8ca64bSJed Brown const char *fieldname; 1534d537eeaSYohann CeedInt size; 154ff8ca64bSJed Brown CeedEvalMode emode; 155ff8ca64bSJed Brown }; 156ff8ca64bSJed Brown 1576ea7c6c1SJed Brown struct CeedQFunction_private { 1586ea7c6c1SJed Brown Ceed ceed; 1592f86a920SJeremy L Thompson int (*Apply)(CeedQFunction, CeedInt, CeedVector *, CeedVector *); 1606ea7c6c1SJed Brown int (*Destroy)(CeedQFunction); 1612123d1aaSJed Brown int 
refcount; 1626ea7c6c1SJed Brown CeedInt vlength; // Number of quadrature points must be padded to a multiple of vlength 163fe2413ffSjeremylt CeedQFunctionField *inputfields; 164fe2413ffSjeremylt CeedQFunctionField *outputfields; 165ff8ca64bSJed Brown CeedInt numinputfields, numoutputfields; 1669f0427d9SYohann CeedQFunctionUser function; 167288c0443SJeremy L Thompson const char *sourcepath; 168288c0443SJeremy L Thompson const char *qfname; 169418fb8c2Sjeremylt bool fortranstatus; 1700219ea01SJeremy L Thompson bool identity; 1716ea7c6c1SJed Brown void *ctx; /* user context for function */ 1726ea7c6c1SJed Brown size_t ctxsize; /* size of user context; may be used to copy to a device */ 1736ea7c6c1SJed Brown void *data; /* backend data */ 1746ea7c6c1SJed Brown }; 1756ea7c6c1SJed Brown 1761e35832bSjeremylt /// Struct to handle the context data to use the Fortran QFunction stub 1771e35832bSjeremylt /// @ingroup CeedQFunction 178069aeabaSjeremylt typedef struct { 1791e35832bSjeremylt CeedScalar *innerctx; 180069aeabaSjeremylt size_t innerctxsize; 181069aeabaSjeremylt void (*f)(void *ctx, int *nq, 182069aeabaSjeremylt const CeedScalar *u,const CeedScalar *u1, 183069aeabaSjeremylt const CeedScalar *u2,const CeedScalar *u3, 184069aeabaSjeremylt const CeedScalar *u4,const CeedScalar *u5, 185069aeabaSjeremylt const CeedScalar *u6,const CeedScalar *u7, 186069aeabaSjeremylt const CeedScalar *u8,const CeedScalar *u9, 187069aeabaSjeremylt const CeedScalar *u10,const CeedScalar *u11, 188069aeabaSjeremylt const CeedScalar *u12,const CeedScalar *u13, 189069aeabaSjeremylt const CeedScalar *u14,const CeedScalar *u15, 190069aeabaSjeremylt CeedScalar *v,CeedScalar *v1,CeedScalar *v2, 191069aeabaSjeremylt CeedScalar *v3,CeedScalar *v4,CeedScalar *v5, 192069aeabaSjeremylt CeedScalar *v6,CeedScalar *v7,CeedScalar *v8, 193069aeabaSjeremylt CeedScalar *v9, CeedScalar *v10,CeedScalar *v11, 194069aeabaSjeremylt CeedScalar *v12,CeedScalar *v13,CeedScalar *v14, 195069aeabaSjeremylt CeedScalar 
*v15, int *err); 196069aeabaSjeremylt } fContext; 197069aeabaSjeremylt 198d1bcdac9Sjeremylt struct CeedOperatorField_private { 199ff8ca64bSJed Brown CeedElemRestriction Erestrict; /// Restriction from L-vector or NULL if identity 2004dccadb6Sjeremylt CeedTransposeMode lmode; /// Transpose mode for lvector ordering 201ff8ca64bSJed Brown CeedBasis basis; /// Basis or NULL for collocated fields 2024b8bea3bSJed Brown CeedVector 2034b8bea3bSJed Brown vec; /// State vector for passive fields, NULL for active fields 204ff8ca64bSJed Brown }; 205ff8ca64bSJed Brown 2066ea7c6c1SJed Brown struct CeedOperator_private { 2076ea7c6c1SJed Brown Ceed ceed; 2085107b09fSJeremy L Thompson CeedOperator opfallback; 2095107b09fSJeremy L Thompson CeedQFunction qffallback; 210c4da7380SJed Brown int refcount; 2111d102b48SJeremy L Thompson int (*AssembleLinearQFunction)(CeedOperator, CeedVector *, 2121d102b48SJeremy L Thompson CeedElemRestriction *, CeedRequest *); 213b7ec98d8SJeremy L Thompson int (*AssembleLinearDiagonal)(CeedOperator, CeedVector *, CeedRequest *); 214ff8ca64bSJed Brown int (*Apply)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 215250756a7Sjeremylt int (*ApplyComposite)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 216cae8b89aSjeremylt int (*ApplyAdd)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 217250756a7Sjeremylt int (*ApplyAddComposite)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 2186ea7c6c1SJed Brown int (*ApplyJacobian)(CeedOperator, CeedVector, CeedVector, CeedVector, 2196ea7c6c1SJed Brown CeedVector, CeedRequest *); 2206ea7c6c1SJed Brown int (*Destroy)(CeedOperator); 221fe2413ffSjeremylt CeedOperatorField *inputfields; 222fe2413ffSjeremylt CeedOperatorField *outputfields; 223ff8ca64bSJed Brown CeedInt numelements; /// Number of elements 224ff8ca64bSJed Brown CeedInt numqpoints; /// Number of quadrature points over all elements 225ef700c2cSjeremylt CeedInt nfields; /// Number of fields that have been set 2266ea7c6c1SJed Brown 
CeedQFunction qf; 2276ea7c6c1SJed Brown CeedQFunction dqf; 2286ea7c6c1SJed Brown CeedQFunction dqfT; 229ff8ca64bSJed Brown bool setupdone; 23052d6035fSJeremy L Thompson bool composite; 2312cb0afc5Sjeremylt bool hasrestriction; 23252d6035fSJeremy L Thompson CeedOperator *suboperators; 23352d6035fSJeremy L Thompson CeedInt numsub; 2346ea7c6c1SJed Brown void *data; 2356ea7c6c1SJed Brown }; 2366ea7c6c1SJed Brown 237d863ab9bSjeremylt CEED_INTERN int CeedErrorReturn(Ceed, const char *, int, const char *, int, 238d863ab9bSjeremylt const char *, va_list); 239d863ab9bSjeremylt CEED_INTERN int CeedErrorAbort(Ceed, const char *, int, const char *, int, 240d863ab9bSjeremylt const char *, va_list); 241d863ab9bSjeremylt CEED_INTERN int CeedErrorExit(Ceed, const char *, int, const char *, int, 242d863ab9bSjeremylt const char *, va_list); 243d863ab9bSjeremylt CEED_INTERN int CeedSetErrorHandler(Ceed ceed, 2442f86a920SJeremy L Thompson int (eh)(Ceed, const char *, int, 2452f86a920SJeremy L Thompson const char *, int, const char *, 2462f86a920SJeremy L Thompson va_list)); 247d863ab9bSjeremylt 2483bd813ffSjeremylt CEED_INTERN int CeedMatrixMultiply(Ceed ceed, CeedScalar *matA, 2493bd813ffSjeremylt CeedScalar *matB, CeedScalar *matC, 2503bd813ffSjeremylt CeedInt m, CeedInt n, CeedInt kk); 2513bd813ffSjeremylt 2526ea7c6c1SJed Brown #endif 253