// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
166ea7c6c1SJed Brown 175d6bafb2Sjeremylt /// @file 185d6bafb2Sjeremylt /// Private header for frontend components of libCEED 196ea7c6c1SJed Brown #ifndef _ceed_impl_h 206ea7c6c1SJed Brown #define _ceed_impl_h 216ea7c6c1SJed Brown 226ea7c6c1SJed Brown #include <ceed.h> 232f86a920SJeremy L Thompson #include <ceed-backend.h> 24ff8ca64bSJed Brown #include <stdbool.h> 256ea7c6c1SJed Brown 26*0e4d4210Sjeremylt #define CEED_EPSILON 1E-16 276ea7c6c1SJed Brown 28fe2413ffSjeremylt // Lookup table field for backend functions 29fe2413ffSjeremylt typedef struct { 30fe2413ffSjeremylt const char *fname; 31fe2413ffSjeremylt size_t offset; 32fe2413ffSjeremylt } foffset; 33fe2413ffSjeremylt 34aefd8378Sjeremylt // Lookup table field for object delegates 35aefd8378Sjeremylt typedef struct { 36aefd8378Sjeremylt char *objname; 37aefd8378Sjeremylt Ceed delegate; 38aefd8378Sjeremylt } objdelegate; 39aefd8378Sjeremylt 406ea7c6c1SJed Brown struct Ceed_private { 41e07206deSjeremylt const char *resource; 425fe0d4faSjeremylt Ceed delegate; 432f86a920SJeremy L Thompson Ceed parent; 44aefd8378Sjeremylt objdelegate *objdelegates; 45aefd8378Sjeremylt int objdelegatecount; 465107b09fSJeremy L Thompson Ceed opfallbackceed, opfallbackparent; 475107b09fSJeremy L Thompson const char *opfallbackresource; 482f86a920SJeremy L Thompson int (*Error)(Ceed, const char *, int, const char *, int, const char *, 492f86a920SJeremy L Thompson va_list); 50c907536fSjeremylt int (*GetPreferredMemType)(CeedMemType *); 516ea7c6c1SJed Brown int (*Destroy)(Ceed); 52f8902d9eSjeremylt int (*VectorCreate)(CeedInt, CeedVector); 53667bc5fcSjeremylt int (*ElemRestrictionCreate)(CeedMemType, CeedCopyMode, 54667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 55667bc5fcSjeremylt int (*ElemRestrictionCreateBlocked)(CeedMemType, CeedCopyMode, 56667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 57667bc5fcSjeremylt int (*BasisCreateTensorH1)(CeedInt, CeedInt, CeedInt, const CeedScalar *, 582f86a920SJeremy L Thompson const 
CeedScalar *, const CeedScalar *, 592f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 60667bc5fcSjeremylt int (*BasisCreateH1)(CeedElemTopology, CeedInt, CeedInt, CeedInt, 61a8de75f0Sjeremylt const CeedScalar *, 622f86a920SJeremy L Thompson const CeedScalar *, const CeedScalar *, 632f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 64c71e1dcdSjeremylt int (*TensorContractCreate)(CeedBasis, CeedTensorContract); 656ea7c6c1SJed Brown int (*QFunctionCreate)(CeedQFunction); 666ea7c6c1SJed Brown int (*OperatorCreate)(CeedOperator); 6752d6035fSJeremy L Thompson int (*CompositeOperatorCreate)(CeedOperator); 6880061934SJed Brown int refcount; 696ea7c6c1SJed Brown void *data; 706e79d475Sjeremylt foffset *foffsets; 716ea7c6c1SJed Brown }; 726ea7c6c1SJed Brown 736ea7c6c1SJed Brown struct CeedVector_private { 746ea7c6c1SJed Brown Ceed ceed; 756ea7c6c1SJed Brown int (*SetArray)(CeedVector, CeedMemType, CeedCopyMode, CeedScalar *); 762a1ab385Sjeremylt int (*SetValue)(CeedVector, CeedScalar); 7754540941SJeremy L Thompson int (*SyncArray)(CeedVector, CeedMemType); 786ea7c6c1SJed Brown int (*GetArray)(CeedVector, CeedMemType, CeedScalar **); 796ea7c6c1SJed Brown int (*GetArrayRead)(CeedVector, CeedMemType, const CeedScalar **); 80f05116b9SJeremy L Thompson int (*RestoreArray)(CeedVector); 81f05116b9SJeremy L Thompson int (*RestoreArrayRead)(CeedVector); 826ea7c6c1SJed Brown int (*Destroy)(CeedVector); 83540765feSJed Brown int refcount; 846ea7c6c1SJed Brown CeedInt length; 8536ac90ebSjeremylt uint64_t state; 862cd729eeSjeremylt uint64_t numreaders; 876ea7c6c1SJed Brown void *data; 886ea7c6c1SJed Brown }; 896ea7c6c1SJed Brown 906ea7c6c1SJed Brown struct CeedElemRestriction_private { 916ea7c6c1SJed Brown Ceed ceed; 92ff8ca64bSJed Brown int (*Apply)(CeedElemRestriction, CeedTransposeMode, CeedTransposeMode, 936ea7c6c1SJed Brown CeedVector, CeedVector, CeedRequest *); 94be9261b7Sjeremylt int (*ApplyBlock)(CeedElemRestriction, CeedInt, CeedTransposeMode, 
95be9261b7Sjeremylt CeedTransposeMode, CeedVector, CeedVector, CeedRequest *); 966ea7c6c1SJed Brown int (*Destroy)(CeedElemRestriction); 97675ef50dSJed Brown int refcount; 986ea7c6c1SJed Brown CeedInt nelem; /* number of elements */ 998795c945Sjeremylt CeedInt elemsize; /* number of nodes per element */ 1008795c945Sjeremylt CeedInt nnodes; /* size of the L-vector, can be used for checking for 1016ea7c6c1SJed Brown correct vector sizes */ 102ff8ca64bSJed Brown CeedInt ncomp; /* number of components */ 1034e35ef05Sjeremylt CeedInt blksize; /* number of elements in a batch */ 1044e35ef05Sjeremylt CeedInt nblk; /* number of blocks of elements */ 1056ea7c6c1SJed Brown void *data; /* place for the backend to store any data */ 1066ea7c6c1SJed Brown }; 1076ea7c6c1SJed Brown 1086ea7c6c1SJed Brown struct CeedBasis_private { 1096ea7c6c1SJed Brown Ceed ceed; 1104b8bea3bSJed Brown int (*Apply)(CeedBasis, CeedInt, CeedTransposeMode, CeedEvalMode, 111aedaa0e5Sjeremylt CeedVector, CeedVector); 1126ea7c6c1SJed Brown int (*Destroy)(CeedBasis); 113c3725256SJed Brown int refcount; 114a8de75f0Sjeremylt bool tensorbasis; /* flag for tensor basis */ 1150f5de9e9Sjeremylt CeedInt dim; /* topological dimension */ 1160f5de9e9Sjeremylt CeedInt ncomp; /* number of field components (1 for scalar fields) */ 1170f5de9e9Sjeremylt CeedInt P1d; /* number of nodes in one dimension */ 1180f5de9e9Sjeremylt CeedInt Q1d; /* number of quadrature points in one dimension */ 119a8de75f0Sjeremylt CeedInt P; /* total number of nodes */ 120a8de75f0Sjeremylt CeedInt Q; /* total number of quadrature points */ 1210f5de9e9Sjeremylt CeedScalar *qref1d; /* Array of length Q1d holding the locations of 1220f5de9e9Sjeremylt quadrature points on the 1D reference element [-1, 1] */ 1230f5de9e9Sjeremylt CeedScalar *qweight1d; /* array of length Q1d holding the quadrature weights on 1240f5de9e9Sjeremylt the reference element */ 1254b8bea3bSJed Brown CeedScalar 1264b8bea3bSJed Brown *interp1d; /* row-major matrix of shape 
[Q1d, P1d] expressing the values of 1270f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1284b8bea3bSJed Brown CeedScalar 1294b8bea3bSJed Brown *grad1d; /* row-major matrix of shape [Q1d, P1d] matrix expressing derivatives of 1300f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1312f86a920SJeremy L Thompson CeedTensorContract contract; /* tensor contraction object */ 132c01dd730Scamierjs void *data; /* place for the backend to store any data */ 1336ea7c6c1SJed Brown }; 1346ea7c6c1SJed Brown 1352f86a920SJeremy L Thompson struct CeedTensorContract_private { 1362f86a920SJeremy L Thompson Ceed ceed; 1372f86a920SJeremy L Thompson int (*Apply)(CeedTensorContract, CeedInt, CeedInt, CeedInt, CeedInt, 1382f86a920SJeremy L Thompson const CeedScalar *restrict, CeedTransposeMode, const CeedInt, 1392f86a920SJeremy L Thompson const CeedScalar *restrict, CeedScalar *restrict); 1402f86a920SJeremy L Thompson int (*Destroy)(CeedTensorContract); 1412f86a920SJeremy L Thompson int refcount; 1422f86a920SJeremy L Thompson void *data; 1432f86a920SJeremy L Thompson }; 1442f86a920SJeremy L Thompson 145d1bcdac9Sjeremylt struct CeedQFunctionField_private { 146ff8ca64bSJed Brown const char *fieldname; 1474d537eeaSYohann CeedInt size; 148ff8ca64bSJed Brown CeedEvalMode emode; 149ff8ca64bSJed Brown }; 150ff8ca64bSJed Brown 1516ea7c6c1SJed Brown struct CeedQFunction_private { 1526ea7c6c1SJed Brown Ceed ceed; 1532f86a920SJeremy L Thompson int (*Apply)(CeedQFunction, CeedInt, CeedVector *, CeedVector *); 1546ea7c6c1SJed Brown int (*Destroy)(CeedQFunction); 1552123d1aaSJed Brown int refcount; 1566ea7c6c1SJed Brown CeedInt vlength; // Number of quadrature points must be padded to a multiple of vlength 157fe2413ffSjeremylt CeedQFunctionField *inputfields; 158fe2413ffSjeremylt CeedQFunctionField *outputfields; 159ff8ca64bSJed Brown CeedInt numinputfields, numoutputfields; 1609f0427d9SYohann CeedQFunctionUser function; 161288c0443SJeremy L Thompson const char *sourcepath; 
162288c0443SJeremy L Thompson const char *qfname; 163418fb8c2Sjeremylt bool fortranstatus; 1640219ea01SJeremy L Thompson bool identity; 1656ea7c6c1SJed Brown void *ctx; /* user context for function */ 1666ea7c6c1SJed Brown size_t ctxsize; /* size of user context; may be used to copy to a device */ 1676ea7c6c1SJed Brown void *data; /* backend data */ 1686ea7c6c1SJed Brown }; 1696ea7c6c1SJed Brown 1701e35832bSjeremylt /// Struct to handle the context data to use the Fortran QFunction stub 1711e35832bSjeremylt /// @ingroup CeedQFunction 172069aeabaSjeremylt typedef struct { 1731e35832bSjeremylt CeedScalar *innerctx; 174069aeabaSjeremylt size_t innerctxsize; 175069aeabaSjeremylt void (*f)(void *ctx, int *nq, 176069aeabaSjeremylt const CeedScalar *u,const CeedScalar *u1, 177069aeabaSjeremylt const CeedScalar *u2,const CeedScalar *u3, 178069aeabaSjeremylt const CeedScalar *u4,const CeedScalar *u5, 179069aeabaSjeremylt const CeedScalar *u6,const CeedScalar *u7, 180069aeabaSjeremylt const CeedScalar *u8,const CeedScalar *u9, 181069aeabaSjeremylt const CeedScalar *u10,const CeedScalar *u11, 182069aeabaSjeremylt const CeedScalar *u12,const CeedScalar *u13, 183069aeabaSjeremylt const CeedScalar *u14,const CeedScalar *u15, 184069aeabaSjeremylt CeedScalar *v,CeedScalar *v1,CeedScalar *v2, 185069aeabaSjeremylt CeedScalar *v3,CeedScalar *v4,CeedScalar *v5, 186069aeabaSjeremylt CeedScalar *v6,CeedScalar *v7,CeedScalar *v8, 187069aeabaSjeremylt CeedScalar *v9, CeedScalar *v10,CeedScalar *v11, 188069aeabaSjeremylt CeedScalar *v12,CeedScalar *v13,CeedScalar *v14, 189069aeabaSjeremylt CeedScalar *v15, int *err); 190069aeabaSjeremylt } fContext; 191069aeabaSjeremylt 192d1bcdac9Sjeremylt struct CeedOperatorField_private { 193ff8ca64bSJed Brown CeedElemRestriction Erestrict; /// Restriction from L-vector or NULL if identity 1944dccadb6Sjeremylt CeedTransposeMode lmode; /// Transpose mode for lvector ordering 195ff8ca64bSJed Brown CeedBasis basis; /// Basis or NULL for collocated fields 
1964b8bea3bSJed Brown CeedVector 1974b8bea3bSJed Brown vec; /// State vector for passive fields, NULL for active fields 198ff8ca64bSJed Brown }; 199ff8ca64bSJed Brown 2006ea7c6c1SJed Brown struct CeedOperator_private { 2016ea7c6c1SJed Brown Ceed ceed; 2025107b09fSJeremy L Thompson CeedOperator opfallback; 2035107b09fSJeremy L Thompson CeedQFunction qffallback; 204c4da7380SJed Brown int refcount; 2051d102b48SJeremy L Thompson int (*AssembleLinearQFunction)(CeedOperator, CeedVector *, 2061d102b48SJeremy L Thompson CeedElemRestriction *, CeedRequest *); 207b7ec98d8SJeremy L Thompson int (*AssembleLinearDiagonal)(CeedOperator, CeedVector *, CeedRequest *); 208ff8ca64bSJed Brown int (*Apply)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 209250756a7Sjeremylt int (*ApplyComposite)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 210cae8b89aSjeremylt int (*ApplyAdd)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 211250756a7Sjeremylt int (*ApplyAddComposite)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 2126ea7c6c1SJed Brown int (*ApplyJacobian)(CeedOperator, CeedVector, CeedVector, CeedVector, 2136ea7c6c1SJed Brown CeedVector, CeedRequest *); 2146ea7c6c1SJed Brown int (*Destroy)(CeedOperator); 215fe2413ffSjeremylt CeedOperatorField *inputfields; 216fe2413ffSjeremylt CeedOperatorField *outputfields; 217ff8ca64bSJed Brown CeedInt numelements; /// Number of elements 218ff8ca64bSJed Brown CeedInt numqpoints; /// Number of quadrature points over all elements 219ef700c2cSjeremylt CeedInt nfields; /// Number of fields that have been set 2206ea7c6c1SJed Brown CeedQFunction qf; 2216ea7c6c1SJed Brown CeedQFunction dqf; 2226ea7c6c1SJed Brown CeedQFunction dqfT; 223ff8ca64bSJed Brown bool setupdone; 22452d6035fSJeremy L Thompson bool composite; 2252cb0afc5Sjeremylt bool hasrestriction; 22652d6035fSJeremy L Thompson CeedOperator *suboperators; 22752d6035fSJeremy L Thompson CeedInt numsub; 2286ea7c6c1SJed Brown void *data; 2296ea7c6c1SJed Brown }; 
2306ea7c6c1SJed Brown 231d863ab9bSjeremylt CEED_INTERN int CeedErrorReturn(Ceed, const char *, int, const char *, int, 232d863ab9bSjeremylt const char *, va_list); 233d863ab9bSjeremylt CEED_INTERN int CeedErrorAbort(Ceed, const char *, int, const char *, int, 234d863ab9bSjeremylt const char *, va_list); 235d863ab9bSjeremylt CEED_INTERN int CeedErrorExit(Ceed, const char *, int, const char *, int, 236d863ab9bSjeremylt const char *, va_list); 237d863ab9bSjeremylt CEED_INTERN int CeedSetErrorHandler(Ceed ceed, 2382f86a920SJeremy L Thompson int (eh)(Ceed, const char *, int, 2392f86a920SJeremy L Thompson const char *, int, const char *, 2402f86a920SJeremy L Thompson va_list)); 241d863ab9bSjeremylt 2423bd813ffSjeremylt CEED_INTERN int CeedMatrixMultiply(Ceed ceed, CeedScalar *matA, 2433bd813ffSjeremylt CeedScalar *matB, CeedScalar *matC, 2443bd813ffSjeremylt CeedInt m, CeedInt n, CeedInt kk); 2453bd813ffSjeremylt 2466ea7c6c1SJed Brown #endif 247