// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
166ea7c6c1SJed Brown 175d6bafb2Sjeremylt /// @file 185d6bafb2Sjeremylt /// Private header for frontend components of libCEED 196ea7c6c1SJed Brown #ifndef _ceed_impl_h 206ea7c6c1SJed Brown #define _ceed_impl_h 216ea7c6c1SJed Brown 226ea7c6c1SJed Brown #include <ceed.h> 232f86a920SJeremy L Thompson #include <ceed-backend.h> 24ff8ca64bSJed Brown #include <stdbool.h> 256ea7c6c1SJed Brown 266ea7c6c1SJed Brown #define CEED_INTERN CEED_EXTERN __attribute__((visibility ("hidden"))) 276ea7c6c1SJed Brown 286ea7c6c1SJed Brown #define CEED_MAX_RESOURCE_LEN 1024 296ea7c6c1SJed Brown #define CEED_ALIGN 64 302f86a920SJeremy L Thompson 3152d6035fSJeremy L Thompson #define CEED_COMPOSITE_MAX 16 326ea7c6c1SJed Brown 33fe2413ffSjeremylt // Lookup table field for backend functions 34fe2413ffSjeremylt typedef struct { 35fe2413ffSjeremylt const char *fname; 36fe2413ffSjeremylt size_t offset; 37fe2413ffSjeremylt } foffset; 38fe2413ffSjeremylt 39aefd8378Sjeremylt // Lookup table field for object delegates 40aefd8378Sjeremylt typedef struct { 41aefd8378Sjeremylt char *objname; 42aefd8378Sjeremylt Ceed delegate; 43aefd8378Sjeremylt } objdelegate; 44aefd8378Sjeremylt 456ea7c6c1SJed Brown struct Ceed_private { 46e07206deSjeremylt const char *resource; 475fe0d4faSjeremylt Ceed delegate; 482f86a920SJeremy L Thompson Ceed parent; 49aefd8378Sjeremylt objdelegate *objdelegates; 50aefd8378Sjeremylt int objdelegatecount; 515107b09fSJeremy L Thompson Ceed opfallbackceed, opfallbackparent; 525107b09fSJeremy L Thompson const char *opfallbackresource; 532f86a920SJeremy L Thompson int (*Error)(Ceed, const char *, int, const char *, int, const char *, 542f86a920SJeremy L Thompson va_list); 55c907536fSjeremylt int (*GetPreferredMemType)(CeedMemType *); 566ea7c6c1SJed Brown int (*Destroy)(Ceed); 57f8902d9eSjeremylt int (*VectorCreate)(CeedInt, CeedVector); 58667bc5fcSjeremylt int (*ElemRestrictionCreate)(CeedMemType, CeedCopyMode, 59667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 
60667bc5fcSjeremylt int (*ElemRestrictionCreateBlocked)(CeedMemType, CeedCopyMode, 61667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 62667bc5fcSjeremylt int (*BasisCreateTensorH1)(CeedInt, CeedInt, CeedInt, const CeedScalar *, 632f86a920SJeremy L Thompson const CeedScalar *, const CeedScalar *, 642f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 65667bc5fcSjeremylt int (*BasisCreateH1)(CeedElemTopology, CeedInt, CeedInt, CeedInt, 66a8de75f0Sjeremylt const CeedScalar *, 672f86a920SJeremy L Thompson const CeedScalar *, const CeedScalar *, 682f86a920SJeremy L Thompson const CeedScalar *, CeedBasis); 69c71e1dcdSjeremylt int (*TensorContractCreate)(CeedBasis, CeedTensorContract); 706ea7c6c1SJed Brown int (*QFunctionCreate)(CeedQFunction); 716ea7c6c1SJed Brown int (*OperatorCreate)(CeedOperator); 7252d6035fSJeremy L Thompson int (*CompositeOperatorCreate)(CeedOperator); 7380061934SJed Brown int refcount; 746ea7c6c1SJed Brown void *data; 756e79d475Sjeremylt foffset *foffsets; 766ea7c6c1SJed Brown }; 776ea7c6c1SJed Brown 786ea7c6c1SJed Brown struct CeedVector_private { 796ea7c6c1SJed Brown Ceed ceed; 806ea7c6c1SJed Brown int (*SetArray)(CeedVector, CeedMemType, CeedCopyMode, CeedScalar *); 812a1ab385Sjeremylt int (*SetValue)(CeedVector, CeedScalar); 8254540941SJeremy L Thompson int (*SyncArray)(CeedVector, CeedMemType); 836ea7c6c1SJed Brown int (*GetArray)(CeedVector, CeedMemType, CeedScalar **); 846ea7c6c1SJed Brown int (*GetArrayRead)(CeedVector, CeedMemType, const CeedScalar **); 85f05116b9SJeremy L Thompson int (*RestoreArray)(CeedVector); 86f05116b9SJeremy L Thompson int (*RestoreArrayRead)(CeedVector); 876ea7c6c1SJed Brown int (*Destroy)(CeedVector); 88540765feSJed Brown int refcount; 896ea7c6c1SJed Brown CeedInt length; 9036ac90ebSjeremylt uint64_t state; 912cd729eeSjeremylt uint64_t numreaders; 926ea7c6c1SJed Brown void *data; 936ea7c6c1SJed Brown }; 946ea7c6c1SJed Brown 956ea7c6c1SJed Brown struct CeedElemRestriction_private { 966ea7c6c1SJed 
Brown Ceed ceed; 97ff8ca64bSJed Brown int (*Apply)(CeedElemRestriction, CeedTransposeMode, CeedTransposeMode, 986ea7c6c1SJed Brown CeedVector, CeedVector, CeedRequest *); 99be9261b7Sjeremylt int (*ApplyBlock)(CeedElemRestriction, CeedInt, CeedTransposeMode, 100be9261b7Sjeremylt CeedTransposeMode, CeedVector, CeedVector, CeedRequest *); 1016ea7c6c1SJed Brown int (*Destroy)(CeedElemRestriction); 102675ef50dSJed Brown int refcount; 1036ea7c6c1SJed Brown CeedInt nelem; /* number of elements */ 1048795c945Sjeremylt CeedInt elemsize; /* number of nodes per element */ 1058795c945Sjeremylt CeedInt nnodes; /* size of the L-vector, can be used for checking for 1066ea7c6c1SJed Brown correct vector sizes */ 107ff8ca64bSJed Brown CeedInt ncomp; /* number of components */ 1084e35ef05Sjeremylt CeedInt blksize; /* number of elements in a batch */ 1094e35ef05Sjeremylt CeedInt nblk; /* number of blocks of elements */ 1106ea7c6c1SJed Brown void *data; /* place for the backend to store any data */ 1116ea7c6c1SJed Brown }; 1126ea7c6c1SJed Brown 1136ea7c6c1SJed Brown struct CeedBasis_private { 1146ea7c6c1SJed Brown Ceed ceed; 1154b8bea3bSJed Brown int (*Apply)(CeedBasis, CeedInt, CeedTransposeMode, CeedEvalMode, 116aedaa0e5Sjeremylt CeedVector, CeedVector); 1176ea7c6c1SJed Brown int (*Destroy)(CeedBasis); 118c3725256SJed Brown int refcount; 119a8de75f0Sjeremylt bool tensorbasis; /* flag for tensor basis */ 1200f5de9e9Sjeremylt CeedInt dim; /* topological dimension */ 1210f5de9e9Sjeremylt CeedInt ncomp; /* number of field components (1 for scalar fields) */ 1220f5de9e9Sjeremylt CeedInt P1d; /* number of nodes in one dimension */ 1230f5de9e9Sjeremylt CeedInt Q1d; /* number of quadrature points in one dimension */ 124a8de75f0Sjeremylt CeedInt P; /* total number of nodes */ 125a8de75f0Sjeremylt CeedInt Q; /* total number of quadrature points */ 1260f5de9e9Sjeremylt CeedScalar *qref1d; /* Array of length Q1d holding the locations of 1270f5de9e9Sjeremylt quadrature points on the 1D reference 
element [-1, 1] */ 1280f5de9e9Sjeremylt CeedScalar *qweight1d; /* array of length Q1d holding the quadrature weights on 1290f5de9e9Sjeremylt the reference element */ 1304b8bea3bSJed Brown CeedScalar 1314b8bea3bSJed Brown *interp1d; /* row-major matrix of shape [Q1d, P1d] expressing the values of 1320f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1334b8bea3bSJed Brown CeedScalar 1344b8bea3bSJed Brown *grad1d; /* row-major matrix of shape [Q1d, P1d] matrix expressing derivatives of 1350f5de9e9Sjeremylt nodal basis functions at quadrature points */ 1362f86a920SJeremy L Thompson CeedTensorContract contract; /* tensor contraction object */ 137c01dd730Scamierjs void *data; /* place for the backend to store any data */ 1386ea7c6c1SJed Brown }; 1396ea7c6c1SJed Brown 1402f86a920SJeremy L Thompson struct CeedTensorContract_private { 1412f86a920SJeremy L Thompson Ceed ceed; 1422f86a920SJeremy L Thompson int (*Apply)(CeedTensorContract, CeedInt, CeedInt, CeedInt, CeedInt, 1432f86a920SJeremy L Thompson const CeedScalar *restrict, CeedTransposeMode, const CeedInt, 1442f86a920SJeremy L Thompson const CeedScalar *restrict, CeedScalar *restrict); 1452f86a920SJeremy L Thompson int (*Destroy)(CeedTensorContract); 1462f86a920SJeremy L Thompson int refcount; 1472f86a920SJeremy L Thompson void *data; 1482f86a920SJeremy L Thompson }; 1492f86a920SJeremy L Thompson 150d1bcdac9Sjeremylt struct CeedQFunctionField_private { 151ff8ca64bSJed Brown const char *fieldname; 1524d537eeaSYohann CeedInt size; 153ff8ca64bSJed Brown CeedEvalMode emode; 154ff8ca64bSJed Brown }; 155ff8ca64bSJed Brown 1566ea7c6c1SJed Brown struct CeedQFunction_private { 1576ea7c6c1SJed Brown Ceed ceed; 1582f86a920SJeremy L Thompson int (*Apply)(CeedQFunction, CeedInt, CeedVector *, CeedVector *); 1596ea7c6c1SJed Brown int (*Destroy)(CeedQFunction); 1602123d1aaSJed Brown int refcount; 1616ea7c6c1SJed Brown CeedInt vlength; // Number of quadrature points must be padded to a multiple of vlength 
162fe2413ffSjeremylt CeedQFunctionField *inputfields; 163fe2413ffSjeremylt CeedQFunctionField *outputfields; 164ff8ca64bSJed Brown CeedInt numinputfields, numoutputfields; 1659f0427d9SYohann CeedQFunctionUser function; 166288c0443SJeremy L Thompson const char *sourcepath; 167288c0443SJeremy L Thompson const char *qfname; 168418fb8c2Sjeremylt bool fortranstatus; 1690219ea01SJeremy L Thompson bool identity; 1706ea7c6c1SJed Brown void *ctx; /* user context for function */ 1716ea7c6c1SJed Brown size_t ctxsize; /* size of user context; may be used to copy to a device */ 1726ea7c6c1SJed Brown void *data; /* backend data */ 1736ea7c6c1SJed Brown }; 1746ea7c6c1SJed Brown 1751e35832bSjeremylt /// Struct to handle the context data to use the Fortran QFunction stub 1761e35832bSjeremylt /// @ingroup CeedQFunction 177069aeabaSjeremylt typedef struct { 1781e35832bSjeremylt CeedScalar *innerctx; 179069aeabaSjeremylt size_t innerctxsize; 180069aeabaSjeremylt void (*f)(void *ctx, int *nq, 181069aeabaSjeremylt const CeedScalar *u,const CeedScalar *u1, 182069aeabaSjeremylt const CeedScalar *u2,const CeedScalar *u3, 183069aeabaSjeremylt const CeedScalar *u4,const CeedScalar *u5, 184069aeabaSjeremylt const CeedScalar *u6,const CeedScalar *u7, 185069aeabaSjeremylt const CeedScalar *u8,const CeedScalar *u9, 186069aeabaSjeremylt const CeedScalar *u10,const CeedScalar *u11, 187069aeabaSjeremylt const CeedScalar *u12,const CeedScalar *u13, 188069aeabaSjeremylt const CeedScalar *u14,const CeedScalar *u15, 189069aeabaSjeremylt CeedScalar *v,CeedScalar *v1,CeedScalar *v2, 190069aeabaSjeremylt CeedScalar *v3,CeedScalar *v4,CeedScalar *v5, 191069aeabaSjeremylt CeedScalar *v6,CeedScalar *v7,CeedScalar *v8, 192069aeabaSjeremylt CeedScalar *v9, CeedScalar *v10,CeedScalar *v11, 193069aeabaSjeremylt CeedScalar *v12,CeedScalar *v13,CeedScalar *v14, 194069aeabaSjeremylt CeedScalar *v15, int *err); 195069aeabaSjeremylt } fContext; 196069aeabaSjeremylt 197d1bcdac9Sjeremylt struct 
CeedOperatorField_private { 198ff8ca64bSJed Brown CeedElemRestriction Erestrict; /// Restriction from L-vector or NULL if identity 1994dccadb6Sjeremylt CeedTransposeMode lmode; /// Transpose mode for lvector ordering 200ff8ca64bSJed Brown CeedBasis basis; /// Basis or NULL for collocated fields 2014b8bea3bSJed Brown CeedVector 2024b8bea3bSJed Brown vec; /// State vector for passive fields, NULL for active fields 203ff8ca64bSJed Brown }; 204ff8ca64bSJed Brown 2056ea7c6c1SJed Brown struct CeedOperator_private { 2066ea7c6c1SJed Brown Ceed ceed; 2075107b09fSJeremy L Thompson CeedOperator opfallback; 2085107b09fSJeremy L Thompson CeedQFunction qffallback; 209c4da7380SJed Brown int refcount; 2101d102b48SJeremy L Thompson int (*AssembleLinearQFunction)(CeedOperator, CeedVector *, 2111d102b48SJeremy L Thompson CeedElemRestriction *, CeedRequest *); 212b7ec98d8SJeremy L Thompson int (*AssembleLinearDiagonal)(CeedOperator, CeedVector *, CeedRequest *); 213ff8ca64bSJed Brown int (*Apply)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 214*cae8b89aSjeremylt int (*ApplyAdd)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 2156ea7c6c1SJed Brown int (*ApplyJacobian)(CeedOperator, CeedVector, CeedVector, CeedVector, 2166ea7c6c1SJed Brown CeedVector, CeedRequest *); 2176ea7c6c1SJed Brown int (*Destroy)(CeedOperator); 218fe2413ffSjeremylt CeedOperatorField *inputfields; 219fe2413ffSjeremylt CeedOperatorField *outputfields; 220ff8ca64bSJed Brown CeedInt numelements; /// Number of elements 221ff8ca64bSJed Brown CeedInt numqpoints; /// Number of quadrature points over all elements 222ef700c2cSjeremylt CeedInt nfields; /// Number of fields that have been set 2236ea7c6c1SJed Brown CeedQFunction qf; 2246ea7c6c1SJed Brown CeedQFunction dqf; 2256ea7c6c1SJed Brown CeedQFunction dqfT; 226ff8ca64bSJed Brown bool setupdone; 22752d6035fSJeremy L Thompson bool composite; 2282cb0afc5Sjeremylt bool hasrestriction; 22952d6035fSJeremy L Thompson CeedOperator *suboperators; 
23052d6035fSJeremy L Thompson CeedInt numsub; 2316ea7c6c1SJed Brown void *data; 2326ea7c6c1SJed Brown }; 2336ea7c6c1SJed Brown 234d863ab9bSjeremylt CEED_INTERN int CeedErrorReturn(Ceed, const char *, int, const char *, int, 235d863ab9bSjeremylt const char *, va_list); 236d863ab9bSjeremylt CEED_INTERN int CeedErrorAbort(Ceed, const char *, int, const char *, int, 237d863ab9bSjeremylt const char *, va_list); 238d863ab9bSjeremylt CEED_INTERN int CeedErrorExit(Ceed, const char *, int, const char *, int, 239d863ab9bSjeremylt const char *, va_list); 240d863ab9bSjeremylt CEED_INTERN int CeedSetErrorHandler(Ceed ceed, 2412f86a920SJeremy L Thompson int (eh)(Ceed, const char *, int, 2422f86a920SJeremy L Thompson const char *, int, const char *, 2432f86a920SJeremy L Thompson va_list)); 244d863ab9bSjeremylt 2456ea7c6c1SJed Brown #endif 246