// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
166ea7c6c1SJed Brown 176ea7c6c1SJed Brown #ifndef _ceed_impl_h 186ea7c6c1SJed Brown #define _ceed_impl_h 196ea7c6c1SJed Brown 206ea7c6c1SJed Brown #include <ceed.h> 21ff8ca64bSJed Brown #include <stdbool.h> 226ea7c6c1SJed Brown 236ea7c6c1SJed Brown #define CEED_INTERN CEED_EXTERN __attribute__((visibility ("hidden"))) 246ea7c6c1SJed Brown 256ea7c6c1SJed Brown #define CEED_MAX_RESOURCE_LEN 1024 266ea7c6c1SJed Brown #define CEED_ALIGN 64 276ea7c6c1SJed Brown 286ea7c6c1SJed Brown struct Ceed_private { 29*5fe0d4faSjeremylt Ceed delegate; 306ea7c6c1SJed Brown int (*Error)(Ceed, const char *, int, const char *, int, const char *, va_list); 316ea7c6c1SJed Brown int (*Destroy)(Ceed); 32667bc5fcSjeremylt int (*VecCreate)(CeedInt, CeedVector); 33667bc5fcSjeremylt int (*ElemRestrictionCreate)(CeedMemType, CeedCopyMode, 34667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 35667bc5fcSjeremylt int (*ElemRestrictionCreateBlocked)(CeedMemType, CeedCopyMode, 36667bc5fcSjeremylt const CeedInt *, CeedElemRestriction); 37667bc5fcSjeremylt int (*BasisCreateTensorH1)(CeedInt, CeedInt, CeedInt, const CeedScalar *, 386ea7c6c1SJed Brown const CeedScalar *, const CeedScalar *, const CeedScalar *, CeedBasis); 39667bc5fcSjeremylt int (*BasisCreateH1)(CeedElemTopology, CeedInt, CeedInt, CeedInt, 40a8de75f0Sjeremylt const CeedScalar *, 41a8de75f0Sjeremylt const CeedScalar *, const CeedScalar *, const CeedScalar *, CeedBasis); 426ea7c6c1SJed Brown int (*QFunctionCreate)(CeedQFunction); 436ea7c6c1SJed Brown int (*OperatorCreate)(CeedOperator); 4480061934SJed Brown int refcount; 456ea7c6c1SJed Brown void *data; 466ea7c6c1SJed Brown }; 476ea7c6c1SJed Brown 486ea7c6c1SJed Brown /* In the next 3 functions, p has to be the address of a pointer type, i.e. p 496ea7c6c1SJed Brown has to be a pointer to a pointer. 
*/ 50c7c22b02Scamierjs CEED_INTERN int CeedMallocArray(size_t n, size_t unit, void *p); 51c7c22b02Scamierjs CEED_INTERN int CeedCallocArray(size_t n, size_t unit, void *p); 52c7c22b02Scamierjs CEED_INTERN int CeedReallocArray(size_t n, size_t unit, void *p); 53c7c22b02Scamierjs CEED_INTERN int CeedFree(void *p); 546ea7c6c1SJed Brown 556ea7c6c1SJed Brown #define CeedChk(ierr) do { if (ierr) return ierr; } while (0) 566ea7c6c1SJed Brown /* Note that CeedMalloc and CeedCalloc will, generally, return pointers with 576ea7c6c1SJed Brown different memory alignments: CeedMalloc returns pointers aligned at 586ea7c6c1SJed Brown CEED_ALIGN bytes, while CeedCalloc uses the alignment of calloc. */ 59c7c22b02Scamierjs #define CeedMalloc(n, p) CeedMallocArray((n), sizeof(**(p)), p) 60c7c22b02Scamierjs #define CeedCalloc(n, p) CeedCallocArray((n), sizeof(**(p)), p) 61c7c22b02Scamierjs #define CeedRealloc(n, p) CeedReallocArray((n), sizeof(**(p)), p) 626ea7c6c1SJed Brown 636ea7c6c1SJed Brown struct CeedVector_private { 646ea7c6c1SJed Brown Ceed ceed; 656ea7c6c1SJed Brown int (*SetArray)(CeedVector, CeedMemType, CeedCopyMode, CeedScalar *); 662a1ab385Sjeremylt int (*SetValue)(CeedVector, CeedScalar); 676ea7c6c1SJed Brown int (*GetArray)(CeedVector, CeedMemType, CeedScalar **); 686ea7c6c1SJed Brown int (*GetArrayRead)(CeedVector, CeedMemType, const CeedScalar **); 696ea7c6c1SJed Brown int (*RestoreArray)(CeedVector, CeedScalar **); 706ea7c6c1SJed Brown int (*RestoreArrayRead)(CeedVector, const CeedScalar **); 716ea7c6c1SJed Brown int (*Destroy)(CeedVector); 72540765feSJed Brown int refcount; 736ea7c6c1SJed Brown CeedInt length; 7436ac90ebSjeremylt uint64_t state; 756ea7c6c1SJed Brown void *data; 766ea7c6c1SJed Brown }; 776ea7c6c1SJed Brown 786ea7c6c1SJed Brown struct CeedElemRestriction_private { 796ea7c6c1SJed Brown Ceed ceed; 80ff8ca64bSJed Brown int (*Apply)(CeedElemRestriction, CeedTransposeMode, CeedTransposeMode, 816ea7c6c1SJed Brown CeedVector, CeedVector, CeedRequest *); 
826ea7c6c1SJed Brown int (*Destroy)(CeedElemRestriction); 83675ef50dSJed Brown int refcount; 846ea7c6c1SJed Brown CeedInt nelem; /* number of elements */ 856ea7c6c1SJed Brown CeedInt elemsize; /* number of dofs per element */ 866ea7c6c1SJed Brown CeedInt ndof; /* size of the L-vector, can be used for checking for 876ea7c6c1SJed Brown correct vector sizes */ 88ff8ca64bSJed Brown CeedInt ncomp; /* number of components */ 894e35ef05Sjeremylt CeedInt blksize; /* number of elements in a batch */ 904e35ef05Sjeremylt CeedInt nblk; /* number of blocks of elements */ 916ea7c6c1SJed Brown void *data; /* place for the backend to store any data */ 926ea7c6c1SJed Brown }; 936ea7c6c1SJed Brown 946ea7c6c1SJed Brown struct CeedBasis_private { 956ea7c6c1SJed Brown Ceed ceed; 964b8bea3bSJed Brown int (*Apply)(CeedBasis, CeedInt, CeedTransposeMode, CeedEvalMode, 974b8bea3bSJed Brown const CeedScalar *, 986ea7c6c1SJed Brown CeedScalar *); 996ea7c6c1SJed Brown int (*Destroy)(CeedBasis); 100c3725256SJed Brown int refcount; 101a8de75f0Sjeremylt bool tensorbasis; /* flag for tensor basis */ 1020f5de9e9Sjeremylt CeedInt dim; /* topological dimension */ 1030f5de9e9Sjeremylt CeedInt ncomp; /* number of field components (1 for scalar fields) */ 1040f5de9e9Sjeremylt CeedInt P1d; /* number of nodes in one dimension */ 1050f5de9e9Sjeremylt CeedInt Q1d; /* number of quadrature points in one dimension */ 106a8de75f0Sjeremylt CeedInt P; /* total number of nodes */ 107a8de75f0Sjeremylt CeedInt Q; /* total number of quadrature points */ 1080f5de9e9Sjeremylt CeedScalar *qref1d; /* Array of length Q1d holding the locations of 1090f5de9e9Sjeremylt quadrature points on the 1D reference element [-1, 1] */ 1100f5de9e9Sjeremylt CeedScalar *qweight1d; /* array of length Q1d holding the quadrature weights on 1110f5de9e9Sjeremylt the reference element */ 1124b8bea3bSJed Brown CeedScalar 1134b8bea3bSJed Brown *interp1d; /* row-major matrix of shape [Q1d, P1d] expressing the values of 1140f5de9e9Sjeremylt nodal 
basis functions at quadrature points */ 1154b8bea3bSJed Brown CeedScalar 1164b8bea3bSJed Brown *grad1d; /* row-major matrix of shape [Q1d, P1d] matrix expressing derivatives of 1170f5de9e9Sjeremylt nodal basis functions at quadrature points */ 118c01dd730Scamierjs void *data; /* place for the backend to store any data */ 1196ea7c6c1SJed Brown }; 1206ea7c6c1SJed Brown 121ff8ca64bSJed Brown struct CeedQFunctionField { 122ff8ca64bSJed Brown const char *fieldname; 123ff8ca64bSJed Brown CeedInt ncomp; 124ff8ca64bSJed Brown CeedEvalMode emode; 125ff8ca64bSJed Brown }; 126ff8ca64bSJed Brown 1276ea7c6c1SJed Brown struct CeedQFunction_private { 1286ea7c6c1SJed Brown Ceed ceed; 129ff8ca64bSJed Brown int (*Apply)(CeedQFunction, CeedInt, const CeedScalar *const *, 1306ea7c6c1SJed Brown CeedScalar *const *); 1316ea7c6c1SJed Brown int (*Destroy)(CeedQFunction); 1322123d1aaSJed Brown int refcount; 1336ea7c6c1SJed Brown CeedInt vlength; // Number of quadrature points must be padded to a multiple of vlength 134ff8ca64bSJed Brown struct CeedQFunctionField inputfields[16]; 135ff8ca64bSJed Brown struct CeedQFunctionField outputfields[16]; 136ff8ca64bSJed Brown CeedInt numinputfields, numoutputfields; 137ff8ca64bSJed Brown int (*function)(void*, CeedInt, const CeedScalar *const*, CeedScalar *const*); 1386ea7c6c1SJed Brown const char *focca; 1396ea7c6c1SJed Brown void *ctx; /* user context for function */ 1406ea7c6c1SJed Brown size_t ctxsize; /* size of user context; may be used to copy to a device */ 1416ea7c6c1SJed Brown void *data; /* backend data */ 1426ea7c6c1SJed Brown }; 1436ea7c6c1SJed Brown 144ff8ca64bSJed Brown struct CeedOperatorField { 145ff8ca64bSJed Brown CeedElemRestriction Erestrict; /// Restriction from L-vector or NULL if identity 146ff8ca64bSJed Brown CeedBasis basis; /// Basis or NULL for collocated fields 1474b8bea3bSJed Brown CeedVector 1484b8bea3bSJed Brown vec; /// State vector for passive fields, NULL for active fields 149ff8ca64bSJed Brown }; 150ff8ca64bSJed 
Brown 1516ea7c6c1SJed Brown struct CeedOperator_private { 1526ea7c6c1SJed Brown Ceed ceed; 153c4da7380SJed Brown int refcount; 154ff8ca64bSJed Brown int (*Apply)(CeedOperator, CeedVector, CeedVector, CeedRequest *); 1556ea7c6c1SJed Brown int (*ApplyJacobian)(CeedOperator, CeedVector, CeedVector, CeedVector, 1566ea7c6c1SJed Brown CeedVector, CeedRequest *); 1576ea7c6c1SJed Brown int (*GetQData)(CeedOperator, CeedVector *); 1586ea7c6c1SJed Brown int (*Destroy)(CeedOperator); 159ff8ca64bSJed Brown struct CeedOperatorField inputfields[16]; 160ff8ca64bSJed Brown struct CeedOperatorField outputfields[16]; 161ff8ca64bSJed Brown CeedInt numelements; /// Number of elements 162ff8ca64bSJed Brown CeedInt numqpoints; /// Number of quadrature points over all elements 163ef700c2cSjeremylt CeedInt nfields; /// Number of fields that have been set 1646ea7c6c1SJed Brown CeedQFunction qf; 1656ea7c6c1SJed Brown CeedQFunction dqf; 1666ea7c6c1SJed Brown CeedQFunction dqfT; 167ff8ca64bSJed Brown bool setupdone; 1686ea7c6c1SJed Brown void *data; 1696ea7c6c1SJed Brown }; 1706ea7c6c1SJed Brown 1716ea7c6c1SJed Brown #endif 172