// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16ec3da8bcSJed Brown 17ec3da8bcSJed Brown /// @file 18ec3da8bcSJed Brown /// Public header for backend components of libCEED 19ec3da8bcSJed Brown #ifndef _ceed_backend_h 20ec3da8bcSJed Brown #define _ceed_backend_h 21ec3da8bcSJed Brown 22ec3da8bcSJed Brown #include <ceed/ceed.h> 23d0c91ce9Sjeremylt #include <limits.h> 24ec3da8bcSJed Brown #include <stdbool.h> 25ec3da8bcSJed Brown 26ec3da8bcSJed Brown #define CEED_INTERN CEED_EXTERN __attribute__((visibility ("hidden"))) 27ec3da8bcSJed Brown #define CEED_UNUSED __attribute__((unused)) 28ec3da8bcSJed Brown 29ec3da8bcSJed Brown #define CEED_MAX_RESOURCE_LEN 1024 30d0c91ce9Sjeremylt #define CEED_MAX_BACKEND_PRIORITY UINT_MAX 31ec3da8bcSJed Brown #define CEED_ALIGN 64 32ec3da8bcSJed Brown #define CEED_COMPOSITE_MAX 16 33*bf4cb664SJeremy L Thompson #define CEED_FIELD_MAX 16 34ec3da8bcSJed Brown 3503d18186Sjeremylt /** 3603d18186Sjeremylt @ingroup Ceed 37eaf62fffSJeremy L Thompson This macro provides the ability to disable optimization flags for functions that 3803d18186Sjeremylt are sensitive to floting point optimizations. 3903d18186Sjeremylt **/ 4003d18186Sjeremylt #ifndef CeedPragmaOptimizeOff 4103d18186Sjeremylt # if defined(__clang__) 4203d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("clang optimize off") 4303d18186Sjeremylt # elif defined(__GNUC__) 4403d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("GCC push_options") _Pragma("GCC optimize 0") 4503d18186Sjeremylt # elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER) 4603d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("optimize('', off)") 4703d18186Sjeremylt # else 4803d18186Sjeremylt # define CeedPragmaOptimizeOff 4903d18186Sjeremylt # endif 5003d18186Sjeremylt #endif 5103d18186Sjeremylt 5203d18186Sjeremylt /** 5303d18186Sjeremylt @ingroup Ceed 5403d18186Sjeremylt This macro restores previously set optimization flags after CeedPragmaOptimizeOff. 
5503d18186Sjeremylt **/ 5603d18186Sjeremylt #ifndef CeedPragmaOptimizeOn 5703d18186Sjeremylt # if defined(__clang__) 5803d18186Sjeremylt # define CeedPragmaOptimizeOn _Pragma("clang optimize on") 5903d18186Sjeremylt # elif defined(__GNUC__) 6003d18186Sjeremylt # define CeedPragmaOptimizeOn _Pragma("GCC pop_options") 6103d18186Sjeremylt # elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER) 6203d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("optimize('', on)") 6303d18186Sjeremylt # else 6403d18186Sjeremylt # define CeedPragmaOptimizeOn 6503d18186Sjeremylt # endif 6603d18186Sjeremylt #endif 6703d18186Sjeremylt 68ec3da8bcSJed Brown /// CEED_DEBUG_COLOR default value, forward CeedDebug* declarations & macros 693f21f6b1SJeremy L Thompson #define CEED_DEBUG_COLOR_NONE 255 703f21f6b1SJeremy L Thompson 713f21f6b1SJeremy L Thompson CEED_EXTERN void CeedDebugImpl256(const unsigned char, const char *, ...); 723f21f6b1SJeremy L Thompson CEED_EXTERN bool CeedDebugFlag(const Ceed ceed); 733f21f6b1SJeremy L Thompson CEED_EXTERN bool CeedDebugFlagEnv(void); 743f21f6b1SJeremy L Thompson #define CeedDebug256(ceed, color, ...) \ 753f21f6b1SJeremy L Thompson { if (CeedDebugFlag(ceed)) CeedDebugImpl256(color, ## __VA_ARGS__); } 763f21f6b1SJeremy L Thompson #define CeedDebug(ceed, ...) CeedDebug256(ceed, (unsigned char)CEED_DEBUG_COLOR_NONE, ## __VA_ARGS__) 773f21f6b1SJeremy L Thompson #define CeedDebugEnv256(color, ...) \ 783f21f6b1SJeremy L Thompson { if (CeedDebugFlagEnv()) CeedDebugImpl256(color, ## __VA_ARGS__); } 793f21f6b1SJeremy L Thompson #define CeedDebugEnv(...) 
CeedDebugEnv256((unsigned char)CEED_DEBUG_COLOR_NONE, ## __VA_ARGS__) 80ec3da8bcSJed Brown 81ec3da8bcSJed Brown /// Handle for object handling TensorContraction 82ec3da8bcSJed Brown /// @ingroup CeedBasis 83ec3da8bcSJed Brown typedef struct CeedTensorContract_private *CeedTensorContract; 84ec3da8bcSJed Brown 85ec3da8bcSJed Brown /* In the next 3 functions, p has to be the address of a pointer type, i.e. p 86ec3da8bcSJed Brown has to be a pointer to a pointer. */ 87ec3da8bcSJed Brown CEED_INTERN int CeedMallocArray(size_t n, size_t unit, void *p); 88ec3da8bcSJed Brown CEED_INTERN int CeedCallocArray(size_t n, size_t unit, void *p); 89ec3da8bcSJed Brown CEED_INTERN int CeedReallocArray(size_t n, size_t unit, void *p); 90ec3da8bcSJed Brown CEED_INTERN int CeedFree(void *p); 91ec3da8bcSJed Brown 92ec3da8bcSJed Brown #define CeedChk(ierr) do { int ierr_ = ierr; if (ierr_) return ierr_; } while (0) 93ec3da8bcSJed Brown #define CeedChkBackend(ierr) do { int ierr_ = ierr; if (ierr_) { if (ierr_ > CEED_ERROR_SUCCESS) return CEED_ERROR_BACKEND; else return ierr_; } } while (0) 94ec3da8bcSJed Brown /* Note that CeedMalloc and CeedCalloc will, generally, return pointers with 95ec3da8bcSJed Brown different memory alignments: CeedMalloc returns pointers aligned at 96ec3da8bcSJed Brown CEED_ALIGN bytes, while CeedCalloc uses the alignment of calloc. 
*/ 97ec3da8bcSJed Brown #define CeedMalloc(n, p) CeedMallocArray((n), sizeof(**(p)), p) 98ec3da8bcSJed Brown #define CeedCalloc(n, p) CeedCallocArray((n), sizeof(**(p)), p) 99ec3da8bcSJed Brown #define CeedRealloc(n, p) CeedReallocArray((n), sizeof(**(p)), p) 100ec3da8bcSJed Brown 101ec3da8bcSJed Brown CEED_EXTERN int CeedRegister(const char *prefix, 102ec3da8bcSJed Brown int (*init)(const char *, Ceed), 103ec3da8bcSJed Brown unsigned int priority); 1046a406739SJeremy L Thompson CEED_EXTERN int CeedRegisterImpl(const char *prefix, 1056a406739SJeremy L Thompson int (*init)(const char *, Ceed), 1066a406739SJeremy L Thompson unsigned int priority); 107ec3da8bcSJed Brown 108d1d35e2fSjeremylt CEED_EXTERN int CeedIsDebug(Ceed ceed, bool *is_debug); 109ec3da8bcSJed Brown CEED_EXTERN int CeedGetParent(Ceed ceed, Ceed *parent); 110ec3da8bcSJed Brown CEED_EXTERN int CeedGetDelegate(Ceed ceed, Ceed *delegate); 111ec3da8bcSJed Brown CEED_EXTERN int CeedSetDelegate(Ceed ceed, Ceed delegate); 112ec3da8bcSJed Brown CEED_EXTERN int CeedGetObjectDelegate(Ceed ceed, Ceed *delegate, 113d1d35e2fSjeremylt const char *obj_name); 114ec3da8bcSJed Brown CEED_EXTERN int CeedSetObjectDelegate(Ceed ceed, Ceed delegate, 115d1d35e2fSjeremylt const char *obj_name); 116eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveBasis(CeedOperator op, 117eaf62fffSJeremy L Thompson CeedBasis *active_basis); 118eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveElemRestriction(CeedOperator op, CeedElemRestriction *active_rstr); 119ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackResource(Ceed ceed, 120ec3da8bcSJed Brown const char **resource); 121ec3da8bcSJed Brown CEED_EXTERN int CeedSetOperatorFallbackResource(Ceed ceed, 122ec3da8bcSJed Brown const char *resource); 123ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackParentCeed(Ceed ceed, Ceed *parent); 124d1d35e2fSjeremylt CEED_EXTERN int CeedSetDeterministic(Ceed ceed, bool is_deterministic); 125ec3da8bcSJed 
Brown CEED_EXTERN int CeedSetBackendFunction(Ceed ceed, 126ec3da8bcSJed Brown const char *type, void *object, 127d1d35e2fSjeremylt const char *func_name, int (*f)()); 128ec3da8bcSJed Brown CEED_EXTERN int CeedGetData(Ceed ceed, void *data); 129ec3da8bcSJed Brown CEED_EXTERN int CeedSetData(Ceed ceed, void *data); 1309560d06aSjeremylt CEED_EXTERN int CeedReference(Ceed ceed); 131ec3da8bcSJed Brown 132ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetState(CeedVector vec, uint64_t *state); 133ec3da8bcSJed Brown CEED_EXTERN int CeedVectorAddReference(CeedVector vec); 134ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetData(CeedVector vec, void *data); 135ec3da8bcSJed Brown CEED_EXTERN int CeedVectorSetData(CeedVector vec, void *data); 1369560d06aSjeremylt CEED_EXTERN int CeedVectorReference(CeedVector vec); 137ec3da8bcSJed Brown 138ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetStrides(CeedElemRestriction rstr, 139ec3da8bcSJed Brown CeedInt (*strides)[3]); 140ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetOffsets(CeedElemRestriction rstr, 141d1d35e2fSjeremylt CeedMemType mem_type, const CeedInt **offsets); 142ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionRestoreOffsets(CeedElemRestriction rstr, 143ec3da8bcSJed Brown const CeedInt **offsets); 144ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionIsStrided(CeedElemRestriction rstr, 145d1d35e2fSjeremylt bool *is_strided); 146ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionHasBackendStrides(CeedElemRestriction rstr, 147d1d35e2fSjeremylt bool *has_backend_strides); 148ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetELayout(CeedElemRestriction rstr, 149ec3da8bcSJed Brown CeedInt (*layout)[3]); 150ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionSetELayout(CeedElemRestriction rstr, 151ec3da8bcSJed Brown CeedInt layout[3]); 152ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetData(CeedElemRestriction rstr, 153ec3da8bcSJed Brown void *data); 154ec3da8bcSJed Brown 
CEED_EXTERN int CeedElemRestrictionSetData(CeedElemRestriction rstr, 155ec3da8bcSJed Brown void *data); 1569560d06aSjeremylt CEED_EXTERN int CeedElemRestrictionReference(CeedElemRestriction rstr); 157ec3da8bcSJed Brown 158ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetCollocatedGrad(CeedBasis basis, 159d1d35e2fSjeremylt CeedScalar *colo_grad_1d); 160ec3da8bcSJed Brown CEED_EXTERN int CeedHouseholderApplyQ(CeedScalar *A, const CeedScalar *Q, 161d1d35e2fSjeremylt const CeedScalar *tau, CeedTransposeMode t_mode, CeedInt m, CeedInt n, 162ec3da8bcSJed Brown CeedInt k, CeedInt row, CeedInt col); 163d1d35e2fSjeremylt CEED_EXTERN int CeedBasisIsTensor(CeedBasis basis, bool *is_tensor); 164ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetData(CeedBasis basis, void *data); 165ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetData(CeedBasis basis, void *data); 1669560d06aSjeremylt CEED_EXTERN int CeedBasisReference(CeedBasis basis); 167ec3da8bcSJed Brown 168ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTopologyDimension(CeedElemTopology topo, 169ec3da8bcSJed Brown CeedInt *dim); 170ec3da8bcSJed Brown 171ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTensorContract(CeedBasis basis, 172ec3da8bcSJed Brown CeedTensorContract *contract); 173ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetTensorContract(CeedBasis basis, 17434359f16Sjeremylt CeedTensorContract contract); 175ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractCreate(Ceed ceed, CeedBasis basis, 176ec3da8bcSJed Brown CeedTensorContract *contract); 177ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractApply(CeedTensorContract contract, CeedInt A, 178ec3da8bcSJed Brown CeedInt B, CeedInt C, CeedInt J, 179ec3da8bcSJed Brown const CeedScalar *__restrict__ t, 180d1d35e2fSjeremylt CeedTransposeMode t_mode, 181ec3da8bcSJed Brown const CeedInt Add, 182ec3da8bcSJed Brown const CeedScalar *__restrict__ u, 183ec3da8bcSJed Brown CeedScalar *__restrict__ v); 184ec3da8bcSJed Brown CEED_EXTERN int 
CeedTensorContractGetCeed(CeedTensorContract contract, 185ec3da8bcSJed Brown Ceed *ceed); 186ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractGetData(CeedTensorContract contract, 187ec3da8bcSJed Brown void *data); 188ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractSetData(CeedTensorContract contract, 189ec3da8bcSJed Brown void *data); 1909560d06aSjeremylt CEED_EXTERN int CeedTensorContractReference(CeedTensorContract contract); 191ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractDestroy(CeedTensorContract *contract); 192ec3da8bcSJed Brown 193ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionRegister(const char *, const char *, CeedInt, 194ec3da8bcSJed Brown CeedQFunctionUser, int (*init)(Ceed, const char *, CeedQFunction)); 195ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetFortranStatus(CeedQFunction qf, bool status); 196ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetVectorLength(CeedQFunction qf, 197d1d35e2fSjeremylt CeedInt *vec_length); 198ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetNumArgs(CeedQFunction qf, 199d1d35e2fSjeremylt CeedInt *num_input_fields, 200d1d35e2fSjeremylt CeedInt *num_output_fields); 20143e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetKernelName(CeedQFunction qf, char **kernel_name); 20243e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetSourcePath(CeedQFunction qf, char **source_path); 2033d3250a0SJeremy L Thompson CEED_EXTERN int CeedQFunctionLoadSourceToBuffer(CeedQFunction qf, char **source_buffer); 204ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetUserFunction(CeedQFunction qf, 205ec3da8bcSJed Brown CeedQFunctionUser *f); 206ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetContext(CeedQFunction qf, 207ec3da8bcSJed Brown CeedQFunctionContext *ctx); 208ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetInnerContext(CeedQFunction qf, 209ec3da8bcSJed Brown CeedQFunctionContext *ctx); 210d1d35e2fSjeremylt CEED_EXTERN int CeedQFunctionIsIdentity(CeedQFunction qf, bool *is_identity); 
211ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetData(CeedQFunction qf, void *data); 212ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetData(CeedQFunction qf, void *data); 2139560d06aSjeremylt CEED_EXTERN int CeedQFunctionReference(CeedQFunction qf); 214ec3da8bcSJed Brown 215ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetCeed(CeedQFunctionContext cxt, 216ec3da8bcSJed Brown Ceed *ceed); 217ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetState(CeedQFunctionContext ctx, 218ec3da8bcSJed Brown uint64_t *state); 219ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetBackendData(CeedQFunctionContext ctx, 220ec3da8bcSJed Brown void *data); 221ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextSetBackendData(CeedQFunctionContext ctx, 222ec3da8bcSJed Brown void *data); 2239560d06aSjeremylt CEED_EXTERN int CeedQFunctionContextReference(CeedQFunctionContext ctx); 224ec3da8bcSJed Brown 225d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumArgs(CeedOperator op, CeedInt *num_args); 226d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsSetupDone(CeedOperator op, bool *is_setup_done); 227ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetQFunction(CeedOperator op, CeedQFunction *qf); 228d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsComposite(CeedOperator op, bool *is_composite); 229d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumSub(CeedOperator op, CeedInt *num_suboperators); 230ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetSubList(CeedOperator op, 231d1d35e2fSjeremylt CeedOperator **sub_operators); 232ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetData(CeedOperator op, void *data); 233ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetData(CeedOperator op, void *data); 2349560d06aSjeremylt CEED_EXTERN int CeedOperatorReference(CeedOperator op); 235ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetSetupDone(CeedOperator op); 236ec3da8bcSJed Brown 237d1d35e2fSjeremylt CEED_INTERN int CeedMatrixMultiply(Ceed ceed, const CeedScalar 
*mat_A, 238d1d35e2fSjeremylt const CeedScalar *mat_B, CeedScalar *mat_C, 239ec3da8bcSJed Brown CeedInt m, CeedInt n, CeedInt kk); 240ec3da8bcSJed Brown 241ec3da8bcSJed Brown #endif 242