// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16ec3da8bcSJed Brown 17ec3da8bcSJed Brown /// @file 18ec3da8bcSJed Brown /// Public header for backend components of libCEED 19ec3da8bcSJed Brown #ifndef _ceed_backend_h 20ec3da8bcSJed Brown #define _ceed_backend_h 21ec3da8bcSJed Brown 22ec3da8bcSJed Brown #include <ceed/ceed.h> 23d0c91ce9Sjeremylt #include <limits.h> 24ec3da8bcSJed Brown #include <stdbool.h> 25ec3da8bcSJed Brown 26ec3da8bcSJed Brown #define CEED_INTERN CEED_EXTERN __attribute__((visibility ("hidden"))) 27ec3da8bcSJed Brown #define CEED_UNUSED __attribute__((unused)) 28ec3da8bcSJed Brown 29ec3da8bcSJed Brown #define CEED_MAX_RESOURCE_LEN 1024 30d0c91ce9Sjeremylt #define CEED_MAX_BACKEND_PRIORITY UINT_MAX 31ec3da8bcSJed Brown #define CEED_ALIGN 64 32ec3da8bcSJed Brown #define CEED_COMPOSITE_MAX 16 33ec3da8bcSJed Brown 3403d18186Sjeremylt /** 3503d18186Sjeremylt @ingroup Ceed 36eaf62fffSJeremy L Thompson This macro provides the ability to disable optimization flags for functions that 3703d18186Sjeremylt are sensitive to floting point optimizations. 3803d18186Sjeremylt **/ 3903d18186Sjeremylt #ifndef CeedPragmaOptimizeOff 4003d18186Sjeremylt # if defined(__clang__) 4103d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("clang optimize off") 4203d18186Sjeremylt # elif defined(__GNUC__) 4303d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("GCC push_options") _Pragma("GCC optimize 0") 4403d18186Sjeremylt # elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER) 4503d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("optimize('', off)") 4603d18186Sjeremylt # else 4703d18186Sjeremylt # define CeedPragmaOptimizeOff 4803d18186Sjeremylt # endif 4903d18186Sjeremylt #endif 5003d18186Sjeremylt 5103d18186Sjeremylt /** 5203d18186Sjeremylt @ingroup Ceed 5303d18186Sjeremylt This macro restores previously set optimization flags after CeedPragmaOptimizeOff. 
5403d18186Sjeremylt **/ 5503d18186Sjeremylt #ifndef CeedPragmaOptimizeOn 5603d18186Sjeremylt # if defined(__clang__) 5703d18186Sjeremylt # define CeedPragmaOptimizeOn _Pragma("clang optimize on") 5803d18186Sjeremylt # elif defined(__GNUC__) 5903d18186Sjeremylt # define CeedPragmaOptimizeOn _Pragma("GCC pop_options") 6003d18186Sjeremylt # elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER) 6103d18186Sjeremylt # define CeedPragmaOptimizeOff _Pragma("optimize('', on)") 6203d18186Sjeremylt # else 6303d18186Sjeremylt # define CeedPragmaOptimizeOn 6403d18186Sjeremylt # endif 6503d18186Sjeremylt #endif 6603d18186Sjeremylt 67ec3da8bcSJed Brown /// CEED_DEBUG_COLOR default value, forward CeedDebug* declarations & macros 68*3f21f6b1SJeremy L Thompson #define CEED_DEBUG_COLOR_NONE 255 69*3f21f6b1SJeremy L Thompson 70*3f21f6b1SJeremy L Thompson CEED_EXTERN void CeedDebugImpl256(const unsigned char, const char *, ...); 71*3f21f6b1SJeremy L Thompson CEED_EXTERN bool CeedDebugFlag(const Ceed ceed); 72*3f21f6b1SJeremy L Thompson CEED_EXTERN bool CeedDebugFlagEnv(void); 73*3f21f6b1SJeremy L Thompson #define CeedDebug256(ceed, color, ...) \ 74*3f21f6b1SJeremy L Thompson { if (CeedDebugFlag(ceed)) CeedDebugImpl256(color, ## __VA_ARGS__); } 75*3f21f6b1SJeremy L Thompson #define CeedDebug(ceed, ...) CeedDebug256(ceed, (unsigned char)CEED_DEBUG_COLOR_NONE, ## __VA_ARGS__) 76*3f21f6b1SJeremy L Thompson #define CeedDebugEnv256(color, ...) \ 77*3f21f6b1SJeremy L Thompson { if (CeedDebugFlagEnv()) CeedDebugImpl256(color, ## __VA_ARGS__); } 78*3f21f6b1SJeremy L Thompson #define CeedDebugEnv(...) 
CeedDebugEnv256((unsigned char)CEED_DEBUG_COLOR_NONE, ## __VA_ARGS__) 79ec3da8bcSJed Brown 80ec3da8bcSJed Brown /// Handle for object handling TensorContraction 81ec3da8bcSJed Brown /// @ingroup CeedBasis 82ec3da8bcSJed Brown typedef struct CeedTensorContract_private *CeedTensorContract; 83ec3da8bcSJed Brown 84ec3da8bcSJed Brown /* In the next 3 functions, p has to be the address of a pointer type, i.e. p 85ec3da8bcSJed Brown has to be a pointer to a pointer. */ 86ec3da8bcSJed Brown CEED_INTERN int CeedMallocArray(size_t n, size_t unit, void *p); 87ec3da8bcSJed Brown CEED_INTERN int CeedCallocArray(size_t n, size_t unit, void *p); 88ec3da8bcSJed Brown CEED_INTERN int CeedReallocArray(size_t n, size_t unit, void *p); 89ec3da8bcSJed Brown CEED_INTERN int CeedFree(void *p); 90ec3da8bcSJed Brown 91ec3da8bcSJed Brown #define CeedChk(ierr) do { int ierr_ = ierr; if (ierr_) return ierr_; } while (0) 92ec3da8bcSJed Brown #define CeedChkBackend(ierr) do { int ierr_ = ierr; if (ierr_) { if (ierr_ > CEED_ERROR_SUCCESS) return CEED_ERROR_BACKEND; else return ierr_; } } while (0) 93ec3da8bcSJed Brown /* Note that CeedMalloc and CeedCalloc will, generally, return pointers with 94ec3da8bcSJed Brown different memory alignments: CeedMalloc returns pointers aligned at 95ec3da8bcSJed Brown CEED_ALIGN bytes, while CeedCalloc uses the alignment of calloc. 
*/ 96ec3da8bcSJed Brown #define CeedMalloc(n, p) CeedMallocArray((n), sizeof(**(p)), p) 97ec3da8bcSJed Brown #define CeedCalloc(n, p) CeedCallocArray((n), sizeof(**(p)), p) 98ec3da8bcSJed Brown #define CeedRealloc(n, p) CeedReallocArray((n), sizeof(**(p)), p) 99ec3da8bcSJed Brown 100ec3da8bcSJed Brown CEED_EXTERN int CeedRegister(const char *prefix, 101ec3da8bcSJed Brown int (*init)(const char *, Ceed), 102ec3da8bcSJed Brown unsigned int priority); 103ec3da8bcSJed Brown 104d1d35e2fSjeremylt CEED_EXTERN int CeedIsDebug(Ceed ceed, bool *is_debug); 105ec3da8bcSJed Brown CEED_EXTERN int CeedGetParent(Ceed ceed, Ceed *parent); 106ec3da8bcSJed Brown CEED_EXTERN int CeedGetDelegate(Ceed ceed, Ceed *delegate); 107ec3da8bcSJed Brown CEED_EXTERN int CeedSetDelegate(Ceed ceed, Ceed delegate); 108ec3da8bcSJed Brown CEED_EXTERN int CeedGetObjectDelegate(Ceed ceed, Ceed *delegate, 109d1d35e2fSjeremylt const char *obj_name); 110ec3da8bcSJed Brown CEED_EXTERN int CeedSetObjectDelegate(Ceed ceed, Ceed delegate, 111d1d35e2fSjeremylt const char *obj_name); 112eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveBasis(CeedOperator op, 113eaf62fffSJeremy L Thompson CeedBasis *active_basis); 114eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveElemRestriction(CeedOperator op, CeedElemRestriction *active_rstr); 115ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackResource(Ceed ceed, 116ec3da8bcSJed Brown const char **resource); 117ec3da8bcSJed Brown CEED_EXTERN int CeedSetOperatorFallbackResource(Ceed ceed, 118ec3da8bcSJed Brown const char *resource); 119ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackParentCeed(Ceed ceed, Ceed *parent); 120d1d35e2fSjeremylt CEED_EXTERN int CeedSetDeterministic(Ceed ceed, bool is_deterministic); 121ec3da8bcSJed Brown CEED_EXTERN int CeedSetBackendFunction(Ceed ceed, 122ec3da8bcSJed Brown const char *type, void *object, 123d1d35e2fSjeremylt const char *func_name, int (*f)()); 124ec3da8bcSJed Brown CEED_EXTERN int 
CeedGetData(Ceed ceed, void *data); 125ec3da8bcSJed Brown CEED_EXTERN int CeedSetData(Ceed ceed, void *data); 1269560d06aSjeremylt CEED_EXTERN int CeedReference(Ceed ceed); 127ec3da8bcSJed Brown 128ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetState(CeedVector vec, uint64_t *state); 129ec3da8bcSJed Brown CEED_EXTERN int CeedVectorAddReference(CeedVector vec); 130ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetData(CeedVector vec, void *data); 131ec3da8bcSJed Brown CEED_EXTERN int CeedVectorSetData(CeedVector vec, void *data); 1329560d06aSjeremylt CEED_EXTERN int CeedVectorReference(CeedVector vec); 133ec3da8bcSJed Brown 134ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetStrides(CeedElemRestriction rstr, 135ec3da8bcSJed Brown CeedInt (*strides)[3]); 136ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetOffsets(CeedElemRestriction rstr, 137d1d35e2fSjeremylt CeedMemType mem_type, const CeedInt **offsets); 138ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionRestoreOffsets(CeedElemRestriction rstr, 139ec3da8bcSJed Brown const CeedInt **offsets); 140ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionIsStrided(CeedElemRestriction rstr, 141d1d35e2fSjeremylt bool *is_strided); 142ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionHasBackendStrides(CeedElemRestriction rstr, 143d1d35e2fSjeremylt bool *has_backend_strides); 144ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetELayout(CeedElemRestriction rstr, 145ec3da8bcSJed Brown CeedInt (*layout)[3]); 146ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionSetELayout(CeedElemRestriction rstr, 147ec3da8bcSJed Brown CeedInt layout[3]); 148ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetData(CeedElemRestriction rstr, 149ec3da8bcSJed Brown void *data); 150ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionSetData(CeedElemRestriction rstr, 151ec3da8bcSJed Brown void *data); 1529560d06aSjeremylt CEED_EXTERN int CeedElemRestrictionReference(CeedElemRestriction rstr); 153ec3da8bcSJed 
Brown 154ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetCollocatedGrad(CeedBasis basis, 155d1d35e2fSjeremylt CeedScalar *colo_grad_1d); 156ec3da8bcSJed Brown CEED_EXTERN int CeedHouseholderApplyQ(CeedScalar *A, const CeedScalar *Q, 157d1d35e2fSjeremylt const CeedScalar *tau, CeedTransposeMode t_mode, CeedInt m, CeedInt n, 158ec3da8bcSJed Brown CeedInt k, CeedInt row, CeedInt col); 159d1d35e2fSjeremylt CEED_EXTERN int CeedBasisIsTensor(CeedBasis basis, bool *is_tensor); 160ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetData(CeedBasis basis, void *data); 161ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetData(CeedBasis basis, void *data); 1629560d06aSjeremylt CEED_EXTERN int CeedBasisReference(CeedBasis basis); 163ec3da8bcSJed Brown 164ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTopologyDimension(CeedElemTopology topo, 165ec3da8bcSJed Brown CeedInt *dim); 166ec3da8bcSJed Brown 167ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTensorContract(CeedBasis basis, 168ec3da8bcSJed Brown CeedTensorContract *contract); 169ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetTensorContract(CeedBasis basis, 17034359f16Sjeremylt CeedTensorContract contract); 171ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractCreate(Ceed ceed, CeedBasis basis, 172ec3da8bcSJed Brown CeedTensorContract *contract); 173ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractApply(CeedTensorContract contract, CeedInt A, 174ec3da8bcSJed Brown CeedInt B, CeedInt C, CeedInt J, 175ec3da8bcSJed Brown const CeedScalar *__restrict__ t, 176d1d35e2fSjeremylt CeedTransposeMode t_mode, 177ec3da8bcSJed Brown const CeedInt Add, 178ec3da8bcSJed Brown const CeedScalar *__restrict__ u, 179ec3da8bcSJed Brown CeedScalar *__restrict__ v); 180ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractGetCeed(CeedTensorContract contract, 181ec3da8bcSJed Brown Ceed *ceed); 182ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractGetData(CeedTensorContract contract, 183ec3da8bcSJed Brown void *data); 184ec3da8bcSJed Brown CEED_EXTERN 
int CeedTensorContractSetData(CeedTensorContract contract, 185ec3da8bcSJed Brown void *data); 1869560d06aSjeremylt CEED_EXTERN int CeedTensorContractReference(CeedTensorContract contract); 187ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractDestroy(CeedTensorContract *contract); 188ec3da8bcSJed Brown 189ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionRegister(const char *, const char *, CeedInt, 190ec3da8bcSJed Brown CeedQFunctionUser, int (*init)(Ceed, const char *, CeedQFunction)); 191ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetFortranStatus(CeedQFunction qf, bool status); 192ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetVectorLength(CeedQFunction qf, 193d1d35e2fSjeremylt CeedInt *vec_length); 194ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetNumArgs(CeedQFunction qf, 195d1d35e2fSjeremylt CeedInt *num_input_fields, 196d1d35e2fSjeremylt CeedInt *num_output_fields); 19743e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetKernelName(CeedQFunction qf, char **kernel_name); 19843e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetSourcePath(CeedQFunction qf, char **source_path); 1993d3250a0SJeremy L Thompson CEED_EXTERN int CeedQFunctionLoadSourceToBuffer(CeedQFunction qf, char **source_buffer); 200ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetUserFunction(CeedQFunction qf, 201ec3da8bcSJed Brown CeedQFunctionUser *f); 202ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetContext(CeedQFunction qf, 203ec3da8bcSJed Brown CeedQFunctionContext *ctx); 204ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetInnerContext(CeedQFunction qf, 205ec3da8bcSJed Brown CeedQFunctionContext *ctx); 206d1d35e2fSjeremylt CEED_EXTERN int CeedQFunctionIsIdentity(CeedQFunction qf, bool *is_identity); 207ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetData(CeedQFunction qf, void *data); 208ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetData(CeedQFunction qf, void *data); 2099560d06aSjeremylt CEED_EXTERN int CeedQFunctionReference(CeedQFunction qf); 
210ec3da8bcSJed Brown 211ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetCeed(CeedQFunctionContext cxt, 212ec3da8bcSJed Brown Ceed *ceed); 213ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetState(CeedQFunctionContext ctx, 214ec3da8bcSJed Brown uint64_t *state); 215ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetBackendData(CeedQFunctionContext ctx, 216ec3da8bcSJed Brown void *data); 217ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextSetBackendData(CeedQFunctionContext ctx, 218ec3da8bcSJed Brown void *data); 2199560d06aSjeremylt CEED_EXTERN int CeedQFunctionContextReference(CeedQFunctionContext ctx); 220ec3da8bcSJed Brown 221d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumArgs(CeedOperator op, CeedInt *num_args); 222d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsSetupDone(CeedOperator op, bool *is_setup_done); 223ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetQFunction(CeedOperator op, CeedQFunction *qf); 224d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsComposite(CeedOperator op, bool *is_composite); 225d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumSub(CeedOperator op, CeedInt *num_suboperators); 226ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetSubList(CeedOperator op, 227d1d35e2fSjeremylt CeedOperator **sub_operators); 228ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetData(CeedOperator op, void *data); 229ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetData(CeedOperator op, void *data); 2309560d06aSjeremylt CEED_EXTERN int CeedOperatorReference(CeedOperator op); 231ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetSetupDone(CeedOperator op); 232ec3da8bcSJed Brown 233d1d35e2fSjeremylt CEED_INTERN int CeedMatrixMultiply(Ceed ceed, const CeedScalar *mat_A, 234d1d35e2fSjeremylt const CeedScalar *mat_B, CeedScalar *mat_C, 235ec3da8bcSJed Brown CeedInt m, CeedInt n, CeedInt kk); 236ec3da8bcSJed Brown 237ec3da8bcSJed Brown #endif 238