xref: /libCEED/include/ceed/backend.h (revision 43e1b16f0c7c5dbfae04543c0675e255f265ff67)
1ec3da8bcSJed Brown // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
2ec3da8bcSJed Brown // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
3ec3da8bcSJed Brown // reserved. See files LICENSE and NOTICE for details.
4ec3da8bcSJed Brown //
5ec3da8bcSJed Brown // This file is part of CEED, a collection of benchmarks, miniapps, software
6ec3da8bcSJed Brown // libraries and APIs for efficient high-order finite element and spectral
7ec3da8bcSJed Brown // element discretizations for exascale applications. For more information and
8ec3da8bcSJed Brown // source code availability see http://github.com/ceed.
9ec3da8bcSJed Brown //
10ec3da8bcSJed Brown // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11ec3da8bcSJed Brown // a collaborative effort of two U.S. Department of Energy organizations (Office
12ec3da8bcSJed Brown // of Science and the National Nuclear Security Administration) responsible for
13ec3da8bcSJed Brown // the planning and preparation of a capable exascale ecosystem, including
14ec3da8bcSJed Brown // software, applications, hardware, advanced system engineering and early
15ec3da8bcSJed Brown // testbed platforms, in support of the nation's exascale computing imperative.
16ec3da8bcSJed Brown 
17ec3da8bcSJed Brown /// @file
18ec3da8bcSJed Brown /// Public header for backend components of libCEED
19ec3da8bcSJed Brown #ifndef _ceed_backend_h
20ec3da8bcSJed Brown #define _ceed_backend_h
21ec3da8bcSJed Brown 
22ec3da8bcSJed Brown #include <ceed/ceed.h>
23d0c91ce9Sjeremylt #include <limits.h>
24ec3da8bcSJed Brown #include <stdbool.h>
25ec3da8bcSJed Brown 
/// Declaration helpers built on GNU-style attributes:
/// CEED_INTERN adds hidden symbol visibility on top of CEED_EXTERN,
/// CEED_UNUSED tags an entity with the `unused` attribute.
#define CEED_INTERN CEED_EXTERN __attribute__((visibility ("hidden")))
#define CEED_UNUSED __attribute__((unused))

/// Numeric limits shared with the backends.
/// CEED_ALIGN is the byte alignment of pointers returned by CeedMalloc.
#define CEED_MAX_RESOURCE_LEN     1024
#define CEED_MAX_BACKEND_PRIORITY UINT_MAX
#define CEED_ALIGN                64
#define CEED_COMPOSITE_MAX        16
33ec3da8bcSJed Brown 
/**
  @ingroup Ceed
  Expands to a compiler-specific pragma that disables optimization for the code
  that follows. Intended for functions that are sensitive to floating point
  optimizations. Expands to nothing on compilers that are not recognized here.
  A definition provided before this header is included is left untouched.
**/
#if !defined(CeedPragmaOptimizeOff)
#  if defined(__clang__)
#    define CeedPragmaOptimizeOff _Pragma("clang optimize off")
#  elif defined(__GNUC__)
     /* The current options are pushed so CeedPragmaOptimizeOn can pop them. */
#    define CeedPragmaOptimizeOff _Pragma("GCC push_options") _Pragma("GCC optimize 0")
#  elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER)
#    define CeedPragmaOptimizeOff _Pragma("optimize('', off)")
#  else
#    define CeedPragmaOptimizeOff
#  endif
#endif
5003d18186Sjeremylt 
/**
  @ingroup Ceed
  This macro restores previously set optimization flags after CeedPragmaOptimizeOff.
  Expands to a compiler-specific pragma, or to nothing on compilers that are not
  recognized here. A definition provided before this header is included is left
  untouched.
**/
#ifndef CeedPragmaOptimizeOn
#  if defined(__clang__)
#    define CeedPragmaOptimizeOn _Pragma("clang optimize on")
#  elif defined(__GNUC__)
     /* Pops the options saved by the push_options in CeedPragmaOptimizeOff. */
#    define CeedPragmaOptimizeOn _Pragma("GCC pop_options")
#  elif defined(__INTEL_COMPILER) || defined(__INTEL_LLVM_COMPILER)
     /* This branch must define the On macro; it previously redefined
        CeedPragmaOptimizeOff, leaving CeedPragmaOptimizeOn undefined. */
#    define CeedPragmaOptimizeOn _Pragma("optimize('', on)")
#  else
#    define CeedPragmaOptimizeOn
#  endif
#endif
6603d18186Sjeremylt 
67ec3da8bcSJed Brown /// CEED_DEBUG_COLOR default value, forward CeedDebug* declarations & macros
68ec3da8bcSJed Brown #ifndef CEED_DEBUG_COLOR
69ec3da8bcSJed Brown #define CEED_DEBUG_COLOR 0
70ec3da8bcSJed Brown #endif
71ec3da8bcSJed Brown CEED_EXTERN void CeedDebugImpl(const Ceed,const char *,...);
72ec3da8bcSJed Brown CEED_EXTERN void CeedDebugImpl256(const Ceed,const unsigned char,const char *,
73ec3da8bcSJed Brown                                   ...);
74ec3da8bcSJed Brown #define CeedDebug1(ceed,format, ...) CeedDebugImpl(ceed,format, ## __VA_ARGS__)
75ec3da8bcSJed Brown #define CeedDebug256(ceed,color, ...) CeedDebugImpl256(ceed,color, ## __VA_ARGS__)
76ec3da8bcSJed Brown #define CeedDebug(...) CeedDebug256(ceed,(unsigned char)CEED_DEBUG_COLOR, ## __VA_ARGS__)
77ec3da8bcSJed Brown 
/// Opaque handle to a TensorContraction object; the pointed-to struct is not
/// defined in this header.
/// @ingroup CeedBasis
struct CeedTensorContract_private;
typedef struct CeedTensorContract_private *CeedTensorContract;
81ec3da8bcSJed Brown 
82ec3da8bcSJed Brown /* In the next 3 functions, p has to be the address of a pointer type, i.e. p
83ec3da8bcSJed Brown    has to be a pointer to a pointer. */
84ec3da8bcSJed Brown CEED_INTERN int CeedMallocArray(size_t n, size_t unit, void *p);
85ec3da8bcSJed Brown CEED_INTERN int CeedCallocArray(size_t n, size_t unit, void *p);
86ec3da8bcSJed Brown CEED_INTERN int CeedReallocArray(size_t n, size_t unit, void *p);
87ec3da8bcSJed Brown CEED_INTERN int CeedFree(void *p);
88ec3da8bcSJed Brown 
/* Error propagation: evaluate ierr once and, when it is nonzero, return it
   from the enclosing function. */
#define CeedChk(ierr) \
  do { \
    int ierr_ = ierr; \
    if (ierr_) return ierr_; \
  } while (0)

/* As CeedChk, except that nonzero codes greater than CEED_ERROR_SUCCESS are
   returned as CEED_ERROR_BACKEND; other nonzero codes are returned unchanged. */
#define CeedChkBackend(ierr) \
  do { \
    int ierr_ = ierr; \
    if (ierr_) { \
      if (ierr_ > CEED_ERROR_SUCCESS) return CEED_ERROR_BACKEND; \
      else return ierr_; \
    } \
  } while (0)

/* Typed allocation wrappers: the element size is taken from **(p), so p must
   be the address of a typed pointer.
   Note that CeedMalloc and CeedCalloc will, generally, return pointers with
   different memory alignments: CeedMalloc returns pointers aligned at
   CEED_ALIGN bytes, while CeedCalloc uses the alignment of calloc. */
#define CeedMalloc(n, p) CeedMallocArray((n), sizeof(**(p)), p)
#define CeedCalloc(n, p) CeedCallocArray((n), sizeof(**(p)), p)
#define CeedRealloc(n, p) CeedReallocArray((n), sizeof(**(p)), p)
97ec3da8bcSJed Brown 
98ec3da8bcSJed Brown CEED_EXTERN int CeedRegister(const char *prefix,
99ec3da8bcSJed Brown                              int (*init)(const char *, Ceed),
100ec3da8bcSJed Brown                              unsigned int priority);
101ec3da8bcSJed Brown 
102d1d35e2fSjeremylt CEED_EXTERN int CeedIsDebug(Ceed ceed, bool *is_debug);
103ec3da8bcSJed Brown CEED_EXTERN int CeedGetParent(Ceed ceed, Ceed *parent);
104ec3da8bcSJed Brown CEED_EXTERN int CeedGetDelegate(Ceed ceed, Ceed *delegate);
105ec3da8bcSJed Brown CEED_EXTERN int CeedSetDelegate(Ceed ceed, Ceed delegate);
106ec3da8bcSJed Brown CEED_EXTERN int CeedGetObjectDelegate(Ceed ceed, Ceed *delegate,
107d1d35e2fSjeremylt                                       const char *obj_name);
108ec3da8bcSJed Brown CEED_EXTERN int CeedSetObjectDelegate(Ceed ceed, Ceed delegate,
109d1d35e2fSjeremylt                                       const char *obj_name);
110eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveBasis(CeedOperator op,
111eaf62fffSJeremy L Thompson                                       CeedBasis *active_basis);
112eaf62fffSJeremy L Thompson CEED_EXTERN int CeedOperatorGetActiveElemRestriction(CeedOperator op, CeedElemRestriction *active_rstr);
113ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackResource(Ceed ceed,
114ec3da8bcSJed Brown     const char **resource);
115ec3da8bcSJed Brown CEED_EXTERN int CeedSetOperatorFallbackResource(Ceed ceed,
116ec3da8bcSJed Brown     const char *resource);
117ec3da8bcSJed Brown CEED_EXTERN int CeedGetOperatorFallbackParentCeed(Ceed ceed, Ceed *parent);
118d1d35e2fSjeremylt CEED_EXTERN int CeedSetDeterministic(Ceed ceed, bool is_deterministic);
119ec3da8bcSJed Brown CEED_EXTERN int CeedSetBackendFunction(Ceed ceed,
120ec3da8bcSJed Brown                                        const char *type, void *object,
121d1d35e2fSjeremylt                                        const char *func_name, int (*f)());
122ec3da8bcSJed Brown CEED_EXTERN int CeedGetData(Ceed ceed, void *data);
123ec3da8bcSJed Brown CEED_EXTERN int CeedSetData(Ceed ceed, void *data);
1249560d06aSjeremylt CEED_EXTERN int CeedReference(Ceed ceed);
125ec3da8bcSJed Brown 
126ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetState(CeedVector vec, uint64_t *state);
127ec3da8bcSJed Brown CEED_EXTERN int CeedVectorAddReference(CeedVector vec);
128ec3da8bcSJed Brown CEED_EXTERN int CeedVectorGetData(CeedVector vec, void *data);
129ec3da8bcSJed Brown CEED_EXTERN int CeedVectorSetData(CeedVector vec, void *data);
1309560d06aSjeremylt CEED_EXTERN int CeedVectorReference(CeedVector vec);
131ec3da8bcSJed Brown 
132ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetStrides(CeedElemRestriction rstr,
133ec3da8bcSJed Brown     CeedInt (*strides)[3]);
134ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetOffsets(CeedElemRestriction rstr,
135d1d35e2fSjeremylt     CeedMemType mem_type, const CeedInt **offsets);
136ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionRestoreOffsets(CeedElemRestriction rstr,
137ec3da8bcSJed Brown     const CeedInt **offsets);
138ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionIsStrided(CeedElemRestriction rstr,
139d1d35e2fSjeremylt     bool *is_strided);
140ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionHasBackendStrides(CeedElemRestriction rstr,
141d1d35e2fSjeremylt     bool *has_backend_strides);
142ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetELayout(CeedElemRestriction rstr,
143ec3da8bcSJed Brown     CeedInt (*layout)[3]);
144ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionSetELayout(CeedElemRestriction rstr,
145ec3da8bcSJed Brown     CeedInt layout[3]);
146ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionGetData(CeedElemRestriction rstr,
147ec3da8bcSJed Brown     void *data);
148ec3da8bcSJed Brown CEED_EXTERN int CeedElemRestrictionSetData(CeedElemRestriction rstr,
149ec3da8bcSJed Brown     void *data);
1509560d06aSjeremylt CEED_EXTERN int CeedElemRestrictionReference(CeedElemRestriction rstr);
151ec3da8bcSJed Brown 
152ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetCollocatedGrad(CeedBasis basis,
153d1d35e2fSjeremylt     CeedScalar *colo_grad_1d);
154ec3da8bcSJed Brown CEED_EXTERN int CeedHouseholderApplyQ(CeedScalar *A, const CeedScalar *Q,
155d1d35e2fSjeremylt                                       const CeedScalar *tau, CeedTransposeMode t_mode, CeedInt m, CeedInt n,
156ec3da8bcSJed Brown                                       CeedInt k, CeedInt row, CeedInt col);
157d1d35e2fSjeremylt CEED_EXTERN int CeedBasisIsTensor(CeedBasis basis, bool *is_tensor);
158ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetData(CeedBasis basis, void *data);
159ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetData(CeedBasis basis, void *data);
1609560d06aSjeremylt CEED_EXTERN int CeedBasisReference(CeedBasis basis);
161ec3da8bcSJed Brown 
162ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTopologyDimension(CeedElemTopology topo,
163ec3da8bcSJed Brown     CeedInt *dim);
164ec3da8bcSJed Brown 
165ec3da8bcSJed Brown CEED_EXTERN int CeedBasisGetTensorContract(CeedBasis basis,
166ec3da8bcSJed Brown     CeedTensorContract *contract);
167ec3da8bcSJed Brown CEED_EXTERN int CeedBasisSetTensorContract(CeedBasis basis,
16834359f16Sjeremylt     CeedTensorContract contract);
169ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractCreate(Ceed ceed, CeedBasis basis,
170ec3da8bcSJed Brown     CeedTensorContract *contract);
171ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractApply(CeedTensorContract contract, CeedInt A,
172ec3da8bcSJed Brown                                         CeedInt B, CeedInt C, CeedInt J,
173ec3da8bcSJed Brown                                         const CeedScalar *__restrict__ t,
174d1d35e2fSjeremylt                                         CeedTransposeMode t_mode,
175ec3da8bcSJed Brown                                         const CeedInt Add,
176ec3da8bcSJed Brown                                         const CeedScalar *__restrict__ u,
177ec3da8bcSJed Brown                                         CeedScalar *__restrict__ v);
178ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractGetCeed(CeedTensorContract contract,
179ec3da8bcSJed Brown     Ceed *ceed);
180ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractGetData(CeedTensorContract contract,
181ec3da8bcSJed Brown     void *data);
182ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractSetData(CeedTensorContract contract,
183ec3da8bcSJed Brown     void *data);
1849560d06aSjeremylt CEED_EXTERN int CeedTensorContractReference(CeedTensorContract contract);
185ec3da8bcSJed Brown CEED_EXTERN int CeedTensorContractDestroy(CeedTensorContract *contract);
186ec3da8bcSJed Brown 
187ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionRegister(const char *, const char *, CeedInt,
188ec3da8bcSJed Brown                                       CeedQFunctionUser, int (*init)(Ceed, const char *, CeedQFunction));
189ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetFortranStatus(CeedQFunction qf, bool status);
190ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetVectorLength(CeedQFunction qf,
191d1d35e2fSjeremylt     CeedInt *vec_length);
192ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetNumArgs(CeedQFunction qf,
193d1d35e2fSjeremylt                                         CeedInt *num_input_fields,
194d1d35e2fSjeremylt                                         CeedInt *num_output_fields);
195*43e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetKernelName(CeedQFunction qf, char **kernel_name);
196*43e1b16fSJeremy L Thompson CEED_EXTERN int CeedQFunctionGetSourcePath(CeedQFunction qf, char **source_path);
197ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetUserFunction(CeedQFunction qf,
198ec3da8bcSJed Brown     CeedQFunctionUser *f);
199ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetContext(CeedQFunction qf,
200ec3da8bcSJed Brown                                         CeedQFunctionContext *ctx);
201ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetInnerContext(CeedQFunction qf,
202ec3da8bcSJed Brown     CeedQFunctionContext *ctx);
203d1d35e2fSjeremylt CEED_EXTERN int CeedQFunctionIsIdentity(CeedQFunction qf, bool *is_identity);
204ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionGetData(CeedQFunction qf, void *data);
205ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionSetData(CeedQFunction qf, void *data);
2069560d06aSjeremylt CEED_EXTERN int CeedQFunctionReference(CeedQFunction qf);
207ec3da8bcSJed Brown 
208ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetCeed(CeedQFunctionContext cxt,
209ec3da8bcSJed Brown     Ceed *ceed);
210ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetState(CeedQFunctionContext ctx,
211ec3da8bcSJed Brown     uint64_t *state);
212ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextGetBackendData(CeedQFunctionContext ctx,
213ec3da8bcSJed Brown     void *data);
214ec3da8bcSJed Brown CEED_EXTERN int CeedQFunctionContextSetBackendData(CeedQFunctionContext ctx,
215ec3da8bcSJed Brown     void *data);
2169560d06aSjeremylt CEED_EXTERN int CeedQFunctionContextReference(CeedQFunctionContext ctx);
217ec3da8bcSJed Brown 
218d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumArgs(CeedOperator op, CeedInt *num_args);
219d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsSetupDone(CeedOperator op, bool *is_setup_done);
220ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetQFunction(CeedOperator op, CeedQFunction *qf);
221d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorIsComposite(CeedOperator op, bool *is_composite);
222d1d35e2fSjeremylt CEED_EXTERN int CeedOperatorGetNumSub(CeedOperator op, CeedInt *num_suboperators);
223ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetSubList(CeedOperator op,
224d1d35e2fSjeremylt                                        CeedOperator **sub_operators);
225ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorGetData(CeedOperator op, void *data);
226ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetData(CeedOperator op, void *data);
2279560d06aSjeremylt CEED_EXTERN int CeedOperatorReference(CeedOperator op);
228ec3da8bcSJed Brown CEED_EXTERN int CeedOperatorSetSetupDone(CeedOperator op);
229ec3da8bcSJed Brown 
230d1d35e2fSjeremylt CEED_INTERN int CeedMatrixMultiply(Ceed ceed, const CeedScalar *mat_A,
231d1d35e2fSjeremylt                                    const CeedScalar *mat_B, CeedScalar *mat_C,
232ec3da8bcSJed Brown                                    CeedInt m, CeedInt n, CeedInt kk);
233ec3da8bcSJed Brown 
234ec3da8bcSJed Brown #endif
235