// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights // reserved. See files LICENSE and NOTICE for details. // // This file is part of CEED, a collection of benchmarks, miniapps, software // libraries and APIs for efficient high-order finite element and spectral // element discretizations for exascale applications. For more information and // source code availability see http://github.com/ceed. // // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, // a collaborative effort of two U.S. Department of Energy organizations (Office // of Science and the National Nuclear Security Administration) responsible for // the planning and preparation of a capable exascale ecosystem, including // software, applications, hardware, advanced system engineering and early // testbed platforms, in support of the nation's exascale computing imperative. // magma functions specific to ceed #include #include #include "magma.h" typedef struct { CeedScalar *dqref1d; CeedScalar *dinterp1d; CeedScalar *dgrad1d; CeedScalar *dqweight1d; } CeedBasis_Magma; typedef struct { CeedScalar *dqref; CeedScalar *dinterp; CeedScalar *dgrad; CeedScalar *dqweight; } CeedBasisNonTensor_Magma; typedef struct { CeedInt *indices; CeedInt *dindices; int own_; int down_; // cover a case where we own Device memory } CeedElemRestriction_Magma; typedef struct { const CeedScalar **inputs; CeedScalar **outputs; bool setupdone; } CeedQFunction_Magma; #define USE_MAGMA_BATCH #define USE_MAGMA_BATCH2 #define USE_MAGMA_BATCH3 #define USE_MAGMA_BATCH4 #ifdef __cplusplus CEED_INTERN { #endif void magmablas_dbasis_apply_batched_eval_interp(magma_int_t P, magma_int_t Q, magma_int_t dim, magma_int_t ncomp, const double *dT, CeedTransposeMode tmode, const double *dU, magma_int_t u_elemstride, magma_int_t u_compstride, double *dV, magma_int_t v_elemstride, magma_int_t v_compstride, magma_int_t nelem); void magmablas_dbasis_apply_batched_eval_grad(magma_int_t P, magma_int_t Q, magma_int_t dim, magma_int_t ncomp, magma_int_t nqpt, const double* dinterp1d, const double *dgrad1d, CeedTransposeMode tmode, const double *dU, magma_int_t u_elemstride, magma_int_t u_compstride, magma_int_t u_dimstride, double *dV, magma_int_t v_elemstride, magma_int_t v_compstride, magma_int_t v_dimstride, magma_int_t dim_id, magma_int_t nelem); void magmablas_dbasis_apply_batched_eval_weight(magma_int_t Q, magma_int_t dim, const double *dqweight1d, double *dV, magma_int_t v_elemstride, magma_int_t nelem); void magma_weight(magma_int_t grid, magma_int_t threads, magma_int_t nelem, magma_int_t Q, double *dqweight, double *dv); void magma_readDofs(const magma_int_t NCOMP, const magma_int_t nnodes, const magma_int_t esize, const magma_int_t nelem, magma_int_t *indices, const double *du, double *dv); void magma_readDofsTranspose(const magma_int_t NCOMP, const magma_int_t nnodes, const magma_int_t esize, const magma_int_t nelem, magma_int_t *indices, const double *du, double *dv); void magma_writeDofs(const magma_int_t NCOMP, const magma_int_t nnodes, const magma_int_t esize, const magma_int_t nelem, magma_int_t *indices, const double *du, double *dv); void magma_writeDofsTranspose(const magma_int_t NCOMP, const magma_int_t nnodes, const magma_int_t esize, const magma_int_t nelem, magma_int_t *indices, const double *du, double *dv); magma_int_t magma_isdevptr(const void *A); int CeedBasisCreateTensorH1_Magma(CeedInt dim, CeedInt P1d, CeedInt Q1d, const CeedScalar *interp1d, const CeedScalar *grad1d, const CeedScalar *qref1d, const CeedScalar *qweight1d, CeedBasis basis); int CeedBasisCreateH1_Magma(CeedElemTopology topo, CeedInt dim, CeedInt ndof, CeedInt nqpts, const CeedScalar *interp, const CeedScalar *grad, const CeedScalar *qref, const CeedScalar *qweight, CeedBasis basis); int CeedElemRestrictionCreate_Magma(CeedMemType mtype, CeedCopyMode cmode, const CeedInt *indices, CeedElemRestriction r); int CeedElemRestrictionCreateBlocked_Magma(const CeedMemType mtype, const CeedCopyMode cmode, const CeedInt *indices, const CeedElemRestriction res); #ifdef __cplusplus } #endif #define CeedDebug(...) //#define CeedDebug(format, ...) fprintf(stderr, format, ## __VA_ARGS__) // comment the line below to use the default magma_is_devptr function #define magma_is_devptr magma_isdevptr // batch stride, override using -DMAGMA_BATCH_STRIDE= #ifndef MAGMA_BATCH_STRIDE #define MAGMA_BATCH_STRIDE (1000) #endif