// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC. // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707. // All Rights reserved. See files LICENSE and NOTICE for details. // // This file is part of CEED, a collection of benchmarks, miniapps, software // libraries and APIs for efficient high-order finite element and spectral // element discretizations for exascale applications. For more information and // source code availability see http://github.com/ceed. // // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, // a collaborative effort of two U.S. Department of Energy organizations (Office // of Science and the National Nuclear Security Administration) responsible for // the planning and preparation of a capable exascale ecosystem, including // software, applications, hardware, advanced system engineering and early // testbed platforms, in support of the nation's exascale computing imperative. #include "ceed-ref.h" //------------------------------------------------------------------------------ // Basis Apply //------------------------------------------------------------------------------ static int CeedBasisApply_Ref(CeedBasis basis, CeedInt nelem, CeedTransposeMode tmode, CeedEvalMode emode, CeedVector U, CeedVector V) { int ierr; Ceed ceed; ierr = CeedBasisGetCeed(basis, &ceed); CeedChk(ierr); CeedInt dim, ncomp, nnodes, nqpt; ierr = CeedBasisGetDimension(basis, &dim); CeedChk(ierr); ierr = CeedBasisGetNumComponents(basis, &ncomp); CeedChk(ierr); ierr = CeedBasisGetNumNodes(basis, &nnodes); CeedChk(ierr); ierr = CeedBasisGetNumQuadraturePoints(basis, &nqpt); CeedChk(ierr); CeedTensorContract contract; ierr = CeedBasisGetTensorContract(basis, &contract); CeedChk(ierr); const CeedInt add = (tmode == CEED_TRANSPOSE); const CeedScalar *u; CeedScalar *v; if (U != CEED_VECTOR_NONE) { ierr = CeedVectorGetArrayRead(U, CEED_MEM_HOST, &u); CeedChk(ierr); } else if (emode != CEED_EVAL_WEIGHT) { // LCOV_EXCL_START return CeedError(ceed, 1, "An input vector is required for this CeedEvalMode"); // LCOV_EXCL_STOP } ierr = CeedVectorGetArray(V, CEED_MEM_HOST, &v); CeedChk(ierr); // Clear v if operating in transpose if (tmode == CEED_TRANSPOSE) { const CeedInt vsize = nelem*ncomp*nnodes; for (CeedInt i = 0; i < vsize; i++) v[i] = (CeedScalar) 0.0; } bool tensorbasis; ierr = CeedBasisGetTensorStatus(basis, &tensorbasis); CeedChk(ierr); // Tensor basis if (tensorbasis) { CeedInt P1d, Q1d; ierr = CeedBasisGetNumNodes1D(basis, &P1d); CeedChk(ierr); ierr = CeedBasisGetNumQuadraturePoints1D(basis, &Q1d); CeedChk(ierr); switch (emode) { // Interpolate to/from quadrature points case CEED_EVAL_INTERP: { CeedBasis_Ref *impl; ierr = CeedBasisGetData(basis, (void *)&impl); CeedChk(ierr); if (impl->collointerp) { memcpy(v, u, nelem*ncomp*nnodes*sizeof(u[0])); } else { CeedInt P = P1d, Q = Q1d; if (tmode == CEED_TRANSPOSE) { P = Q1d; Q = P1d; } CeedInt pre = ncomp*CeedIntPow(P, dim-1), post = nelem; CeedScalar tmp[2][nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; CeedScalar *interp1d; ierr = CeedBasisGetInterp1D(basis, &interp1d); CeedChk(ierr); for (CeedInt d=0; dcollograd1d) { CeedScalar tmp[2][nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; CeedScalar interp[nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; // Interpolate to quadrature points (NoTranspose) // or Grad to quadrature points (Transpose) for (CeedInt d=0; dcollograd1d), tmode, add&&(d>0), (tmode == CEED_NOTRANSPOSE ? (d==0?u:tmp[d%2]) : u + d*nqpt*ncomp*nelem), (tmode == CEED_NOTRANSPOSE ? (d==dim-1?interp:tmp[(d+1)%2]) : interp)); CeedChk(ierr); pre /= P; post *= Q; } // Grad to quadrature points (NoTranspose) // or Interpolate to nodes (Transpose) P = Q1d, Q = Q1d; if (tmode == CEED_TRANSPOSE) { P = Q1d, Q = P1d; } pre = ncomp*CeedIntPow(P, dim-1), post = nelem; for (CeedInt d=0; dcollograd1d : interp1d), tmode, add&&(d==dim-1), (tmode == CEED_NOTRANSPOSE ? interp : (d==0?interp:tmp[d%2])), (tmode == CEED_NOTRANSPOSE ? v + d*nqpt*ncomp*nelem : (d==dim-1?v:tmp[(d+1)%2]))); CeedChk(ierr); pre /= P; post *= Q; } } else if (impl->collointerp) { // Qpts collocated with nodes CeedScalar *grad1d; ierr = CeedBasisGetGrad1D(basis, &grad1d); CeedChk(ierr); // Dim contractions, identity in other directions CeedInt pre = ncomp*CeedIntPow(P, dim-1), post = nelem; for (CeedInt d=0; d0), tmode == CEED_NOTRANSPOSE ? u : u+d*ncomp*nqpt*nelem, tmode == CEED_TRANSPOSE ? v : v+d*ncomp*nqpt*nelem); CeedChk(ierr); pre /= P; post *= Q; } } else { // Underintegration, P > Q CeedScalar *grad1d; ierr = CeedBasisGetGrad1D(basis, &grad1d); CeedChk(ierr); if (tmode == CEED_TRANSPOSE) { P = Q1d, Q = P1d; } CeedScalar tmp[2][nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; // Dim**2 contractions, apply grad when pass == dim for (CeedInt p=0; pcollograd1d); CeedChk(ierr); ierr = CeedFree(&impl); CeedChk(ierr); return 0; } //------------------------------------------------------------------------------ // Basis Create Tensor //------------------------------------------------------------------------------ int CeedBasisCreateTensorH1_Ref(CeedInt dim, CeedInt P1d, CeedInt Q1d, const CeedScalar *interp1d, const CeedScalar *grad1d, const CeedScalar *qref1d, const CeedScalar *qweight1d, CeedBasis basis) { int ierr; Ceed ceed; ierr = CeedBasisGetCeed(basis, &ceed); CeedChk(ierr); CeedBasis_Ref *impl; ierr = CeedCalloc(1, &impl); CeedChk(ierr); // Check for collocated interp if (Q1d == P1d) { bool collocated = 1; for (CeedInt i=0; icollointerp = collocated; } // Calculate collocated grad if (Q1d >= P1d && !impl->collointerp) { ierr = CeedMalloc(Q1d*Q1d, &impl->collograd1d); CeedChk(ierr); ierr = CeedBasisGetCollocatedGrad(basis, impl->collograd1d); CeedChk(ierr); } ierr = CeedBasisSetData(basis, (void *)&impl); CeedChk(ierr); Ceed parent; ierr = CeedGetParent(ceed, &parent); CeedChk(ierr); CeedTensorContract contract; ierr = CeedTensorContractCreate(parent, basis, &contract); CeedChk(ierr); ierr = CeedBasisSetTensorContract(basis, &contract); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Apply", CeedBasisApply_Ref); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Destroy", CeedBasisDestroyTensor_Ref); CeedChk(ierr); return 0; } //------------------------------------------------------------------------------