// NOTE(review): this copy of the file is damaged and cannot compile as shown.
//   * The original line breaks are gone: everything below sits on three
//     physical lines, so every `//` comment now extends to the end of its
//     physical line and hides the code that follows it.
//   * Text appears to have been dropped wherever a `<` was later followed by
//     a `>`: the first `#include` has no header name, and loop headers such as
//     `for (CeedInt q=0; q` and `for (CeedInt d=0; d` stop right after the loop
//     variable and run straight into unrelated code. Presumably a markup
//     stripper removed those spans; restore the file from version control
//     rather than repairing it by hand.
//
// What is still readable in the text below:
//   * CeedTensorContract_Ref: the signature, the contract stated in its own
//     comment (NOTRANSPOSE: V_ajc = T_jb U_abc, TRANSPOSE: V_ajc = T_bj U_abc,
//     "+=" instead of "=" when Add != 0) and the stride selection for t:
//     (tstride0, tstride1) = (B, 1), or (1, J) when tmode == CEED_TRANSPOSE.
//     Everything after `if (!Add) for (CeedInt q=0; q` is missing.
//   * Fragments of a switch on the evaluation mode, presumably the body of
//     CeedBasisApply_Ref (its header is not visible; TODO confirm). Visible
//     pieces: scratch arrays sized nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1);
//     the argument tails of two per-dimension passes that pick their input and
//     output among u, tmp[], interp and v depending on tmode, each followed by
//     `pre /= P; post *= Q;`; and the CEED_EVAL_WEIGHT case, which returns
//     CeedError(ceed, 1, ...) when tmode == CEED_TRANSPOSE and otherwise
//     fetches qweight1d through CeedBasisGetQWeights.
//   * The tail of a destroy routine that ends with CeedFree(&impl).
//   * CeedBasisCreateTensorH1_Ref (intact): allocates a CeedBasis_Ref with
//     CeedCalloc(1, ...), allocates Q1d*Q1d entries for impl->colograd1d with
//     CeedMalloc, fills them via CeedBasisGetCollocatedGrad, attaches impl with
//     CeedBasisSetData, then registers "Apply" -> CeedBasisApply_Ref and
//     "Destroy" -> CeedBasisDestroyTensor_Ref. The parameters dim, P1d,
//     interp1d, grad1d, qref1d and qweight1d are not referenced in its body.
//   * CeedBasisCreateH1_Ref (intact): only registers "Apply" ->
//     CeedBasisApply_Ref and "Destroy" -> CeedBasisDestroyNonTensor_Ref; of its
//     parameters only basis is referenced.
//
// NOTE(review): CeedChk is defined outside this file; if it returns early on a
//   non-zero ierr (presumably), then in CeedBasisCreateTensorH1_Ref a failure
//   after CeedCalloc/CeedMalloc leaves impl and impl->colograd1d unreleased
//   -- confirm against the macro definition.
// NOTE(review): tmp[2][...] is a local array whose size depends on run-time
//   values (nelem, ncomp, Q, dim), i.e. a variable-length array; its footprint
//   grows with those values -- confirm that the expected sizes are bounded.
// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC. // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707. // All Rights reserved. See files LICENSE and NOTICE for details. // // This file is part of CEED, a collection of benchmarks, miniapps, software // libraries and APIs for efficient high-order finite element and spectral // element discretizations for exascale applications. For more information and // source code availability see http://github.com/ceed. // // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, // a collaborative effort of two U.S. Department of Energy organizations (Office // of Science and the National Nuclear Security Administration) responsible for // the planning and preparation of a capable exascale ecosystem, including // software, applications, hardware, advanced system engineering and early // testbed platforms, in support of the nation's exascale computing imperative. #include #include "ceed-ref.h" // Contracts on the middle index // NOTRANSPOSE: V_ajc = T_jb U_abc // TRANSPOSE: V_ajc = T_bj U_abc // If Add != 0, "=" is replaced by "+=" static int CeedTensorContract_Ref(Ceed ceed, CeedInt A, CeedInt B, CeedInt C, CeedInt J, const CeedScalar *restrict t, CeedTransposeMode tmode, const CeedInt Add, const CeedScalar *restrict u, CeedScalar *restrict v) { CeedInt tstride0 = B, tstride1 = 1; if (tmode == CEED_TRANSPOSE) { tstride0 = 1; tstride1 = J; } if (!Add) for (CeedInt q=0; qQ?P:Q, dim-1)]; CeedScalar *interp1d; ierr = CeedBasisGetInterp(basis, &interp1d); CeedChk(ierr); for (CeedInt d=0; dQ?P:Q, dim-1)]; CeedInt pre = ncomp*CeedIntPow(P, dim-1), post = nelem; CeedScalar tmp[2][nelem*ncomp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; CeedScalar *interp1d; ierr = CeedBasisGetInterp(basis, &interp1d); CeedChk(ierr); // Interpolate to quadrature points (NoTranspose) // or Grad to quadrature points (Transpose) for (CeedInt d=0; dcolograd1d), tmode, add&&(d>0), (tmode == CEED_NOTRANSPOSE 
? (d==0?u:tmp[d%2]) : u + d*nqpt*ncomp*nelem), (tmode == CEED_NOTRANSPOSE ? (d==dim-1?interp:tmp[(d+1)%2]) : interp)); CeedChk(ierr); pre /= P; post *= Q; } // Grad to quadrature points (NoTranspose) // or Interpolate to dofs (Transpose) P = Q1d, Q = Q1d; if (tmode == CEED_TRANSPOSE) { P = Q1d, Q = P1d; } pre = ncomp*CeedIntPow(P, dim-1), post = nelem; for (CeedInt d=0; dcolograd1d : interp1d), tmode, add&&(d==dim-1), (tmode == CEED_NOTRANSPOSE ? interp : (d==0?interp:tmp[d%2])), (tmode == CEED_NOTRANSPOSE ? v + d*nqpt*ncomp*nelem : (d==dim-1?v:tmp[(d+1)%2]))); CeedChk(ierr); pre /= P; post *= Q; } } break; // Retrieve interpolation weights case CEED_EVAL_WEIGHT: { if (tmode == CEED_TRANSPOSE) return CeedError(ceed, 1, "CEED_EVAL_WEIGHT incompatible with CEED_TRANSPOSE"); CeedInt Q = Q1d; CeedScalar *qweight1d; ierr = CeedBasisGetQWeights(basis, &qweight1d); CeedChk(ierr); for (CeedInt d=0; dcolograd1d); CeedChk(ierr); ierr = CeedFree(&impl); CeedChk(ierr); return 0; } int CeedBasisCreateTensorH1_Ref(CeedInt dim, CeedInt P1d, CeedInt Q1d, const CeedScalar *interp1d, const CeedScalar *grad1d, const CeedScalar *qref1d, const CeedScalar *qweight1d, CeedBasis basis) { int ierr; Ceed ceed; ierr = CeedBasisGetCeed(basis, &ceed); CeedChk(ierr); CeedBasis_Ref *impl; ierr = CeedCalloc(1, &impl); CeedChk(ierr); ierr = CeedMalloc(Q1d*Q1d, &impl->colograd1d); CeedChk(ierr); ierr = CeedBasisGetCollocatedGrad(basis, impl->colograd1d); CeedChk(ierr); ierr = CeedBasisSetData(basis, (void *)&impl); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Apply", CeedBasisApply_Ref); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Destroy", CeedBasisDestroyTensor_Ref); CeedChk(ierr); return 0; } int CeedBasisCreateH1_Ref(CeedElemTopology topo, CeedInt dim, CeedInt ndof, CeedInt nqpts, const CeedScalar *interp, const CeedScalar *grad, const CeedScalar *qref, const CeedScalar *qweight, CeedBasis basis) { int ierr; Ceed ceed; ierr = 
CeedBasisGetCeed(basis, &ceed); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Apply", CeedBasisApply_Ref); CeedChk(ierr); ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Destroy", CeedBasisDestroyNonTensor_Ref); CeedChk(ierr); return 0; }