// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1621617c04Sjeremylt 17ec3da8bcSJed Brown #include <ceed/ceed.h> 18ec3da8bcSJed Brown #include <ceed/backend.h> 193d576824SJeremy L Thompson #include <math.h> 203d576824SJeremy L Thompson #include <stdbool.h> 213d576824SJeremy L Thompson #include <string.h> 2221617c04Sjeremylt #include "ceed-ref.h" 2321617c04Sjeremylt 24f10650afSjeremylt //------------------------------------------------------------------------------ 25f10650afSjeremylt // Basis Apply 26f10650afSjeremylt //------------------------------------------------------------------------------ 27d1d35e2fSjeremylt static int CeedBasisApply_Ref(CeedBasis basis, CeedInt num_elem, 28d1d35e2fSjeremylt CeedTransposeMode t_mode, CeedEvalMode eval_mode, 29aedaa0e5Sjeremylt CeedVector U, CeedVector V) { 3021617c04Sjeremylt int ierr; 314ce2993fSjeremylt Ceed ceed; 32e15f9bd0SJeremy L Thompson ierr = CeedBasisGetCeed(basis, &ceed); CeedChkBackend(ierr); 33d1d35e2fSjeremylt CeedInt dim, num_comp, num_nodes, num_qpts; 34e15f9bd0SJeremy L Thompson ierr = CeedBasisGetDimension(basis, &dim); CeedChkBackend(ierr); 35d1d35e2fSjeremylt ierr = CeedBasisGetNumComponents(basis, &num_comp); CeedChkBackend(ierr); 36d1d35e2fSjeremylt ierr = CeedBasisGetNumNodes(basis, &num_nodes); CeedChkBackend(ierr); 37d1d35e2fSjeremylt ierr = CeedBasisGetNumQuadraturePoints(basis, &num_qpts); CeedChkBackend(ierr); 382f86a920SJeremy L Thompson CeedTensorContract contract; 39e15f9bd0SJeremy L Thompson ierr = CeedBasisGetTensorContract(basis, &contract); CeedChkBackend(ierr); 40d1d35e2fSjeremylt const CeedInt add = (t_mode == CEED_TRANSPOSE); 41aedaa0e5Sjeremylt const CeedScalar *u; 42aedaa0e5Sjeremylt CeedScalar *v; 43a7b7f929Sjeremylt if (U != CEED_VECTOR_NONE) { 44e15f9bd0SJeremy L Thompson ierr = CeedVectorGetArrayRead(U, CEED_MEM_HOST, &u); CeedChkBackend(ierr); 45d1d35e2fSjeremylt } else if (eval_mode != CEED_EVAL_WEIGHT) { 46c042f62fSJeremy L Thompson // LCOV_EXCL_START 47e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 
48aedaa0e5Sjeremylt "An input vector is required for this CeedEvalMode"); 49c042f62fSJeremy L Thompson // LCOV_EXCL_STOP 50aedaa0e5Sjeremylt } 51*9c774eddSJeremy L Thompson ierr = CeedVectorGetArrayWrite(V, CEED_MEM_HOST, &v); CeedChkBackend(ierr); 5221617c04Sjeremylt 538d94b059Sjeremylt // Clear v if operating in transpose 54d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 55d1d35e2fSjeremylt const CeedInt v_size = num_elem*num_comp*num_nodes; 56d1d35e2fSjeremylt for (CeedInt i = 0; i < v_size; i++) 5784a01de5SJeremy L Thompson v[i] = (CeedScalar) 0.0; 5821617c04Sjeremylt } 59d1d35e2fSjeremylt bool tensor_basis; 60d1d35e2fSjeremylt ierr = CeedBasisIsTensor(basis, &tensor_basis); CeedChkBackend(ierr); 6184a01de5SJeremy L Thompson // Tensor basis 62d1d35e2fSjeremylt if (tensor_basis) { 63d1d35e2fSjeremylt CeedInt P_1d, Q_1d; 64d1d35e2fSjeremylt ierr = CeedBasisGetNumNodes1D(basis, &P_1d); CeedChkBackend(ierr); 65d1d35e2fSjeremylt ierr = CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d); CeedChkBackend(ierr); 66d1d35e2fSjeremylt switch (eval_mode) { 678d94b059Sjeremylt // Interpolate to/from quadrature points 68a2b73c81Sjeremylt case CEED_EVAL_INTERP: { 69dfe03796SJeremy L Thompson CeedBasis_Ref *impl; 70e15f9bd0SJeremy L Thompson ierr = CeedBasisGetData(basis, &impl); CeedChkBackend(ierr); 718c1105f8SJeremy L Thompson if (impl->has_collo_interp) { 72d1d35e2fSjeremylt memcpy(v, u, num_elem*num_comp*num_nodes*sizeof(u[0])); 73dfe03796SJeremy L Thompson } else { 74d1d35e2fSjeremylt CeedInt P = P_1d, Q = Q_1d; 75d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 76d1d35e2fSjeremylt P = Q_1d; Q = P_1d; 7721617c04Sjeremylt } 78d1d35e2fSjeremylt CeedInt pre = num_comp*CeedIntPow(P, dim-1), post = num_elem; 79d1d35e2fSjeremylt CeedScalar tmp[2][num_elem*num_comp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; 80d1d35e2fSjeremylt const CeedScalar *interp_1d; 81d1d35e2fSjeremylt ierr = CeedBasisGetInterp1D(basis, &interp_1d); CeedChkBackend(ierr); 8221617c04Sjeremylt for (CeedInt d=0; d<dim; 
d++) { 832f86a920SJeremy L Thompson ierr = CeedTensorContractApply(contract, pre, P, post, Q, 84d1d35e2fSjeremylt interp_1d, t_mode, add&&(d==dim-1), 85dfe03796SJeremy L Thompson d==0?u:tmp[d%2], 86dfe03796SJeremy L Thompson d==dim-1?v:tmp[(d+1)%2]); 87e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 8821617c04Sjeremylt pre /= P; 8921617c04Sjeremylt post *= Q; 9021617c04Sjeremylt } 91dfe03796SJeremy L Thompson } 92a2b73c81Sjeremylt } break; 938d94b059Sjeremylt // Evaluate the gradient to/from quadrature points 94a2b73c81Sjeremylt case CEED_EVAL_GRAD: { 9521617c04Sjeremylt // In CEED_NOTRANSPOSE mode: 96d1d35e2fSjeremylt // u has shape [dim, num_comp, P^dim, num_elem], row-major layout 97d1d35e2fSjeremylt // v has shape [dim, num_comp, Q^dim, num_elem], row-major layout 9821617c04Sjeremylt // In CEED_TRANSPOSE mode, the sizes of u and v are switched. 99d1d35e2fSjeremylt CeedInt P = P_1d, Q = Q_1d; 100d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 101d1d35e2fSjeremylt P = Q_1d, Q = Q_1d; 10221617c04Sjeremylt } 10384a01de5SJeremy L Thompson CeedBasis_Ref *impl; 104e15f9bd0SJeremy L Thompson ierr = CeedBasisGetData(basis, &impl); CeedChkBackend(ierr); 105d1d35e2fSjeremylt CeedInt pre = num_comp*CeedIntPow(P, dim-1), post = num_elem; 106d1d35e2fSjeremylt const CeedScalar *interp_1d; 107d1d35e2fSjeremylt ierr = CeedBasisGetInterp1D(basis, &interp_1d); CeedChkBackend(ierr); 1088c1105f8SJeremy L Thompson if (impl->collo_grad_1d) { 109d1d35e2fSjeremylt CeedScalar tmp[2][num_elem*num_comp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; 110d1d35e2fSjeremylt CeedScalar interp[num_elem*num_comp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; 11184a01de5SJeremy L Thompson // Interpolate to quadrature points (NoTranspose) 11284a01de5SJeremy L Thompson // or Grad to quadrature points (Transpose) 11321617c04Sjeremylt for (CeedInt d=0; d<dim; d++) { 1142f86a920SJeremy L Thompson ierr = CeedTensorContractApply(contract, pre, P, post, Q, 115d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 116d1d35e2fSjeremylt ? 
interp_1d 1178c1105f8SJeremy L Thompson : impl->collo_grad_1d), 118d1d35e2fSjeremylt t_mode, add&&(d>0), 119d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 12084a01de5SJeremy L Thompson ? (d==0?u:tmp[d%2]) 121d1d35e2fSjeremylt : u + d*num_qpts*num_comp*num_elem), 122d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 12384a01de5SJeremy L Thompson ? (d==dim-1?interp:tmp[(d+1)%2]) 12484a01de5SJeremy L Thompson : interp)); 125e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 12621617c04Sjeremylt pre /= P; 12721617c04Sjeremylt post *= Q; 12821617c04Sjeremylt } 12984a01de5SJeremy L Thompson // Grad to quadrature points (NoTranspose) 1308795c945Sjeremylt // or Interpolate to nodes (Transpose) 131d1d35e2fSjeremylt P = Q_1d, Q = Q_1d; 132d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 133d1d35e2fSjeremylt P = Q_1d, Q = P_1d; 13484a01de5SJeremy L Thompson } 135d1d35e2fSjeremylt pre = num_comp*CeedIntPow(P, dim-1), post = num_elem; 13684a01de5SJeremy L Thompson for (CeedInt d=0; d<dim; d++) { 1372f86a920SJeremy L Thompson ierr = CeedTensorContractApply(contract, pre, P, post, Q, 138d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 1398c1105f8SJeremy L Thompson ? impl->collo_grad_1d 140d1d35e2fSjeremylt : interp_1d), 141d1d35e2fSjeremylt t_mode, add&&(d==dim-1), 142d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 14384a01de5SJeremy L Thompson ? interp 14484a01de5SJeremy L Thompson : (d==0?interp:tmp[d%2])), 145d1d35e2fSjeremylt (t_mode == CEED_NOTRANSPOSE 146d1d35e2fSjeremylt ? 
v + d*num_qpts*num_comp*num_elem 14784a01de5SJeremy L Thompson : (d==dim-1?v:tmp[(d+1)%2]))); 148e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 14984a01de5SJeremy L Thompson pre /= P; 15084a01de5SJeremy L Thompson post *= Q; 15121617c04Sjeremylt } 1528c1105f8SJeremy L Thompson } else if (impl->has_collo_interp) { // Qpts collocated with nodes 153d1d35e2fSjeremylt const CeedScalar *grad_1d; 154d1d35e2fSjeremylt ierr = CeedBasisGetGrad1D(basis, &grad_1d); CeedChkBackend(ierr); 155dfe03796SJeremy L Thompson 156dfe03796SJeremy L Thompson // Dim contractions, identity in other directions 157d1d35e2fSjeremylt CeedInt pre = num_comp*CeedIntPow(P, dim-1), post = num_elem; 158c6158135Sjeremylt for (CeedInt d=0; d<dim; d++) { 159dfe03796SJeremy L Thompson ierr = CeedTensorContractApply(contract, pre, P, post, Q, 160d1d35e2fSjeremylt grad_1d, t_mode, add&&(d>0), 161d1d35e2fSjeremylt t_mode == CEED_NOTRANSPOSE 162d1d35e2fSjeremylt ? u : u+d*num_comp*num_qpts*num_elem, 163d1d35e2fSjeremylt t_mode == CEED_TRANSPOSE 164d1d35e2fSjeremylt ? 
v : v+d*num_comp*num_qpts*num_elem); 165e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 166c6158135Sjeremylt pre /= P; 167c6158135Sjeremylt post *= Q; 168dfe03796SJeremy L Thompson } 169a7bd39daSjeremylt } else { // Underintegration, P > Q 170d1d35e2fSjeremylt const CeedScalar *grad_1d; 171d1d35e2fSjeremylt ierr = CeedBasisGetGrad1D(basis, &grad_1d); CeedChkBackend(ierr); 172a7bd39daSjeremylt 173d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 174d1d35e2fSjeremylt P = Q_1d, Q = P_1d; 175a7bd39daSjeremylt } 176d1d35e2fSjeremylt CeedScalar tmp[2][num_elem*num_comp*Q*CeedIntPow(P>Q?P:Q, dim-1)]; 177a7bd39daSjeremylt 178a7bd39daSjeremylt // Dim**2 contractions, apply grad when pass == dim 179a7bd39daSjeremylt for (CeedInt p=0; p<dim; p++) { 180d1d35e2fSjeremylt CeedInt pre = num_comp*CeedIntPow(P, dim-1), post = num_elem; 181a7bd39daSjeremylt for (CeedInt d=0; d<dim; d++) { 182a7bd39daSjeremylt ierr = CeedTensorContractApply(contract, pre, P, post, Q, 183d1d35e2fSjeremylt (p==d)? grad_1d : interp_1d, 184d1d35e2fSjeremylt t_mode, add&&(d==dim-1), 185a7bd39daSjeremylt (d == 0 186d1d35e2fSjeremylt ? (t_mode == CEED_NOTRANSPOSE 187d1d35e2fSjeremylt ? u : u+p*num_comp*num_qpts*num_elem) 188a7bd39daSjeremylt : tmp[d%2]), 189a7bd39daSjeremylt (d == dim-1 190d1d35e2fSjeremylt ? (t_mode == CEED_TRANSPOSE 191d1d35e2fSjeremylt ? 
v : v+p*num_comp*num_qpts*num_elem) 192a7bd39daSjeremylt : tmp[(d+1)%2])); 193e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 194a7bd39daSjeremylt pre /= P; 195a7bd39daSjeremylt post *= Q; 196a7bd39daSjeremylt } 197a7bd39daSjeremylt } 198a7bd39daSjeremylt } 199a2b73c81Sjeremylt } break; 2008d94b059Sjeremylt // Retrieve interpolation weights 201a2b73c81Sjeremylt case CEED_EVAL_WEIGHT: { 202d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) 203c042f62fSJeremy L Thompson // LCOV_EXCL_START 204e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 20521617c04Sjeremylt "CEED_EVAL_WEIGHT incompatible with CEED_TRANSPOSE"); 206c042f62fSJeremy L Thompson // LCOV_EXCL_STOP 207d1d35e2fSjeremylt CeedInt Q = Q_1d; 208d1d35e2fSjeremylt const CeedScalar *q_weight_1d; 209d1d35e2fSjeremylt ierr = CeedBasisGetQWeights(basis, &q_weight_1d); CeedChkBackend(ierr); 21021617c04Sjeremylt for (CeedInt d=0; d<dim; d++) { 211b5cf12eeSjeremylt CeedInt pre = CeedIntPow(Q, dim-d-1), post = CeedIntPow(Q, d); 212a2b73c81Sjeremylt for (CeedInt i=0; i<pre; i++) 213a2b73c81Sjeremylt for (CeedInt j=0; j<Q; j++) 21484a01de5SJeremy L Thompson for (CeedInt k=0; k<post; k++) { 215d1d35e2fSjeremylt CeedScalar w = q_weight_1d[j] 216d1d35e2fSjeremylt * (d == 0 ? 
1 : v[((i*Q + j)*post + k)*num_elem]); 217d1d35e2fSjeremylt for (CeedInt e=0; e<num_elem; e++) 218d1d35e2fSjeremylt v[((i*Q + j)*post + k)*num_elem + e] = w; 21984a01de5SJeremy L Thompson } 22021617c04Sjeremylt } 221a2b73c81Sjeremylt } break; 222c042f62fSJeremy L Thompson // LCOV_EXCL_START 2238d94b059Sjeremylt // Evaluate the divergence to/from the quadrature points 224a2b73c81Sjeremylt case CEED_EVAL_DIV: 225e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_DIV not supported"); 2268d94b059Sjeremylt // Evaluate the curl to/from the quadrature points 227a2b73c81Sjeremylt case CEED_EVAL_CURL: 228e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_CURL not supported"); 2298d94b059Sjeremylt // Take no action, BasisApply should not have been called 230a2b73c81Sjeremylt case CEED_EVAL_NONE: 231e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 2324b8bea3bSJed Brown "CEED_EVAL_NONE does not make sense in this context"); 233c042f62fSJeremy L Thompson // LCOV_EXCL_STOP 23421617c04Sjeremylt } 235a8de75f0Sjeremylt } else { 236a8de75f0Sjeremylt // Non-tensor basis 237d1d35e2fSjeremylt switch (eval_mode) { 23884a01de5SJeremy L Thompson // Interpolate to/from quadrature points 239a8de75f0Sjeremylt case CEED_EVAL_INTERP: { 240d1d35e2fSjeremylt CeedInt P = num_nodes, Q = num_qpts; 2416c58de82SJeremy L Thompson const CeedScalar *interp; 242e15f9bd0SJeremy L Thompson ierr = CeedBasisGetInterp(basis, &interp); CeedChkBackend(ierr); 243d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 244d1d35e2fSjeremylt P = num_qpts; Q = num_nodes; 245a8de75f0Sjeremylt } 246d1d35e2fSjeremylt ierr = CeedTensorContractApply(contract, num_comp, P, num_elem, Q, 247d1d35e2fSjeremylt interp, t_mode, add, u, v); 248e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 249a8de75f0Sjeremylt } 250a8de75f0Sjeremylt break; 25184a01de5SJeremy L Thompson // Evaluate the gradient to/from quadrature points 252a8de75f0Sjeremylt case 
CEED_EVAL_GRAD: { 253d1d35e2fSjeremylt CeedInt P = num_nodes, Q = num_qpts; 254d1d35e2fSjeremylt CeedInt dim_stride = num_qpts * num_comp * num_elem; 255d1d35e2fSjeremylt CeedInt grad_stride = num_qpts * num_nodes; 2566c58de82SJeremy L Thompson const CeedScalar *grad; 257e15f9bd0SJeremy L Thompson ierr = CeedBasisGetGrad(basis, &grad); CeedChkBackend(ierr); 258d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) { 259d1d35e2fSjeremylt P = num_qpts; Q = num_nodes; 260475a782bSnbeams for (CeedInt d = 0; d < dim; d++) { 261d1d35e2fSjeremylt ierr = CeedTensorContractApply(contract, num_comp, P, num_elem, Q, 262d1d35e2fSjeremylt grad + d * grad_stride, t_mode, add, 263d1d35e2fSjeremylt u + d * dim_stride, v); CeedChkBackend(ierr); 264475a782bSnbeams } 265475a782bSnbeams } else { 266475a782bSnbeams for (CeedInt d = 0; d < dim; d++) { 267d1d35e2fSjeremylt ierr = CeedTensorContractApply(contract, num_comp, P, num_elem, Q, 268d1d35e2fSjeremylt grad + d * grad_stride, t_mode, add, 269d1d35e2fSjeremylt u, v + d * dim_stride); CeedChkBackend(ierr); 270475a782bSnbeams } 271475a782bSnbeams } 272a8de75f0Sjeremylt } 273a8de75f0Sjeremylt break; 27484a01de5SJeremy L Thompson // Retrieve interpolation weights 275a8de75f0Sjeremylt case CEED_EVAL_WEIGHT: { 276d1d35e2fSjeremylt if (t_mode == CEED_TRANSPOSE) 277c042f62fSJeremy L Thompson // LCOV_EXCL_START 278e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 279a8de75f0Sjeremylt "CEED_EVAL_WEIGHT incompatible with CEED_TRANSPOSE"); 280c042f62fSJeremy L Thompson // LCOV_EXCL_STOP 281d1d35e2fSjeremylt const CeedScalar *q_weight; 282d1d35e2fSjeremylt ierr = CeedBasisGetQWeights(basis, &q_weight); CeedChkBackend(ierr); 283d1d35e2fSjeremylt for (CeedInt i=0; i<num_qpts; i++) 284d1d35e2fSjeremylt for (CeedInt e=0; e<num_elem; e++) 285d1d35e2fSjeremylt v[i*num_elem + e] = q_weight[i]; 286a8de75f0Sjeremylt } break; 287c042f62fSJeremy L Thompson // LCOV_EXCL_START 28884a01de5SJeremy L Thompson // Evaluate the divergence to/from the 
quadrature points 289a8de75f0Sjeremylt case CEED_EVAL_DIV: 290e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_DIV not supported"); 29184a01de5SJeremy L Thompson // Evaluate the curl to/from the quadrature points 292a8de75f0Sjeremylt case CEED_EVAL_CURL: 293e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_CURL not supported"); 29484a01de5SJeremy L Thompson // Take no action, BasisApply should not have been called 295a8de75f0Sjeremylt case CEED_EVAL_NONE: 296e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 297a8de75f0Sjeremylt "CEED_EVAL_NONE does not make sense in this context"); 298c042f62fSJeremy L Thompson // LCOV_EXCL_STOP 299a8de75f0Sjeremylt } 300a8de75f0Sjeremylt } 301a7b7f929Sjeremylt if (U != CEED_VECTOR_NONE) { 302e15f9bd0SJeremy L Thompson ierr = CeedVectorRestoreArrayRead(U, &u); CeedChkBackend(ierr); 303aedaa0e5Sjeremylt } 304e15f9bd0SJeremy L Thompson ierr = CeedVectorRestoreArray(V, &v); CeedChkBackend(ierr); 305e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 30621617c04Sjeremylt } 30721617c04Sjeremylt 308f10650afSjeremylt //------------------------------------------------------------------------------ 309f10650afSjeremylt // Basis Create Non-Tensor 310f10650afSjeremylt //------------------------------------------------------------------------------ 311f10650afSjeremylt int CeedBasisCreateH1_Ref(CeedElemTopology topo, CeedInt dim, 312d1d35e2fSjeremylt CeedInt num_nodes, CeedInt num_qpts, 313f10650afSjeremylt const CeedScalar *interp, 314f10650afSjeremylt const CeedScalar *grad, 315d1d35e2fSjeremylt const CeedScalar *q_ref, 316d1d35e2fSjeremylt const CeedScalar *q_weight, 317f10650afSjeremylt CeedBasis basis) { 318f10650afSjeremylt int ierr; 319f10650afSjeremylt Ceed ceed; 320e15f9bd0SJeremy L Thompson ierr = CeedBasisGetCeed(basis, &ceed); CeedChkBackend(ierr); 321f10650afSjeremylt 322f10650afSjeremylt Ceed parent; 323e15f9bd0SJeremy L Thompson ierr = 
CeedGetParent(ceed, &parent); CeedChkBackend(ierr); 324f10650afSjeremylt CeedTensorContract contract; 325e15f9bd0SJeremy L Thompson ierr = CeedTensorContractCreate(parent, basis, &contract); CeedChkBackend(ierr); 32634359f16Sjeremylt ierr = CeedBasisSetTensorContract(basis, contract); CeedChkBackend(ierr); 327f10650afSjeremylt 328f10650afSjeremylt ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Apply", 329e15f9bd0SJeremy L Thompson CeedBasisApply_Ref); CeedChkBackend(ierr); 330f10650afSjeremylt 331e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 332f10650afSjeremylt } 333f10650afSjeremylt 334f10650afSjeremylt //------------------------------------------------------------------------------ 335f10650afSjeremylt // Basis Destroy Tensor 336f10650afSjeremylt //------------------------------------------------------------------------------ 33784a01de5SJeremy L Thompson static int CeedBasisDestroyTensor_Ref(CeedBasis basis) { 33884a01de5SJeremy L Thompson int ierr; 3392f86a920SJeremy L Thompson 34084a01de5SJeremy L Thompson CeedBasis_Ref *impl; 341e15f9bd0SJeremy L Thompson ierr = CeedBasisGetData(basis, &impl); CeedChkBackend(ierr); 3428c1105f8SJeremy L Thompson ierr = CeedFree(&impl->collo_grad_1d); CeedChkBackend(ierr); 343e15f9bd0SJeremy L Thompson ierr = CeedFree(&impl); CeedChkBackend(ierr); 34484a01de5SJeremy L Thompson 345e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 34621617c04Sjeremylt } 34721617c04Sjeremylt 348f10650afSjeremylt //------------------------------------------------------------------------------ 349f10650afSjeremylt // Basis Create Tensor 350f10650afSjeremylt //------------------------------------------------------------------------------ 351d1d35e2fSjeremylt int CeedBasisCreateTensorH1_Ref(CeedInt dim, CeedInt P_1d, 352d1d35e2fSjeremylt CeedInt Q_1d, const CeedScalar *interp_1d, 353d1d35e2fSjeremylt const CeedScalar *grad_1d, 354d1d35e2fSjeremylt const CeedScalar *q_ref_1d, 355d1d35e2fSjeremylt const CeedScalar *q_weight_1d, 
35621617c04Sjeremylt CeedBasis basis) { 357fe2413ffSjeremylt int ierr; 358fe2413ffSjeremylt Ceed ceed; 359e15f9bd0SJeremy L Thompson ierr = CeedBasisGetCeed(basis, &ceed); CeedChkBackend(ierr); 36084a01de5SJeremy L Thompson CeedBasis_Ref *impl; 361e15f9bd0SJeremy L Thompson ierr = CeedCalloc(1, &impl); CeedChkBackend(ierr); 362dfe03796SJeremy L Thompson // Check for collocated interp 363d1d35e2fSjeremylt if (Q_1d == P_1d) { 364dfe03796SJeremy L Thompson bool collocated = 1; 365d1d35e2fSjeremylt for (CeedInt i=0; i<P_1d; i++) { 366d1d35e2fSjeremylt collocated = collocated && (fabs(interp_1d[i+P_1d*i] - 1.0) < 1e-14); 367d1d35e2fSjeremylt for (CeedInt j=0; j<P_1d; j++) 368dfe03796SJeremy L Thompson if (j != i) 369d1d35e2fSjeremylt collocated = collocated && (fabs(interp_1d[j+P_1d*i]) < 1e-14); 370dfe03796SJeremy L Thompson } 3718c1105f8SJeremy L Thompson impl->has_collo_interp = collocated; 372dfe03796SJeremy L Thompson } 373dfe03796SJeremy L Thompson // Calculate collocated grad 3748c1105f8SJeremy L Thompson if (Q_1d >= P_1d && !impl->has_collo_interp) { 3758c1105f8SJeremy L Thompson ierr = CeedMalloc(Q_1d*Q_1d, &impl->collo_grad_1d); CeedChkBackend(ierr); 3768c1105f8SJeremy L Thompson ierr = CeedBasisGetCollocatedGrad(basis, impl->collo_grad_1d); 377e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 378a7bd39daSjeremylt } 379e15f9bd0SJeremy L Thompson ierr = CeedBasisSetData(basis, impl); CeedChkBackend(ierr); 380fe2413ffSjeremylt 3812f86a920SJeremy L Thompson Ceed parent; 382e15f9bd0SJeremy L Thompson ierr = CeedGetParent(ceed, &parent); CeedChkBackend(ierr); 3832f86a920SJeremy L Thompson CeedTensorContract contract; 384e15f9bd0SJeremy L Thompson ierr = CeedTensorContractCreate(parent, basis, &contract); CeedChkBackend(ierr); 38534359f16Sjeremylt ierr = CeedBasisSetTensorContract(basis, contract); CeedChkBackend(ierr); 3862f86a920SJeremy L Thompson 387fe2413ffSjeremylt ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Apply", 388e15f9bd0SJeremy L Thompson 
CeedBasisApply_Ref); CeedChkBackend(ierr); 389fe2413ffSjeremylt ierr = CeedSetBackendFunction(ceed, "Basis", basis, "Destroy", 390e15f9bd0SJeremy L Thompson CeedBasisDestroyTensor_Ref); CeedChkBackend(ierr); 391e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 39221617c04Sjeremylt } 393a8de75f0Sjeremylt 394f10650afSjeremylt //------------------------------------------------------------------------------ 395