13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 321617c04Sjeremylt // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 521617c04Sjeremylt // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 721617c04Sjeremylt 849aac155SJeremy L Thompson #include <ceed.h> 9ec3da8bcSJed Brown #include <ceed/backend.h> 103d576824SJeremy L Thompson #include <stdbool.h> 113d576824SJeremy L Thompson #include <stddef.h> 123d576824SJeremy L Thompson #include <stdint.h> 132b730f8bSJeremy L Thompson 1421617c04Sjeremylt #include "ceed-ref.h" 1521617c04Sjeremylt 16f10650afSjeremylt //------------------------------------------------------------------------------ 17f10650afSjeremylt // Setup Input/Output Fields 18f10650afSjeremylt //------------------------------------------------------------------------------ 192b730f8bSJeremy L Thompson static int CeedOperatorSetupFields_Ref(CeedQFunction qf, CeedOperator op, bool is_input, CeedVector *e_vecs_full, CeedVector *e_vecs, 202b730f8bSJeremy L Thompson CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, CeedInt Q) { 21aedaa0e5Sjeremylt Ceed ceed; 22ad70ee2cSJeremy L Thompson CeedSize e_size, q_size; 23ad70ee2cSJeremy L Thompson CeedInt num_comp, size, P; 24d1d35e2fSjeremylt CeedQFunctionField *qf_fields; 25ad70ee2cSJeremy L Thompson CeedOperatorField *op_fields; 26ad70ee2cSJeremy L Thompson 27ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 284fc1f125SJeremy L Thompson if (is_input) { 292b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 302b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 314fc1f125SJeremy L Thompson } else { 322b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 332b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 34fe2413ffSjeremylt } 3521617c04Sjeremylt 36885ac19cSjeremylt // Loop over fields 37d1d35e2fSjeremylt for (CeedInt i = 0; i < num_fields; i++) { 38d1d35e2fSjeremylt CeedEvalMode eval_mode; 39edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 40ad70ee2cSJeremy L Thompson CeedBasis basis; 41d1d35e2fSjeremylt 42ad70ee2cSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 43d1d35e2fSjeremylt if (eval_mode != CEED_EVAL_WEIGHT) { 44edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 45edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 46135a076eSjeremylt } 47135a076eSjeremylt 48d1d35e2fSjeremylt switch (eval_mode) { 49885ac19cSjeremylt case CEED_EVAL_NONE: 502b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 51d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 522b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 53aedaa0e5Sjeremylt break; 54aedaa0e5Sjeremylt case CEED_EVAL_INTERP: 55885ac19cSjeremylt case CEED_EVAL_GRAD: 56a915a514Srezgarshakeri case CEED_EVAL_DIV: 57c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 582b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 592b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 602b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 612b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 62d2643443SJeremy L Thompson e_size = (CeedSize)P * num_comp; 632b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 64d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 652b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 66885ac19cSjeremylt break; 67885ac19cSjeremylt case CEED_EVAL_WEIGHT: // Only on input fields 682b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 69d2643443SJeremy L Thompson q_size = (CeedSize)Q; 702b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 712b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_vecs[i])); 72885ac19cSjeremylt break; 7321617c04Sjeremylt } 74885ac19cSjeremylt } 75e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 7621617c04Sjeremylt } 7721617c04Sjeremylt 78f10650afSjeremylt //------------------------------------------------------------------------------ 79f10650afSjeremylt // Setup Operator 80f10650afSjeremylt //------------------------------------------------------------------------------/* 81885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) { 828c1105f8SJeremy L Thompson bool is_setup_done; 83ad70ee2cSJeremy L Thompson Ceed ceed; 84ad70ee2cSJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 85ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 86ad70ee2cSJeremy L Thompson CeedQFunction qf; 87ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 88ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 89ad70ee2cSJeremy L Thompson 902b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 918c1105f8SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 92ad70ee2cSJeremy L Thompson 932b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 942b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 952b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 962b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 972b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 982b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 992b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 100885ac19cSjeremylt 101885ac19cSjeremylt // Allocate 1022b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 103885ac19cSjeremylt 1042b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 1052b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 1062b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 1072b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 1082b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 109885ac19cSjeremylt 1104fc1f125SJeremy L Thompson impl->num_inputs = num_input_fields; 1114fc1f125SJeremy L Thompson impl->num_outputs = num_output_fields; 112885ac19cSjeremylt 113d1d35e2fSjeremylt // Set up infield and outfield e_vecs and q_vecs 114885ac19cSjeremylt // Infields 1152b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, true, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, num_input_fields, Q)); 116885ac19cSjeremylt // Outfields 1172b730f8bSJeremy L Thompson CeedCallBackend( 1182b730f8bSJeremy L Thompson CeedOperatorSetupFields_Ref(qf, op, false, impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 119885ac19cSjeremylt 12016911fdaSjeremylt // Identity QFunctions 1210b454692Sjeremylt if (impl->is_identity_qf) { 122d1d35e2fSjeremylt CeedEvalMode in_mode, out_mode; 123d1d35e2fSjeremylt CeedQFunctionField *in_fields, *out_fields; 124ad70ee2cSJeremy L Thompson 1252b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 1262b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 1272b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 128d1d35e2fSjeremylt 1290b454692Sjeremylt if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 130edb2538eSJeremy L Thompson impl->is_identity_rstr_op = true; 1310b454692Sjeremylt } else { 132db002c03SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 13316911fdaSjeremylt } 13416911fdaSjeremylt } 13516911fdaSjeremylt 1362b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 137e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 138885ac19cSjeremylt } 139885ac19cSjeremylt 140f10650afSjeremylt //------------------------------------------------------------------------------ 141f10650afSjeremylt // Setup Operator Inputs 142f10650afSjeremylt //------------------------------------------------------------------------------ 1432b730f8bSJeremy L Thompson static inline int CeedOperatorSetupInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 1442b730f8bSJeremy L Thompson CeedVector in_vec, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 145a0162de9SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 146ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 147ad70ee2cSJeremy L Thompson uint64_t state; 148d1d35e2fSjeremylt CeedEvalMode eval_mode; 149d1bcdac9Sjeremylt CeedVector vec; 150edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 151885ac19cSjeremylt 152d1bcdac9Sjeremylt // Get input vector 1532b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1541d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1552b730f8bSJeremy L Thompson if (skip_active) continue; 1562b730f8bSJeremy L Thompson else vec = in_vec; 1571d102b48SJeremy L Thompson } 1581d102b48SJeremy L Thompson 1592b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1601d102b48SJeremy L Thompson // Restrict and Evec 161d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 1621d102b48SJeremy L Thompson } else { 163668048e2SJed Brown // Restrict 1642b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 1658d713cf6Sjeremylt // Skip restriction if input is unchanged 1664fc1f125SJeremy L Thompson if (state != impl->input_states[i] || vec == in_vec) { 167edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 168edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 1694fc1f125SJeremy L Thompson impl->input_states[i] = state; 1708d713cf6Sjeremylt } 171668048e2SJed Brown // Get evec 1722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data_full[i])); 173885ac19cSjeremylt } 174885ac19cSjeremylt } 175e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 176885ac19cSjeremylt } 177885ac19cSjeremylt 178f10650afSjeremylt //------------------------------------------------------------------------------ 179f10650afSjeremylt // Input Basis Action 180f10650afSjeremylt //------------------------------------------------------------------------------ 1812b730f8bSJeremy L Thompson static inline int CeedOperatorInputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 1822b730f8bSJeremy L Thompson CeedInt num_input_fields, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 1832b730f8bSJeremy L Thompson CeedOperator_Ref *impl) { 184ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 185a915a514Srezgarshakeri CeedInt elem_size, size, num_comp; 186d1d35e2fSjeremylt CeedEvalMode eval_mode; 187edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 1881d102b48SJeremy L Thompson CeedBasis basis; 1891d102b48SJeremy L Thompson 1901d102b48SJeremy L Thompson // Skip active input 191d1d35e2fSjeremylt if (skip_active) { 1921d102b48SJeremy L Thompson CeedVector vec; 193ad70ee2cSJeremy L Thompson 1942b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1952b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 1961d102b48SJeremy L Thompson } 197d1d35e2fSjeremylt // Get elem_size, eval_mode, size 198edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 199edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2002b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2012b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 202885ac19cSjeremylt // Basis action 203d1d35e2fSjeremylt switch (eval_mode) { 204885ac19cSjeremylt case CEED_EVAL_NONE: 2052b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][e * Q * size])); 206885ac19cSjeremylt break; 207885ac19cSjeremylt case CEED_EVAL_INTERP: 208885ac19cSjeremylt case CEED_EVAL_GRAD: 209a915a514Srezgarshakeri case CEED_EVAL_DIV: 210c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 211a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 212a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 213a915a514Srezgarshakeri CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][e * elem_size * num_comp])); 214c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, eval_mode, impl->e_vecs_in[i], impl->q_vecs_in[i])); 215a915a514Srezgarshakeri break; 216885ac19cSjeremylt case CEED_EVAL_WEIGHT: 217885ac19cSjeremylt break; // No action 218885ac19cSjeremylt } 219885ac19cSjeremylt } 220e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 221885ac19cSjeremylt } 222885ac19cSjeremylt 223f10650afSjeremylt //------------------------------------------------------------------------------ 224f10650afSjeremylt // Output Basis Action 225f10650afSjeremylt //------------------------------------------------------------------------------ 2262b730f8bSJeremy L Thompson static inline int CeedOperatorOutputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_output_fields, CeedOperatorField *op_output_fields, 227d1d35e2fSjeremylt CeedInt num_input_fields, CeedInt num_output_fields, CeedOperator op, 2284fc1f125SJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 229ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 230a915a514Srezgarshakeri CeedInt elem_size, num_comp; 231d1d35e2fSjeremylt CeedEvalMode eval_mode; 232edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2331d102b48SJeremy L Thompson CeedBasis basis; 2341d102b48SJeremy L Thompson 235a915a514Srezgarshakeri // Get elem_size, eval_mode 236edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 237edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2382b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 239885ac19cSjeremylt // Basis action 240d1d35e2fSjeremylt switch (eval_mode) { 241885ac19cSjeremylt case CEED_EVAL_NONE: 242885ac19cSjeremylt break; // No action 243885ac19cSjeremylt case CEED_EVAL_INTERP: 244885ac19cSjeremylt case CEED_EVAL_GRAD: 245a915a514Srezgarshakeri case CEED_EVAL_DIV: 246c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 247a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 248a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 249a915a514Srezgarshakeri CeedCallBackend( 250a915a514Srezgarshakeri CeedVectorSetArray(impl->e_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][e * elem_size * num_comp])); 251c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 252a915a514Srezgarshakeri break; 253c042f62fSJeremy L Thompson // LCOV_EXCL_START 254bbfacfcdSjeremylt case CEED_EVAL_WEIGHT: { 2554ce2993fSjeremylt Ceed ceed; 256ad70ee2cSJeremy L Thompson 2572b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 2586574a04fSJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 2591d102b48SJeremy L Thompson // LCOV_EXCL_STOP 260885ac19cSjeremylt } 261885ac19cSjeremylt } 262885ac19cSjeremylt } 263e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 2641d102b48SJeremy L Thompson } 2651d102b48SJeremy L Thompson 266f10650afSjeremylt //------------------------------------------------------------------------------ 267f10650afSjeremylt // Restore Input Vectors 268f10650afSjeremylt //------------------------------------------------------------------------------ 2692b730f8bSJeremy L Thompson static inline int CeedOperatorRestoreInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2702b730f8bSJeremy L Thompson const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 271ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 272d1d35e2fSjeremylt CeedEvalMode eval_mode; 2731d102b48SJeremy L Thompson 2741d102b48SJeremy L Thompson // Skip active inputs 275d1d35e2fSjeremylt if (skip_active) { 2761d102b48SJeremy L Thompson CeedVector vec; 277ad70ee2cSJeremy L Thompson 2782b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 2792b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 2801d102b48SJeremy L Thompson } 2811d102b48SJeremy L Thompson // Restore input 2822b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 283d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 2841d102b48SJeremy L Thompson } else { 2852b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data_full[i])); 2861d102b48SJeremy L Thompson } 2871d102b48SJeremy L Thompson } 288e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 2891d102b48SJeremy L Thompson } 2901d102b48SJeremy L Thompson 291f10650afSjeremylt //------------------------------------------------------------------------------ 292f10650afSjeremylt // Operator Apply 293f10650afSjeremylt //------------------------------------------------------------------------------ 2942b730f8bSJeremy L Thompson static int CeedOperatorApplyAdd_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 295d1d35e2fSjeremylt CeedInt Q, num_elem, num_input_fields, num_output_fields, size; 296ad70ee2cSJeremy L Thompson CeedEvalMode eval_mode; 297ad70ee2cSJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 298ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 299ad70ee2cSJeremy L Thompson CeedQFunction qf; 300ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 301ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 302ad70ee2cSJeremy L Thompson 303ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 304ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 3052b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 3062b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 3072b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 3082b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 3091d102b48SJeremy L Thompson 3101d102b48SJeremy L Thompson // Setup 3112b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 3121d102b48SJeremy L Thompson 3130b454692Sjeremylt // Restriction only operator 314edb2538eSJeremy L Thompson if (impl->is_identity_rstr_op) { 315edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 316ad70ee2cSJeremy L Thompson 317edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[0], &elem_rstr)); 318edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_full[0], request)); 319edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[0], &elem_rstr)); 320edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[0], out_vec, request)); 3210b454692Sjeremylt return CEED_ERROR_SUCCESS; 3220b454692Sjeremylt } 3230b454692Sjeremylt 3241d102b48SJeremy L Thompson // Input Evecs and Restriction 3252b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, false, e_data_full, impl, request)); 3261d102b48SJeremy L Thompson 3271d102b48SJeremy L Thompson // Output Evecs 328d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 3292b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_full[i + impl->num_inputs], CEED_MEM_HOST, &e_data_full[i + num_input_fields])); 3301d102b48SJeremy L Thompson } 3311d102b48SJeremy L Thompson 3321d102b48SJeremy L Thompson // Loop through elements 333d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 3341d102b48SJeremy L Thompson // Output pointers 335d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 3362b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 337d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_NONE) { 3382b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 3392b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][e * Q * size])); 3401d102b48SJeremy L Thompson } 3411d102b48SJeremy L Thompson } 3421d102b48SJeremy L Thompson 34316911fdaSjeremylt // Input basis apply 3442b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, false, e_data_full, impl)); 34516911fdaSjeremylt 3461d102b48SJeremy L Thompson // Q function 3470b454692Sjeremylt if (!impl->is_identity_qf) { 3482b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 34916911fdaSjeremylt } 3501d102b48SJeremy L Thompson 3511d102b48SJeremy L Thompson // Output basis apply 3522b730f8bSJeremy L Thompson CeedCallBackend( 3532b730f8bSJeremy L Thompson CeedOperatorOutputBasis_Ref(e, Q, qf_output_fields, op_output_fields, num_input_fields, num_output_fields, op, e_data_full, impl)); 3541d102b48SJeremy L Thompson } 355885ac19cSjeremylt 356885ac19cSjeremylt // Output restriction 357d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 358ad70ee2cSJeremy L Thompson CeedVector vec; 359edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 360ad70ee2cSJeremy L Thompson 361d1d35e2fSjeremylt // Restore Evec 3622b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_full[i + impl->num_inputs], &e_data_full[i + num_input_fields])); 363d1bcdac9Sjeremylt // Get output vector 3642b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 365668048e2SJed Brown // Active 3662b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 3677ca8db16Sjeremylt // Restrict 368edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 369edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[i + impl->num_inputs], vec, request)); 370885ac19cSjeremylt } 371885ac19cSjeremylt 3727ca8db16Sjeremylt // Restore input arrays 3732b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, false, e_data_full, impl)); 374e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 37521617c04Sjeremylt } 37621617c04Sjeremylt 377f10650afSjeremylt //------------------------------------------------------------------------------ 37870a7ffb3SJeremy L Thompson // Core code for assembling linear QFunction 379f10650afSjeremylt //------------------------------------------------------------------------------ 3802b730f8bSJeremy L Thompson static inline int CeedOperatorLinearAssembleQFunctionCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, CeedElemRestriction *rstr, 38170a7ffb3SJeremy L Thompson CeedRequest *request) { 382ca735530SJeremy L Thompson Ceed ceed, ceed_ceed_parent; 383e984cf9aSJeremy L Thompson CeedSize q_size; 384ad70ee2cSJeremy L Thompson CeedInt num_active_in, num_active_out, Q, num_elem, num_input_fields, num_output_fields, size; 385ad70ee2cSJeremy L Thompson CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 386ad70ee2cSJeremy L Thompson CeedVector *active_in; 387ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 388ad70ee2cSJeremy L Thompson CeedQFunction qf; 389ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 390ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 391ad70ee2cSJeremy L Thompson 3922b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 393ca735530SJeremy L Thompson CeedCallBackend(CeedOperatorGetFallbackParentCeed(op, &ceed_ceed_parent)); 394e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 395e984cf9aSJeremy L Thompson active_in = impl->qf_active_in; 396e984cf9aSJeremy L Thompson num_active_in = impl->num_active_in, num_active_out = impl->num_active_out; 397e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 398e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 399e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 400e984cf9aSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 401e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 4021d102b48SJeremy L Thompson 4031d102b48SJeremy L Thompson // Setup 4042b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 4051d102b48SJeremy L Thompson 406506b1a0cSSebastian Grimberg // Check for restriction only operator 407506b1a0cSSebastian Grimberg CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 40816911fdaSjeremylt 4091d102b48SJeremy L Thompson // Input Evecs and Restriction 4102b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 4111d102b48SJeremy L Thompson 4121d102b48SJeremy L Thompson // Count number of active input fields 413bb219a0fSJeremy L Thompson if (!num_active_in) { 414d1d35e2fSjeremylt for (CeedInt i = 0; i < num_input_fields; i++) { 415ad70ee2cSJeremy L Thompson CeedScalar *q_vec_array; 416ad70ee2cSJeremy L Thompson CeedVector vec; 417ad70ee2cSJeremy L Thompson 4181d102b48SJeremy L Thompson // Get input vector 4192b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 4201d102b48SJeremy L Thompson // Check if active input 4211d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 4222b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 4232b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 424ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &q_vec_array)); 4252b730f8bSJeremy L Thompson CeedCallBackend(CeedRealloc(num_active_in + size, &active_in)); 4261d102b48SJeremy L Thompson for (CeedInt field = 0; field < size; field++) { 427d2643443SJeremy L Thompson q_size = (CeedSize)Q; 4282b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &active_in[num_active_in + field])); 429ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(active_in[num_active_in + field], CEED_MEM_HOST, CEED_USE_POINTER, &q_vec_array[field * Q])); 4301d102b48SJeremy L Thompson } 431d1d35e2fSjeremylt num_active_in += size; 432ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &q_vec_array)); 4331d102b48SJeremy L Thompson } 4341d102b48SJeremy L Thompson } 4354fc1f125SJeremy L Thompson impl->num_active_in = num_active_in; 436bb219a0fSJeremy L Thompson impl->qf_active_in = active_in; 437bb219a0fSJeremy L Thompson } 4381d102b48SJeremy L Thompson 4391d102b48SJeremy L Thompson // Count number of active output fields 440bb219a0fSJeremy L Thompson if (!num_active_out) { 441d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 442ad70ee2cSJeremy L Thompson CeedVector vec; 443ad70ee2cSJeremy L Thompson 4441d102b48SJeremy L Thompson // Get output vector 4452b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 4461d102b48SJeremy L Thompson // Check if active output 4471d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 4482b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 449d1d35e2fSjeremylt num_active_out += size; 4501d102b48SJeremy L Thompson } 4511d102b48SJeremy L Thompson } 4524fc1f125SJeremy L Thompson impl->num_active_out = num_active_out; 453bb219a0fSJeremy L Thompson } 4541d102b48SJeremy L Thompson 4551d102b48SJeremy L Thompson // Check sizes 4566574a04fSJeremy L Thompson CeedCheck(num_active_in > 0 && num_active_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 4571d102b48SJeremy L Thompson 45870a7ffb3SJeremy L Thompson // Build objects if needed 45970a7ffb3SJeremy L Thompson if (build_objects) { 460ad70ee2cSJeremy L Thompson const CeedSize l_size = (CeedSize)num_elem * Q * num_active_in * num_active_out; 461d1d35e2fSjeremylt CeedInt strides[3] = {1, Q, num_active_in * num_active_out * Q}; /* *NOPAD* */ 462ad70ee2cSJeremy L Thompson 463ad70ee2cSJeremy L Thompson // Create output restriction 464ca735530SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateStrided(ceed_ceed_parent, num_elem, Q, num_active_in * num_active_out, 4652b730f8bSJeremy L Thompson num_active_in * num_active_out * num_elem * Q, strides, rstr)); 4661d102b48SJeremy L Thompson // Create assembled vector 467ca735530SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_ceed_parent, l_size, assembled)); 46870a7ffb3SJeremy L Thompson } 46970a7ffb3SJeremy L Thompson // Clear output vector 4702b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 471ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 4721d102b48SJeremy L Thompson 4731d102b48SJeremy L Thompson // Loop through elements 474d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 4751d102b48SJeremy L Thompson // Input basis apply 4762b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, true, e_data_full, impl)); 4771d102b48SJeremy L Thompson 4781d102b48SJeremy L Thompson // Assemble QFunction 479d1d35e2fSjeremylt for (CeedInt in = 0; in < num_active_in; in++) { 4801d102b48SJeremy L Thompson // Set Inputs 4812b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(active_in[in], 1.0)); 482d1d35e2fSjeremylt if (num_active_in > 1) { 4832b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(active_in[(in + num_active_in - 1) % num_active_in], 0.0)); 48442ea3801Sjeremylt } 485506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 4861d102b48SJeremy L Thompson // Set Outputs 487d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 488ad70ee2cSJeremy L Thompson CeedVector vec; 489ad70ee2cSJeremy L Thompson 4901d102b48SJeremy L Thompson // Get output vector 4912b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 4921d102b48SJeremy L Thompson // Check if active output 4931d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 494ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 4952b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &size)); 496ad70ee2cSJeremy L Thompson assembled_array += size * Q; // Advance the pointer by the size of the output 4971d102b48SJeremy L Thompson } 4981d102b48SJeremy L Thompson } 4991d102b48SJeremy L Thompson // Apply QFunction 5002b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 501506b1a0cSSebastian Grimberg } else { 502506b1a0cSSebastian Grimberg const CeedScalar *q_vec_array; 503506b1a0cSSebastian Grimberg 504506b1a0cSSebastian Grimberg // Copy Identity Outputs 505506b1a0cSSebastian Grimberg CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &size)); 506506b1a0cSSebastian Grimberg CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &q_vec_array)); 507506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < size * Q; i++) assembled_array[i] = q_vec_array[i]; 508506b1a0cSSebastian Grimberg CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &q_vec_array)); 509506b1a0cSSebastian Grimberg assembled_array += size * Q; 510506b1a0cSSebastian Grimberg } 5111d102b48SJeremy L Thompson } 5121d102b48SJeremy L Thompson } 5131d102b48SJeremy L Thompson 5141d102b48SJeremy L Thompson // Un-set output Qvecs to prevent accidental overwrite of Assembled 515506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 516d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 517ad70ee2cSJeremy L Thompson CeedVector vec; 518ad70ee2cSJeremy L Thompson 5191d102b48SJeremy L Thompson // Get output vector 5202b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5211d102b48SJeremy L Thompson // Check if active output 522056ea4bdSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 5232b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 5241d102b48SJeremy L Thompson } 5251d102b48SJeremy L Thompson } 526506b1a0cSSebastian Grimberg } 5271d102b48SJeremy L Thompson 5281d102b48SJeremy L Thompson // Restore input arrays 5292b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 5301d102b48SJeremy L Thompson 5311d102b48SJeremy L Thompson // Restore output 532ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 533e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 5341d102b48SJeremy L Thompson } 5351d102b48SJeremy L Thompson 536f10650afSjeremylt //------------------------------------------------------------------------------ 53770a7ffb3SJeremy L Thompson // Assemble Linear QFunction 53870a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 5392b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunction_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 5402b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, true, assembled, rstr, request); 54170a7ffb3SJeremy L Thompson } 54270a7ffb3SJeremy L Thompson 54370a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 54470a7ffb3SJeremy L Thompson // Update Assembled Linear QFunction 54570a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 5462b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunctionUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, CeedRequest *request) { 5472b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, false, &assembled, &rstr, request); 54870a7ffb3SJeremy L Thompson } 54970a7ffb3SJeremy L Thompson 55070a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 551*48acf710SJeremy L Thompson // Setup Input/Output Fields 552*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 553*48acf710SJeremy L Thompson static int CeedOperatorSetupFieldsAtPoints_Ref(CeedQFunction qf, CeedOperator op, bool is_input, CeedVector *e_vecs_full, CeedVector *e_vecs, 554*48acf710SJeremy L Thompson CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, CeedInt Q) { 555*48acf710SJeremy L Thompson Ceed ceed; 556*48acf710SJeremy L Thompson CeedSize e_size, q_size; 557*48acf710SJeremy L Thompson CeedInt max_num_points, num_comp, size, P; 558*48acf710SJeremy L Thompson CeedQFunctionField *qf_fields; 559*48acf710SJeremy L Thompson CeedOperatorField *op_fields; 560*48acf710SJeremy L Thompson 561*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 562*48acf710SJeremy L Thompson if (is_input) { 563*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 564*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 565*48acf710SJeremy L Thompson } else { 566*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 567*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 568*48acf710SJeremy L Thompson } 569*48acf710SJeremy L Thompson 570*48acf710SJeremy L Thompson // Get max number of points 571*48acf710SJeremy L Thompson { 572*48acf710SJeremy L Thompson CeedInt dim; 573*48acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 574*48acf710SJeremy L Thompson CeedOperator_Ref *impl; 575*48acf710SJeremy L Thompson 576*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, NULL)); 577*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 578*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(rstr_points, &dim)); 579*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 580*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 581*48acf710SJeremy L Thompson if (is_input) CeedCallBackend(CeedVectorCreate(ceed, dim * max_num_points, &impl->point_coords_elem)); 582*48acf710SJeremy L Thompson } 583*48acf710SJeremy L Thompson 584*48acf710SJeremy L Thompson // Loop over fields 585*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 586*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 587*48acf710SJeremy L Thompson CeedBasis basis; 588*48acf710SJeremy L Thompson 589*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 590*48acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) { 591*48acf710SJeremy L Thompson CeedRestrictionType rstr_type; 592*48acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 593*48acf710SJeremy L Thompson 594*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 595*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp)); 596*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 597*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 598*48acf710SJeremy L Thompson } 599*48acf710SJeremy L Thompson 600*48acf710SJeremy L Thompson switch (eval_mode) { 601*48acf710SJeremy L Thompson case CEED_EVAL_NONE: 602*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 603*48acf710SJeremy L Thompson e_size = (CeedSize)max_num_points * size; 604*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 605*48acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 606*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 607*48acf710SJeremy L Thompson break; 608*48acf710SJeremy L Thompson case CEED_EVAL_INTERP: 609*48acf710SJeremy L Thompson case CEED_EVAL_GRAD: 610*48acf710SJeremy L Thompson case CEED_EVAL_DIV: 611*48acf710SJeremy L Thompson case CEED_EVAL_CURL: 612*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 613*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 614*48acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 615*48acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 616*48acf710SJeremy L Thompson e_size = (CeedSize)P * num_comp; 617*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 618*48acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 619*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 620*48acf710SJeremy L Thompson break; 621*48acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: // Only on input fields 622*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 623*48acf710SJeremy L Thompson q_size = (CeedSize)max_num_points; 624*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 625*48acf710SJeremy L Thompson CeedCallBackend( 626*48acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, max_num_points, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, CEED_VECTOR_NONE, q_vecs[i])); 627*48acf710SJeremy L Thompson break; 628*48acf710SJeremy L Thompson } 629*48acf710SJeremy L Thompson if (is_input && e_vecs[i]) { 630*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(e_vecs[i], CEED_MEM_HOST, CEED_COPY_VALUES, NULL)); 631*48acf710SJeremy L Thompson } 632*48acf710SJeremy L Thompson } 633*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 634*48acf710SJeremy L Thompson } 635*48acf710SJeremy L Thompson 636*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 637*48acf710SJeremy L Thompson // Setup Operator 638*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 639*48acf710SJeremy L Thompson static int CeedOperatorSetupAtPoints_Ref(CeedOperator op) { 640*48acf710SJeremy L Thompson bool is_setup_done; 641*48acf710SJeremy L Thompson Ceed ceed; 642*48acf710SJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 643*48acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 644*48acf710SJeremy L Thompson CeedQFunction qf; 645*48acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 646*48acf710SJeremy L Thompson CeedOperator_Ref *impl; 647*48acf710SJeremy L Thompson 648*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 649*48acf710SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 650*48acf710SJeremy L Thompson 651*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 652*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 653*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 654*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 655*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 656*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 657*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 658*48acf710SJeremy L Thompson 659*48acf710SJeremy L Thompson // Allocate 660*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 661*48acf710SJeremy L Thompson 662*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 663*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 664*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 665*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 666*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 667*48acf710SJeremy L Thompson 668*48acf710SJeremy L Thompson impl->num_inputs = num_input_fields; 669*48acf710SJeremy L Thompson impl->num_outputs = num_output_fields; 670*48acf710SJeremy L Thompson 671*48acf710SJeremy L Thompson // Set up infield and outfield pointer arrays 672*48acf710SJeremy L Thompson // Infields 673*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, true, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, num_input_fields, Q)); 674*48acf710SJeremy L Thompson // Outfields 675*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, false, impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, 676*48acf710SJeremy L Thompson num_output_fields, Q)); 677*48acf710SJeremy L Thompson 678*48acf710SJeremy L Thompson // Identity QFunctions 679*48acf710SJeremy L Thompson if (impl->is_identity_qf) { 680*48acf710SJeremy L Thompson CeedEvalMode in_mode, out_mode; 681*48acf710SJeremy L Thompson CeedQFunctionField *in_fields, *out_fields; 682*48acf710SJeremy L Thompson 683*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 684*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 685*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 686*48acf710SJeremy L Thompson 687*48acf710SJeremy L Thompson if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 688*48acf710SJeremy L Thompson impl->is_identity_rstr_op = true; 689*48acf710SJeremy L Thompson } else { 690*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 691*48acf710SJeremy L Thompson } 692*48acf710SJeremy L Thompson } 693*48acf710SJeremy L Thompson 694*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 695*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 696*48acf710SJeremy L Thompson } 697*48acf710SJeremy L Thompson 698*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 699*48acf710SJeremy L Thompson // Setup Input Fields 700*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 701*48acf710SJeremy L Thompson static inline int CeedOperatorSetupInputsAtPoints_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, 702*48acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedVector in_vec, CeedScalar *e_data[2 * CEED_FIELD_MAX], 703*48acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 704*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 705*48acf710SJeremy L Thompson uint64_t state; 706*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 707*48acf710SJeremy L Thompson CeedVector vec; 708*48acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 709*48acf710SJeremy L Thompson 710*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 711*48acf710SJeremy L Thompson if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 712*48acf710SJeremy L Thompson } else { 713*48acf710SJeremy L Thompson // Get input vector 714*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 715*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 716*48acf710SJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) { 717*48acf710SJeremy L Thompson // Restrict 718*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 719*48acf710SJeremy L Thompson if (state != impl->input_states[i]) { 720*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 721*48acf710SJeremy L Thompson impl->input_states[i] = state; 722*48acf710SJeremy L Thompson } 723*48acf710SJeremy L Thompson // Get evec 724*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data[i])); 725*48acf710SJeremy L Thompson } else { 726*48acf710SJeremy L Thompson // Set Qvec for CEED_EVAL_NONE 727*48acf710SJeremy L Thompson if (eval_mode == CEED_EVAL_NONE) { 728*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_in[i], CEED_MEM_HOST, (const CeedScalar **)&e_data[i])); 729*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, e_data[i])); 730*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_in[i], (const CeedScalar **)&e_data[i])); 731*48acf710SJeremy L Thompson } 732*48acf710SJeremy L Thompson } 733*48acf710SJeremy L Thompson } 734*48acf710SJeremy L Thompson } 735*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 736*48acf710SJeremy L Thompson } 737*48acf710SJeremy L Thompson 738*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 739*48acf710SJeremy L Thompson // Input Basis Action 740*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 741*48acf710SJeremy L Thompson static inline int CeedOperatorInputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_input_fields, 742*48acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedInt num_input_fields, CeedVector in_vec, 743*48acf710SJeremy L Thompson CeedVector point_coords_elem, bool skip_active, CeedScalar *e_data[2 * CEED_FIELD_MAX], 744*48acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 745*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 746*48acf710SJeremy L Thompson bool is_active_input = false; 747*48acf710SJeremy L Thompson CeedInt elem_size, size, num_comp; 748*48acf710SJeremy L Thompson CeedRestrictionType rstr_type; 749*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 750*48acf710SJeremy L Thompson CeedVector vec; 751*48acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 752*48acf710SJeremy L Thompson CeedBasis basis; 753*48acf710SJeremy L Thompson 754*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 755*48acf710SJeremy L Thompson // Skip active input 756*48acf710SJeremy L Thompson is_active_input = vec == CEED_VECTOR_ACTIVE; 757*48acf710SJeremy L Thompson if (skip_active && is_active_input) continue; 758*48acf710SJeremy L Thompson 759*48acf710SJeremy L Thompson // Get elem_size, eval_mode, size 760*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 761*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 762*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 763*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 764*48acf710SJeremy L Thompson // Restrict block active input 765*48acf710SJeremy L Thompson if (is_active_input) { 766*48acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 767*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 768*48acf710SJeremy L Thompson } else { 769*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 770*48acf710SJeremy L Thompson } 771*48acf710SJeremy L Thompson } 772*48acf710SJeremy L Thompson // Basis action 773*48acf710SJeremy L Thompson switch (eval_mode) { 774*48acf710SJeremy L Thompson case CEED_EVAL_NONE: 775*48acf710SJeremy L Thompson if (!is_active_input) { 776*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][num_points_offset * size])); 777*48acf710SJeremy L Thompson } 778*48acf710SJeremy L Thompson break; 779*48acf710SJeremy L Thompson // Note - these basis eval modes require FEM fields 780*48acf710SJeremy L Thompson case CEED_EVAL_INTERP: 781*48acf710SJeremy L Thompson case CEED_EVAL_GRAD: 782*48acf710SJeremy L Thompson case CEED_EVAL_DIV: 783*48acf710SJeremy L Thompson case CEED_EVAL_CURL: 784*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 785*48acf710SJeremy L Thompson if (!is_active_input) { 786*48acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 787*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 788*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][e * elem_size * num_comp])); 789*48acf710SJeremy L Thompson } 790*48acf710SJeremy L Thompson CeedCallBackend( 791*48acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, num_points, CEED_NOTRANSPOSE, eval_mode, point_coords_elem, impl->e_vecs_in[i], impl->q_vecs_in[i])); 792*48acf710SJeremy L Thompson break; 793*48acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: 794*48acf710SJeremy L Thompson break; // No action 795*48acf710SJeremy L Thompson } 796*48acf710SJeremy L Thompson } 797*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 798*48acf710SJeremy L Thompson } 799*48acf710SJeremy L Thompson 800*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 801*48acf710SJeremy L Thompson // Output Basis Action 802*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 803*48acf710SJeremy L Thompson static inline int CeedOperatorOutputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_output_fields, 804*48acf710SJeremy L Thompson CeedOperatorField *op_output_fields, CeedInt num_input_fields, CeedInt num_output_fields, 805*48acf710SJeremy L Thompson CeedOperator op, CeedVector out_vec, CeedVector point_coords_elem, CeedOperator_Ref *impl, 806*48acf710SJeremy L Thompson CeedRequest *request) { 807*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 808*48acf710SJeremy L Thompson CeedRestrictionType rstr_type; 809*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 810*48acf710SJeremy L Thompson CeedVector vec; 811*48acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 812*48acf710SJeremy L Thompson CeedBasis basis; 813*48acf710SJeremy L Thompson 814*48acf710SJeremy L Thompson // Get elem_size, eval_mode, size 815*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 816*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 817*48acf710SJeremy L Thompson // Basis action 818*48acf710SJeremy L Thompson switch (eval_mode) { 819*48acf710SJeremy L Thompson case CEED_EVAL_NONE: 820*48acf710SJeremy L Thompson break; // No action 821*48acf710SJeremy L Thompson case CEED_EVAL_INTERP: 822*48acf710SJeremy L Thompson case CEED_EVAL_GRAD: 823*48acf710SJeremy L Thompson case CEED_EVAL_DIV: 824*48acf710SJeremy L Thompson case CEED_EVAL_CURL: 825*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 826*48acf710SJeremy L Thompson CeedCallBackend( 827*48acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], impl->e_vecs_out[i])); 828*48acf710SJeremy L Thompson break; 829*48acf710SJeremy L Thompson // LCOV_EXCL_START 830*48acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: { 831*48acf710SJeremy L Thompson Ceed ceed; 832*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 833*48acf710SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 834*48acf710SJeremy L Thompson // LCOV_EXCL_STOP 835*48acf710SJeremy L Thompson } 836*48acf710SJeremy L Thompson } 837*48acf710SJeremy L Thompson // Restrict output block 838*48acf710SJeremy L Thompson // Get output vector 839*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 840*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 841*48acf710SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 842*48acf710SJeremy L Thompson // Restrict 843*48acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 844*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 845*48acf710SJeremy L Thompson } else { 846*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 847*48acf710SJeremy L Thompson } 848*48acf710SJeremy L Thompson } 849*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 850*48acf710SJeremy L Thompson } 851*48acf710SJeremy L Thompson 852*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 853*48acf710SJeremy L Thompson // Restore Input Vectors 854*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 855*48acf710SJeremy L Thompson static inline int CeedOperatorRestoreInputsAtPoints_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, 856*48acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedScalar *e_data[2 * CEED_FIELD_MAX], 857*48acf710SJeremy L Thompson CeedOperator_Ref *impl) { 858*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 859*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 860*48acf710SJeremy L Thompson CeedVector vec; 861*48acf710SJeremy L Thompson 862*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 863*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 864*48acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT && vec != CEED_VECTOR_ACTIVE) { 865*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data[i])); 866*48acf710SJeremy L Thompson } 867*48acf710SJeremy L Thompson } 868*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 869*48acf710SJeremy L Thompson } 870*48acf710SJeremy L Thompson 871*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 872*48acf710SJeremy L Thompson // Operator Apply 873*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 874*48acf710SJeremy L Thompson static int CeedOperatorApplyAddAtPoints_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 875*48acf710SJeremy L Thompson Ceed ceed; 876*48acf710SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem; 877*48acf710SJeremy L Thompson CeedEvalMode eval_mode; 878*48acf710SJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 879*48acf710SJeremy L Thompson CeedVector point_coords = NULL; 880*48acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 881*48acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 882*48acf710SJeremy L Thompson CeedQFunction qf; 883*48acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 884*48acf710SJeremy L Thompson CeedOperator_Ref *impl; 885*48acf710SJeremy L Thompson 886*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 887*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 888*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 889*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 890*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 891*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 892*48acf710SJeremy L Thompson 893*48acf710SJeremy L Thompson // Setup 894*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 895*48acf710SJeremy L Thompson 896*48acf710SJeremy L Thompson // Restriction only operator 897*48acf710SJeremy L Thompson if (impl->is_identity_rstr_op) { 898*48acf710SJeremy L Thompson // TODO: Fix this up 899*48acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 900*48acf710SJeremy L Thompson // CeedCallBackend(CeedElemRestrictionApplyBlock(impl->block_rstr[0], e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[0], request)); 901*48acf710SJeremy L Thompson // CeedCallBackend(CeedElemRestrictionApplyBlock(impl->block_rstr[1], e, CEED_TRANSPOSE, impl->e_vecs_in[0], out_vec, request)); 902*48acf710SJeremy L Thompson } 903*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 904*48acf710SJeremy L Thompson } 905*48acf710SJeremy L Thompson 906*48acf710SJeremy L Thompson // Point coordinates 907*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 908*48acf710SJeremy L Thompson 909*48acf710SJeremy L Thompson // Input Evecs and Restriction 910*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputsAtPoints_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, e_data, impl, request)); 911*48acf710SJeremy L Thompson 912*48acf710SJeremy L Thompson // Output Lvecs, Evecs, and Qvecs 913*48acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 914*48acf710SJeremy L Thompson // Set Qvec if needed 915*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 916*48acf710SJeremy L Thompson if (eval_mode == CEED_EVAL_NONE) { 917*48acf710SJeremy L Thompson // Set qvec to single block evec 918*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_out[i], CEED_MEM_HOST, &e_data[i + num_input_fields])); 919*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, e_data[i + num_input_fields])); 920*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[i], &e_data[i + num_input_fields])); 921*48acf710SJeremy L Thompson } 922*48acf710SJeremy L Thompson } 923*48acf710SJeremy L Thompson 924*48acf710SJeremy L Thompson // Loop through elements 925*48acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 926*48acf710SJeremy L Thompson CeedInt num_points; 927*48acf710SJeremy L Thompson 928*48acf710SJeremy L Thompson // Setup points for element 929*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 930*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 931*48acf710SJeremy L Thompson 932*48acf710SJeremy L Thompson // Input basis apply 933*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 934*48acf710SJeremy L Thompson impl->point_coords_elem, false, e_data, impl, request)); 935*48acf710SJeremy L Thompson 936*48acf710SJeremy L Thompson // Q function 937*48acf710SJeremy L Thompson if (!impl->is_identity_qf) { 938*48acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 939*48acf710SJeremy L Thompson } 940*48acf710SJeremy L Thompson 941*48acf710SJeremy L Thompson // Output basis apply and restriction 942*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 943*48acf710SJeremy L Thompson num_output_fields, op, out_vec, impl->point_coords_elem, impl, request)); 944*48acf710SJeremy L Thompson 945*48acf710SJeremy L Thompson num_points_offset += num_points; 946*48acf710SJeremy L Thompson } 947*48acf710SJeremy L Thompson 948*48acf710SJeremy L Thompson // Restore input arrays 949*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputsAtPoints_Ref(num_input_fields, qf_input_fields, op_input_fields, e_data, impl)); 950*48acf710SJeremy L Thompson 951*48acf710SJeremy L Thompson // Cleanup point coordinates 952*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 953*48acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 954*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 955*48acf710SJeremy L Thompson } 956*48acf710SJeremy L Thompson 957*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 958f10650afSjeremylt // Operator Destroy 959f10650afSjeremylt //------------------------------------------------------------------------------ 960f10650afSjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) { 961f10650afSjeremylt CeedOperator_Ref *impl; 962f10650afSjeremylt 963ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 9644fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs + impl->num_outputs; i++) { 9652b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_full[i])); 966f10650afSjeremylt } 9672b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_full)); 9682b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->input_states)); 969f10650afSjeremylt 9704fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs; i++) { 9712b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_in[i])); 9722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_in[i])); 973f10650afSjeremylt } 9742b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_in)); 9752b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_in)); 976f10650afSjeremylt 9774fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_outputs; i++) { 9782b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_out[i])); 9792b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_out[i])); 980f10650afSjeremylt } 9812b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_out)); 9822b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_out)); 983*48acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->point_coords_elem)); 984f10650afSjeremylt 985bb219a0fSJeremy L Thompson // QFunction assembly 9864fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_active_in; i++) { 9872b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->qf_active_in[i])); 988bb219a0fSJeremy L Thompson } 9892b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->qf_active_in)); 990bb219a0fSJeremy L Thompson 9912b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl)); 992e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 993f10650afSjeremylt } 994f10650afSjeremylt 995f10650afSjeremylt //------------------------------------------------------------------------------ 996713f43c3Sjeremylt // Operator Create 997f10650afSjeremylt //------------------------------------------------------------------------------ 99821617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) { 999fe2413ffSjeremylt Ceed ceed; 10004ce2993fSjeremylt CeedOperator_Ref *impl; 100121617c04Sjeremylt 1002ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 10032b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 10042b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 10052b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunction_Ref)); 10062b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionUpdate_Ref)); 10072b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAdd_Ref)); 10082b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1009e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 101021617c04Sjeremylt } 10112a86cc9dSSebastian Grimberg 10122a86cc9dSSebastian Grimberg //------------------------------------------------------------------------------ 1013*48acf710SJeremy L Thompson // Operator Create At Points 1014*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1015*48acf710SJeremy L Thompson int CeedOperatorCreateAtPoints_Ref(CeedOperator op) { 1016*48acf710SJeremy L Thompson Ceed ceed; 1017*48acf710SJeremy L Thompson CeedOperator_Ref *impl; 1018*48acf710SJeremy L Thompson 1019*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1020*48acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 1021*48acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 1022*48acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAddAtPoints_Ref)); 1023*48acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1024*48acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 1025*48acf710SJeremy L Thompson } 1026*48acf710SJeremy L Thompson 1027*48acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1028