15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 321617c04Sjeremylt // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 521617c04Sjeremylt // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 721617c04Sjeremylt 849aac155SJeremy L Thompson #include <ceed.h> 9ec3da8bcSJed Brown #include <ceed/backend.h> 103d576824SJeremy L Thompson #include <stdbool.h> 113d576824SJeremy L Thompson #include <stddef.h> 123d576824SJeremy L Thompson #include <stdint.h> 132b730f8bSJeremy L Thompson 1421617c04Sjeremylt #include "ceed-ref.h" 1521617c04Sjeremylt 16f10650afSjeremylt //------------------------------------------------------------------------------ 17f10650afSjeremylt // Setup Input/Output Fields 18f10650afSjeremylt //------------------------------------------------------------------------------ 19*f8a0df59SJeremy L Thompson static int CeedOperatorSetupFields_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, CeedInt *e_data_out_indices, 20*f8a0df59SJeremy L Thompson bool *apply_add_basis, CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, 21*f8a0df59SJeremy L Thompson CeedInt num_fields, CeedInt Q) { 22aedaa0e5Sjeremylt Ceed ceed; 236efa0d72SZach Atkins CeedSize e_size, q_size; 24ad70ee2cSJeremy L Thompson CeedInt num_comp, size, P; 25d1d35e2fSjeremylt CeedQFunctionField *qf_fields; 26ad70ee2cSJeremy L Thompson CeedOperatorField *op_fields; 27ad70ee2cSJeremy L Thompson 28e910d748SJeremy L Thompson { 29e910d748SJeremy L Thompson Ceed ceed_parent; 30e910d748SJeremy L Thompson 31ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 32e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 33e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 34e910d748SJeremy L Thompson } 354fc1f125SJeremy L Thompson if (is_input) { 362b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 372b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 384fc1f125SJeremy L Thompson } else { 392b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 402b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 41fe2413ffSjeremylt } 4221617c04Sjeremylt 43885ac19cSjeremylt // Loop over fields 44d1d35e2fSjeremylt for (CeedInt i = 0; i < num_fields; i++) { 45d1d35e2fSjeremylt CeedEvalMode eval_mode; 46edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 47ad70ee2cSJeremy L Thompson CeedBasis basis; 48d1d35e2fSjeremylt 49ad70ee2cSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 50d1d35e2fSjeremylt if (eval_mode != CEED_EVAL_WEIGHT) { 51edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 52edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 53135a076eSjeremylt } 54135a076eSjeremylt 55d1d35e2fSjeremylt switch (eval_mode) { 56885ac19cSjeremylt case CEED_EVAL_NONE: 572b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 58d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 592b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 60aedaa0e5Sjeremylt break; 61aedaa0e5Sjeremylt case CEED_EVAL_INTERP: 62885ac19cSjeremylt case CEED_EVAL_GRAD: 63a915a514Srezgarshakeri case CEED_EVAL_DIV: 64c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 652b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 662b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 672b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 682b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 69d2643443SJeremy L Thompson e_size = (CeedSize)P * num_comp; 702b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 71d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 73885ac19cSjeremylt break; 74885ac19cSjeremylt case CEED_EVAL_WEIGHT: // Only on input fields 752b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 76d2643443SJeremy L Thompson q_size = (CeedSize)Q; 772b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 782b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_vecs[i])); 79885ac19cSjeremylt break; 8021617c04Sjeremylt } 81885ac19cSjeremylt } 82*f8a0df59SJeremy L Thompson // Drop duplicate restrictions 833aab95c0SJeremy L Thompson if (is_input) { 843aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 853aab95c0SJeremy L Thompson CeedVector vec_i; 863aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 873aab95c0SJeremy L Thompson 883aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 893aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 903aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 913aab95c0SJeremy L Thompson CeedVector vec_j; 923aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 933aab95c0SJeremy L Thompson 943aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 953aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 963aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 973aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 98*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 993aab95c0SJeremy L Thompson skip_rstr[j] = true; 1003aab95c0SJeremy L Thompson } 1013aab95c0SJeremy L Thompson } 1023aab95c0SJeremy L Thompson } 103*f8a0df59SJeremy L Thompson } else { 104*f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 105*f8a0df59SJeremy L Thompson CeedVector vec_i; 106*f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 107*f8a0df59SJeremy L Thompson 108*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 109*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 110*f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 111*f8a0df59SJeremy L Thompson CeedVector vec_j; 112*f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 113*f8a0df59SJeremy L Thompson 114*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 115*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 116*f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 117*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 118*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 119*f8a0df59SJeremy L Thompson skip_rstr[j] = true; 120*f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 121*f8a0df59SJeremy L Thompson e_data_out_indices[j] = i; 122*f8a0df59SJeremy L Thompson } 123*f8a0df59SJeremy L Thompson } 124*f8a0df59SJeremy L Thompson } 1253aab95c0SJeremy L Thompson } 126e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 12721617c04Sjeremylt } 12821617c04Sjeremylt 129f10650afSjeremylt //------------------------------------------------------------------------------ 130f10650afSjeremylt // Setup Operator 131f10650afSjeremylt //------------------------------------------------------------------------------/* 132885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) { 1338c1105f8SJeremy L Thompson bool is_setup_done; 134ad70ee2cSJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 135ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 136ad70ee2cSJeremy L Thompson CeedQFunction qf; 137ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 138ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 139ad70ee2cSJeremy L Thompson 1402b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 1418c1105f8SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 142ad70ee2cSJeremy L Thompson 1432b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1442b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1452b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 1462b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 1472b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1482b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 149885ac19cSjeremylt 150885ac19cSjeremylt // Allocate 1512b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 152885ac19cSjeremylt 1533aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 154*f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 155*f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_data_out_indices)); 156*f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 1572b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 1582b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 1592b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 1602b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 1612b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 162885ac19cSjeremylt 1634fc1f125SJeremy L Thompson impl->num_inputs = num_input_fields; 1644fc1f125SJeremy L Thompson impl->num_outputs = num_output_fields; 165885ac19cSjeremylt 166d1d35e2fSjeremylt // Set up infield and outfield e_vecs and q_vecs 167885ac19cSjeremylt // Infields 168*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, true, impl->skip_rstr_in, NULL, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 169*f8a0df59SJeremy L Thompson num_input_fields, Q)); 1703aab95c0SJeremy L Thompson // Outfields 171*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, false, impl->skip_rstr_out, impl->e_data_out_indices, impl->apply_add_basis_out, 172*f8a0df59SJeremy L Thompson impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 173885ac19cSjeremylt 17416911fdaSjeremylt // Identity QFunctions 1750b454692Sjeremylt if (impl->is_identity_qf) { 176d1d35e2fSjeremylt CeedEvalMode in_mode, out_mode; 177d1d35e2fSjeremylt CeedQFunctionField *in_fields, *out_fields; 178ad70ee2cSJeremy L Thompson 1792b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 1802b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 1812b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 182d1d35e2fSjeremylt 1830b454692Sjeremylt if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 184edb2538eSJeremy L Thompson impl->is_identity_rstr_op = true; 1850b454692Sjeremylt } else { 186db002c03SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 18716911fdaSjeremylt } 18816911fdaSjeremylt } 18916911fdaSjeremylt 1902b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 191e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 192885ac19cSjeremylt } 193885ac19cSjeremylt 194f10650afSjeremylt //------------------------------------------------------------------------------ 195f10650afSjeremylt // Setup Operator Inputs 196f10650afSjeremylt //------------------------------------------------------------------------------ 1972b730f8bSJeremy L Thompson static inline int CeedOperatorSetupInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 1982b730f8bSJeremy L Thompson CeedVector in_vec, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 199a0162de9SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 200ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 201ad70ee2cSJeremy L Thompson uint64_t state; 202d1d35e2fSjeremylt CeedEvalMode eval_mode; 203d1bcdac9Sjeremylt CeedVector vec; 204edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 205885ac19cSjeremylt 206d1bcdac9Sjeremylt // Get input vector 2072b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 2081d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2092b730f8bSJeremy L Thompson if (skip_active) continue; 2102b730f8bSJeremy L Thompson else vec = in_vec; 2111d102b48SJeremy L Thompson } 2121d102b48SJeremy L Thompson 2132b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2141d102b48SJeremy L Thompson // Restrict and Evec 215d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 2161d102b48SJeremy L Thompson } else { 217668048e2SJed Brown // Restrict 2182b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 2198d713cf6Sjeremylt // Skip restriction if input is unchanged 2203aab95c0SJeremy L Thompson if ((state != impl->input_states[i] || vec == in_vec) && !impl->skip_rstr_in[i]) { 221edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 222edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 2238d713cf6Sjeremylt } 2243aab95c0SJeremy L Thompson impl->input_states[i] = state; 225668048e2SJed Brown // Get evec 2262b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data_full[i])); 227885ac19cSjeremylt } 228885ac19cSjeremylt } 229e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 230885ac19cSjeremylt } 231885ac19cSjeremylt 232f10650afSjeremylt //------------------------------------------------------------------------------ 233f10650afSjeremylt // Input Basis Action 234f10650afSjeremylt //------------------------------------------------------------------------------ 2352b730f8bSJeremy L Thompson static inline int CeedOperatorInputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2362b730f8bSJeremy L Thompson CeedInt num_input_fields, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 2372b730f8bSJeremy L Thompson CeedOperator_Ref *impl) { 238ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 239a915a514Srezgarshakeri CeedInt elem_size, size, num_comp; 240d1d35e2fSjeremylt CeedEvalMode eval_mode; 241edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2421d102b48SJeremy L Thompson CeedBasis basis; 2431d102b48SJeremy L Thompson 2441d102b48SJeremy L Thompson // Skip active input 245d1d35e2fSjeremylt if (skip_active) { 2461d102b48SJeremy L Thompson CeedVector vec; 247ad70ee2cSJeremy L Thompson 2482b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 2492b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 2501d102b48SJeremy L Thompson } 251d1d35e2fSjeremylt // Get elem_size, eval_mode, size 252edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 253edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2542b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2552b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 256885ac19cSjeremylt // Basis action 257d1d35e2fSjeremylt switch (eval_mode) { 258885ac19cSjeremylt case CEED_EVAL_NONE: 25981670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * Q * size])); 260885ac19cSjeremylt break; 261885ac19cSjeremylt case CEED_EVAL_INTERP: 262885ac19cSjeremylt case CEED_EVAL_GRAD: 263a915a514Srezgarshakeri case CEED_EVAL_DIV: 264c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 265a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 266a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 26781670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * elem_size * num_comp])); 268c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, eval_mode, impl->e_vecs_in[i], impl->q_vecs_in[i])); 269a915a514Srezgarshakeri break; 270885ac19cSjeremylt case CEED_EVAL_WEIGHT: 271885ac19cSjeremylt break; // No action 272885ac19cSjeremylt } 273885ac19cSjeremylt } 274e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 275885ac19cSjeremylt } 276885ac19cSjeremylt 277f10650afSjeremylt //------------------------------------------------------------------------------ 278f10650afSjeremylt // Output Basis Action 279f10650afSjeremylt //------------------------------------------------------------------------------ 2802b730f8bSJeremy L Thompson static inline int CeedOperatorOutputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_output_fields, CeedOperatorField *op_output_fields, 281*f8a0df59SJeremy L Thompson CeedInt num_input_fields, CeedInt num_output_fields, bool *apply_add_basis, CeedOperator op, 2824fc1f125SJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 283ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 284a915a514Srezgarshakeri CeedInt elem_size, num_comp; 285d1d35e2fSjeremylt CeedEvalMode eval_mode; 286edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2871d102b48SJeremy L Thompson CeedBasis basis; 2881d102b48SJeremy L Thompson 289a915a514Srezgarshakeri // Get elem_size, eval_mode 290edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 291edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2922b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 293885ac19cSjeremylt // Basis action 294d1d35e2fSjeremylt switch (eval_mode) { 295885ac19cSjeremylt case CEED_EVAL_NONE: 296885ac19cSjeremylt break; // No action 297885ac19cSjeremylt case CEED_EVAL_INTERP: 298885ac19cSjeremylt case CEED_EVAL_GRAD: 299a915a514Srezgarshakeri case CEED_EVAL_DIV: 300c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 301a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 302a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 30381670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, 30481670346SSebastian Grimberg &e_data_full[i + num_input_fields][(CeedSize)e * elem_size * num_comp])); 305*f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 306*f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAdd(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 307*f8a0df59SJeremy L Thompson } else { 308c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 309*f8a0df59SJeremy L Thompson } 310a915a514Srezgarshakeri break; 311c042f62fSJeremy L Thompson // LCOV_EXCL_START 312bbfacfcdSjeremylt case CEED_EVAL_WEIGHT: { 3136e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 3141d102b48SJeremy L Thompson // LCOV_EXCL_STOP 315885ac19cSjeremylt } 316885ac19cSjeremylt } 317885ac19cSjeremylt } 318e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3191d102b48SJeremy L Thompson } 3201d102b48SJeremy L Thompson 321f10650afSjeremylt //------------------------------------------------------------------------------ 322f10650afSjeremylt // Restore Input Vectors 323f10650afSjeremylt //------------------------------------------------------------------------------ 3242b730f8bSJeremy L Thompson static inline int CeedOperatorRestoreInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 3252b730f8bSJeremy L Thompson const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 326ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 327d1d35e2fSjeremylt CeedEvalMode eval_mode; 3281d102b48SJeremy L Thompson 3291d102b48SJeremy L Thompson // Skip active inputs 330d1d35e2fSjeremylt if (skip_active) { 3311d102b48SJeremy L Thompson CeedVector vec; 332ad70ee2cSJeremy L Thompson 3332b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 3342b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 3351d102b48SJeremy L Thompson } 3361d102b48SJeremy L Thompson // Restore input 3372b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 338d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 3391d102b48SJeremy L Thompson } else { 3402b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data_full[i])); 3411d102b48SJeremy L Thompson } 3421d102b48SJeremy L Thompson } 343e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3441d102b48SJeremy L Thompson } 3451d102b48SJeremy L Thompson 346f10650afSjeremylt //------------------------------------------------------------------------------ 347f10650afSjeremylt // Operator Apply 348f10650afSjeremylt //------------------------------------------------------------------------------ 3492b730f8bSJeremy L Thompson static int CeedOperatorApplyAdd_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 350d1d35e2fSjeremylt CeedInt Q, num_elem, num_input_fields, num_output_fields, size; 351ad70ee2cSJeremy L Thompson CeedEvalMode eval_mode; 352ad70ee2cSJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 353ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 354ad70ee2cSJeremy L Thompson CeedQFunction qf; 355ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 356ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 357ad70ee2cSJeremy L Thompson 358ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 359ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 3602b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 3612b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 3622b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 3632b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 3641d102b48SJeremy L Thompson 3651d102b48SJeremy L Thompson // Setup 3662b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 3671d102b48SJeremy L Thompson 3680b454692Sjeremylt // Restriction only operator 369edb2538eSJeremy L Thompson if (impl->is_identity_rstr_op) { 370edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 371ad70ee2cSJeremy L Thompson 372edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[0], &elem_rstr)); 373edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_full[0], request)); 374edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[0], &elem_rstr)); 375edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[0], out_vec, request)); 3760b454692Sjeremylt return CEED_ERROR_SUCCESS; 3770b454692Sjeremylt } 3780b454692Sjeremylt 3791d102b48SJeremy L Thompson // Input Evecs and Restriction 3802b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, false, e_data_full, impl, request)); 3811d102b48SJeremy L Thompson 3821d102b48SJeremy L Thompson // Output Evecs 383*f8a0df59SJeremy L Thompson for (CeedInt i = num_output_fields - 1; i >= 0; i--) { 384*f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) { 385*f8a0df59SJeremy L Thompson e_data_full[i + num_input_fields] = e_data_full[impl->e_data_out_indices[i] + num_input_fields]; 386*f8a0df59SJeremy L Thompson } else { 3872b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_full[i + impl->num_inputs], CEED_MEM_HOST, &e_data_full[i + num_input_fields])); 3881d102b48SJeremy L Thompson } 389*f8a0df59SJeremy L Thompson } 3901d102b48SJeremy L Thompson 3911d102b48SJeremy L Thompson // Loop through elements 392d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 3931d102b48SJeremy L Thompson // Output pointers 394d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 3952b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 396d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_NONE) { 3972b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 39881670346SSebastian Grimberg CeedCallBackend( 39981670346SSebastian Grimberg CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][(CeedSize)e * Q * size])); 4001d102b48SJeremy L Thompson } 4011d102b48SJeremy L Thompson } 4021d102b48SJeremy L Thompson 40316911fdaSjeremylt // Input basis apply 4042b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, false, e_data_full, impl)); 40516911fdaSjeremylt 4061d102b48SJeremy L Thompson // Q function 4070b454692Sjeremylt if (!impl->is_identity_qf) { 4082b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 40916911fdaSjeremylt } 4101d102b48SJeremy L Thompson 4111d102b48SJeremy L Thompson // Output basis apply 412*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasis_Ref(e, Q, qf_output_fields, op_output_fields, num_input_fields, num_output_fields, 413*f8a0df59SJeremy L Thompson impl->apply_add_basis_out, op, e_data_full, impl)); 4141d102b48SJeremy L Thompson } 415885ac19cSjeremylt 416885ac19cSjeremylt // Output restriction 417d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 418ad70ee2cSJeremy L Thompson CeedVector vec; 419edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 420ad70ee2cSJeremy L Thompson 421*f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) continue; 422d1d35e2fSjeremylt // Restore Evec 4232b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_full[i + impl->num_inputs], &e_data_full[i + num_input_fields])); 424d1bcdac9Sjeremylt // Get output vector 4252b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 426668048e2SJed Brown // Active 4272b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 4287ca8db16Sjeremylt // Restrict 429edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 430edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[i + impl->num_inputs], vec, request)); 431885ac19cSjeremylt } 432885ac19cSjeremylt 4337ca8db16Sjeremylt // Restore input arrays 4342b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, false, e_data_full, impl)); 435e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 43621617c04Sjeremylt } 43721617c04Sjeremylt 438f10650afSjeremylt //------------------------------------------------------------------------------ 43970a7ffb3SJeremy L Thompson // Core code for assembling linear QFunction 440f10650afSjeremylt //------------------------------------------------------------------------------ 4412b730f8bSJeremy L Thompson static inline int CeedOperatorLinearAssembleQFunctionCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, CeedElemRestriction *rstr, 44270a7ffb3SJeremy L Thompson CeedRequest *request) { 443e910d748SJeremy L Thompson Ceed ceed, ceed_parent; 444ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, Q, num_elem, num_input_fields, num_output_fields; 445ad70ee2cSJeremy L Thompson CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 446ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 447ad70ee2cSJeremy L Thompson CeedQFunction qf; 448ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 449ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 450ad70ee2cSJeremy L Thompson 4512b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 452e910d748SJeremy L Thompson CeedCallBackend(CeedOperatorGetFallbackParentCeed(op, &ceed_parent)); 453e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 454ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 455ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 456e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 457e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 458e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 459e984cf9aSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 460e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 4611d102b48SJeremy L Thompson 4621d102b48SJeremy L Thompson // Setup 4632b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 4641d102b48SJeremy L Thompson 465506b1a0cSSebastian Grimberg // Check for restriction only operator 466506b1a0cSSebastian Grimberg CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 46716911fdaSjeremylt 4681d102b48SJeremy L Thompson // Input Evecs and Restriction 4692b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 4701d102b48SJeremy L Thompson 4711d102b48SJeremy L Thompson // Count number of active input fields 472ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 473d1d35e2fSjeremylt for (CeedInt i = 0; i < num_input_fields; i++) { 474c7b67790SJeremy L Thompson CeedInt field_size; 475ad70ee2cSJeremy L Thompson CeedVector vec; 476ad70ee2cSJeremy L Thompson 4771d102b48SJeremy L Thompson // Get input vector 4782b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 4791d102b48SJeremy L Thompson // Check if active input 4801d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 481c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 4822b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 483ff8551c5SJeremy L Thompson qf_size_in += field_size; 4841d102b48SJeremy L Thompson } 4851d102b48SJeremy L Thompson } 486ff8551c5SJeremy L Thompson CeedCheck(qf_size_in > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 487ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 488bb219a0fSJeremy L Thompson } 4891d102b48SJeremy L Thompson 4901d102b48SJeremy L Thompson // Count number of active output fields 491ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 492d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 493c7b67790SJeremy L Thompson CeedInt field_size; 494ad70ee2cSJeremy L Thompson CeedVector vec; 495ad70ee2cSJeremy L Thompson 4961d102b48SJeremy L Thompson // Get output vector 4972b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 4981d102b48SJeremy L Thompson // Check if active output 4991d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 500c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 501ff8551c5SJeremy L Thompson qf_size_out += field_size; 5021d102b48SJeremy L Thompson } 5031d102b48SJeremy L Thompson } 504ff8551c5SJeremy L Thompson CeedCheck(qf_size_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 505ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 506bb219a0fSJeremy L Thompson } 5071d102b48SJeremy L Thompson 50870a7ffb3SJeremy L Thompson // Build objects if needed 50970a7ffb3SJeremy L Thompson if (build_objects) { 510ff8551c5SJeremy L Thompson const CeedSize l_size = (CeedSize)num_elem * Q * qf_size_in * qf_size_out; 511ff8551c5SJeremy L Thompson CeedInt strides[3] = {1, Q, qf_size_in * qf_size_out * Q}; /* *NOPAD* */ 512ad70ee2cSJeremy L Thompson 513ad70ee2cSJeremy L Thompson // Create output restriction 5140a5597ceSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, Q, qf_size_in * qf_size_out, 5150a5597ceSJeremy L Thompson (CeedSize)qf_size_in * (CeedSize)qf_size_out * (CeedSize)num_elem * (CeedSize)Q, strides, rstr)); 5161d102b48SJeremy L Thompson // Create assembled vector 517e910d748SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_parent, l_size, assembled)); 51870a7ffb3SJeremy L Thompson } 51970a7ffb3SJeremy L Thompson // Clear output vector 5202b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 521ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 5221d102b48SJeremy L Thompson 5231d102b48SJeremy L Thompson // Loop through elements 524d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 5251d102b48SJeremy L Thompson // Input basis apply 5262b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, true, e_data_full, impl)); 5271d102b48SJeremy L Thompson 5281d102b48SJeremy L Thompson // Assemble QFunction 529c7b67790SJeremy L Thompson 530c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 531c7b67790SJeremy L Thompson CeedInt field_size; 532c7b67790SJeremy L Thompson CeedVector vec; 533c7b67790SJeremy L Thompson 5341d102b48SJeremy L Thompson // Set Inputs 535c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 536c7b67790SJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) continue; 537c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 538c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 539c7b67790SJeremy L Thompson // Set current portion of input to 1.0 540c7b67790SJeremy L Thompson { 541c7b67790SJeremy L Thompson CeedScalar *array; 542c7b67790SJeremy L Thompson 543c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 544c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 1.0; 545c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 54642ea3801Sjeremylt } 547c7b67790SJeremy L Thompson 548506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 5491d102b48SJeremy L Thompson // Set Outputs 550d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 551ad70ee2cSJeremy L Thompson CeedVector vec; 552ad70ee2cSJeremy L Thompson 5531d102b48SJeremy L Thompson // Get output vector 5542b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5551d102b48SJeremy L Thompson // Check if active output 5561d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 557c7b67790SJeremy L Thompson CeedInt field_size; 558c7b67790SJeremy L Thompson 559ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 560c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 561c7b67790SJeremy L Thompson assembled_array += field_size * Q; // Advance the pointer by the size of the output 5621d102b48SJeremy L Thompson } 5631d102b48SJeremy L Thompson } 5641d102b48SJeremy L Thompson // Apply QFunction 5652b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 566506b1a0cSSebastian Grimberg } else { 567c7b67790SJeremy L Thompson CeedInt field_size; 568c7b67790SJeremy L Thompson const CeedScalar *array; 569506b1a0cSSebastian Grimberg 570506b1a0cSSebastian Grimberg // Copy Identity Outputs 571c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 572c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 573c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * Q; j++) assembled_array[j] = array[j]; 574c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 575c7b67790SJeremy L Thompson assembled_array += field_size * Q; 576c7b67790SJeremy L Thompson } 577c7b67790SJeremy L Thompson // Reset input to 0.0 578c7b67790SJeremy L Thompson { 579c7b67790SJeremy L Thompson CeedScalar *array; 580c7b67790SJeremy L Thompson 581c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 582c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 0.0; 583c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 584c7b67790SJeremy L Thompson } 585506b1a0cSSebastian Grimberg } 5861d102b48SJeremy L Thompson } 5871d102b48SJeremy L Thompson } 5881d102b48SJeremy L Thompson 5891d102b48SJeremy L Thompson // Un-set output Qvecs to prevent accidental overwrite of Assembled 590506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 591d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 592ad70ee2cSJeremy L Thompson CeedVector vec; 593ad70ee2cSJeremy L Thompson 5941d102b48SJeremy L Thompson // Get output vector 5952b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5961d102b48SJeremy L Thompson // Check if active output 597056ea4bdSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 5982b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 5991d102b48SJeremy L Thompson } 6001d102b48SJeremy L Thompson } 601506b1a0cSSebastian Grimberg } 6021d102b48SJeremy L Thompson 6031d102b48SJeremy L Thompson // Restore input arrays 6042b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 6051d102b48SJeremy L Thompson 6061d102b48SJeremy L Thompson // Restore output 607ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 608e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 6091d102b48SJeremy L Thompson } 6101d102b48SJeremy L Thompson 611f10650afSjeremylt //------------------------------------------------------------------------------ 61270a7ffb3SJeremy L Thompson // Assemble Linear QFunction 61370a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6142b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunction_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 6152b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, true, assembled, rstr, request); 61670a7ffb3SJeremy L Thompson } 61770a7ffb3SJeremy L Thompson 61870a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 61970a7ffb3SJeremy L Thompson // Update Assembled Linear QFunction 62070a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6212b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunctionUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, CeedRequest *request) { 6222b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, false, &assembled, &rstr, request); 62370a7ffb3SJeremy L Thompson } 62470a7ffb3SJeremy L Thompson 62570a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 62648acf710SJeremy L Thompson // Setup Input/Output Fields 62748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 628*f8a0df59SJeremy L Thompson static int CeedOperatorSetupFieldsAtPoints_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, bool *apply_add_basis, 629*f8a0df59SJeremy L Thompson CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, 630*f8a0df59SJeremy L Thompson CeedInt Q) { 63148acf710SJeremy L Thompson Ceed ceed; 63248acf710SJeremy L Thompson CeedSize e_size, q_size; 633ff1bc20eSJeremy L Thompson CeedInt max_num_points, num_comp, size, P; 63448acf710SJeremy L Thompson CeedQFunctionField *qf_fields; 63548acf710SJeremy L Thompson CeedOperatorField *op_fields; 63648acf710SJeremy L Thompson 637e910d748SJeremy L Thompson { 638e910d748SJeremy L Thompson Ceed ceed_parent; 639e910d748SJeremy L Thompson 64048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 641e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 642e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 643e910d748SJeremy L Thompson } 64448acf710SJeremy L Thompson if (is_input) { 64548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 64648acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 64748acf710SJeremy L Thompson } else { 64848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 64948acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 65048acf710SJeremy L Thompson } 65148acf710SJeremy L Thompson 65248acf710SJeremy L Thompson // Get max number of points 65348acf710SJeremy L Thompson { 65448acf710SJeremy L Thompson CeedInt dim; 65548acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 65648acf710SJeremy L Thompson CeedOperator_Ref *impl; 65748acf710SJeremy L Thompson 65848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, NULL)); 65948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 66048acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(rstr_points, &dim)); 66148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 66248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 663b37f8825SJeremy L Thompson if (is_input) { 664b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, dim * max_num_points, &impl->point_coords_elem)); 665b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->point_coords_elem, 0.0)); 666b37f8825SJeremy L Thompson } 66748acf710SJeremy L Thompson } 66848acf710SJeremy L Thompson 66948acf710SJeremy L Thompson // Loop over fields 67048acf710SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 67148acf710SJeremy L Thompson CeedEvalMode eval_mode; 67248acf710SJeremy L Thompson CeedBasis basis; 67348acf710SJeremy L Thompson 67448acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 67548acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) { 67648acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 67748acf710SJeremy L Thompson 67848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 67948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 680ff1bc20eSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(e_vecs_full[i + start_e], 0.0)); 6816efa0d72SZach Atkins } 68248acf710SJeremy L Thompson 68348acf710SJeremy L Thompson switch (eval_mode) { 68438e83183SJeremy L Thompson case CEED_EVAL_NONE: { 68538e83183SJeremy L Thompson CeedVector vec; 68638e83183SJeremy L Thompson 68748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 68848acf710SJeremy L Thompson e_size = (CeedSize)max_num_points * size; 68948acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 69038e83183SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec)); 69138e83183SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE || !is_input) { 69238e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &q_vecs[i])); 69338e83183SJeremy L Thompson } else { 69448acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 69548acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 69638e83183SJeremy L Thompson } 69748acf710SJeremy L Thompson break; 69838e83183SJeremy L Thompson } 69948acf710SJeremy L Thompson case CEED_EVAL_INTERP: 70048acf710SJeremy L Thompson case CEED_EVAL_GRAD: 70148acf710SJeremy L Thompson case CEED_EVAL_DIV: 70248acf710SJeremy L Thompson case CEED_EVAL_CURL: 70348acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 70448acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 70548acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 70648acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 70748acf710SJeremy L Thompson e_size = (CeedSize)P * num_comp; 70848acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 70948acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 71048acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 71148acf710SJeremy L Thompson break; 71248acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: // Only on input fields 71348acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 71448acf710SJeremy L Thompson q_size = (CeedSize)max_num_points; 71548acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 71648acf710SJeremy L Thompson CeedCallBackend( 717fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &max_num_points, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, CEED_VECTOR_NONE, q_vecs[i])); 71848acf710SJeremy L Thompson break; 71948acf710SJeremy L Thompson } 720ecc797dfSJeremy L Thompson // Initialize full arrays for E-vectors and Q-vectors 721297a0f46SJeremy L Thompson if (e_vecs[i]) CeedCallBackend(CeedVectorSetValue(e_vecs[i], 0.0)); 722297a0f46SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) CeedCallBackend(CeedVectorSetValue(q_vecs[i], 0.0)); 72348acf710SJeremy L Thompson } 724*f8a0df59SJeremy L Thompson // Drop duplicate restrictions 7253aab95c0SJeremy L Thompson if (is_input) { 7263aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 7273aab95c0SJeremy L Thompson CeedVector vec_i; 7283aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 7293aab95c0SJeremy L Thompson 7303aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 7313aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 7323aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 7333aab95c0SJeremy L Thompson CeedVector vec_j; 7343aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 7353aab95c0SJeremy L Thompson 7363aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 7373aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 7383aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 7393aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 740*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 7413aab95c0SJeremy L Thompson skip_rstr[j] = true; 7423aab95c0SJeremy L Thompson } 7433aab95c0SJeremy L Thompson } 7443aab95c0SJeremy L Thompson } 745*f8a0df59SJeremy L Thompson } else { 746*f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 747*f8a0df59SJeremy L Thompson CeedVector vec_i; 748*f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 749*f8a0df59SJeremy L Thompson 750*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 751*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 752*f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 753*f8a0df59SJeremy L Thompson CeedVector vec_j; 754*f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 755*f8a0df59SJeremy L Thompson 756*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 757*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 758*f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 759*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 760*f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 761*f8a0df59SJeremy L Thompson skip_rstr[j] = true; 762*f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 763*f8a0df59SJeremy L Thompson } 764*f8a0df59SJeremy L Thompson } 765*f8a0df59SJeremy L Thompson } 7663aab95c0SJeremy L Thompson } 76748acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 76848acf710SJeremy L Thompson } 76948acf710SJeremy L Thompson 77048acf710SJeremy L Thompson //------------------------------------------------------------------------------ 77148acf710SJeremy L Thompson // Setup Operator 77248acf710SJeremy L Thompson //------------------------------------------------------------------------------ 77348acf710SJeremy L Thompson static int CeedOperatorSetupAtPoints_Ref(CeedOperator op) { 77448acf710SJeremy L Thompson bool is_setup_done; 77548acf710SJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 77648acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 77748acf710SJeremy L Thompson CeedQFunction qf; 77848acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 77948acf710SJeremy L Thompson CeedOperator_Ref *impl; 78048acf710SJeremy L Thompson 78148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 78248acf710SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 78348acf710SJeremy L Thompson 78448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 78548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 78648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 78748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 78848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 78948acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 79048acf710SJeremy L Thompson 79148acf710SJeremy L Thompson // Allocate 79248acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 79348acf710SJeremy L Thompson 7943aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 795*f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 796*f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 79748acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 79848acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 79948acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 80048acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 80148acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 80248acf710SJeremy L Thompson 80348acf710SJeremy L Thompson impl->num_inputs = num_input_fields; 80448acf710SJeremy L Thompson impl->num_outputs = num_output_fields; 80548acf710SJeremy L Thompson 80648acf710SJeremy L Thompson // Set up infield and outfield pointer arrays 80748acf710SJeremy L Thompson // Infields 808*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, true, impl->skip_rstr_in, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 8093aab95c0SJeremy L Thompson num_input_fields, Q)); 81048acf710SJeremy L Thompson // Outfields 811*f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, false, impl->skip_rstr_out, impl->apply_add_basis_out, impl->e_vecs_full, 812*f8a0df59SJeremy L Thompson impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 81348acf710SJeremy L Thompson 81448acf710SJeremy L Thompson // Identity QFunctions 81548acf710SJeremy L Thompson if (impl->is_identity_qf) { 81648acf710SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 81738e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->e_vecs_out[0])); 81848acf710SJeremy L Thompson } 81948acf710SJeremy L Thompson 82048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 82148acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 82248acf710SJeremy L Thompson } 82348acf710SJeremy L Thompson 82448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82548acf710SJeremy L Thompson // Input Basis Action 82648acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82748acf710SJeremy L Thompson static inline int CeedOperatorInputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_input_fields, 82848acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedInt num_input_fields, CeedVector in_vec, 82948acf710SJeremy L Thompson CeedVector point_coords_elem, bool skip_active, CeedScalar *e_data[2 * CEED_FIELD_MAX], 83048acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 83148acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 83248acf710SJeremy L Thompson bool is_active_input = false; 83348acf710SJeremy L Thompson CeedInt elem_size, size, num_comp; 83448acf710SJeremy L Thompson CeedRestrictionType rstr_type; 83548acf710SJeremy L Thompson CeedEvalMode eval_mode; 83648acf710SJeremy L Thompson CeedVector vec; 83748acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 83848acf710SJeremy L Thompson CeedBasis basis; 83948acf710SJeremy L Thompson 84048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 84148acf710SJeremy L Thompson // Skip active input 84248acf710SJeremy L Thompson is_active_input = vec == CEED_VECTOR_ACTIVE; 84348acf710SJeremy L Thompson if (skip_active && is_active_input) continue; 84448acf710SJeremy L Thompson 84548acf710SJeremy L Thompson // Get elem_size, eval_mode, size 84648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 84748acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 84848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 84948acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 85048acf710SJeremy L Thompson // Restrict block active input 8513aab95c0SJeremy L Thompson if (is_active_input && !impl->skip_rstr_in[i]) { 85248acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 85348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 85448acf710SJeremy L Thompson } else { 85548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 85648acf710SJeremy L Thompson } 85748acf710SJeremy L Thompson } 85848acf710SJeremy L Thompson // Basis action 85948acf710SJeremy L Thompson switch (eval_mode) { 86048acf710SJeremy L Thompson case CEED_EVAL_NONE: 86148acf710SJeremy L Thompson if (!is_active_input) { 86248acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][num_points_offset * size])); 86348acf710SJeremy L Thompson } 86448acf710SJeremy L Thompson break; 86548acf710SJeremy L Thompson // Note - these basis eval modes require FEM fields 86648acf710SJeremy L Thompson case CEED_EVAL_INTERP: 86748acf710SJeremy L Thompson case CEED_EVAL_GRAD: 86848acf710SJeremy L Thompson case CEED_EVAL_DIV: 86948acf710SJeremy L Thompson case CEED_EVAL_CURL: 87048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 87148acf710SJeremy L Thompson if (!is_active_input) { 87248acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 87348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 87481670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][(CeedSize)e * elem_size * num_comp])); 87548acf710SJeremy L Thompson } 87648acf710SJeremy L Thompson CeedCallBackend( 877fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, point_coords_elem, impl->e_vecs_in[i], impl->q_vecs_in[i])); 87848acf710SJeremy L Thompson break; 87948acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: 88048acf710SJeremy L Thompson break; // No action 88148acf710SJeremy L Thompson } 88248acf710SJeremy L Thompson } 88348acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 88448acf710SJeremy L Thompson } 88548acf710SJeremy L Thompson 88648acf710SJeremy L Thompson //------------------------------------------------------------------------------ 88748acf710SJeremy L Thompson // Output Basis Action 88848acf710SJeremy L Thompson //------------------------------------------------------------------------------ 88948acf710SJeremy L Thompson static inline int CeedOperatorOutputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_output_fields, 89048acf710SJeremy L Thompson CeedOperatorField *op_output_fields, CeedInt num_input_fields, CeedInt num_output_fields, 891*f8a0df59SJeremy L Thompson bool *apply_add_basis, bool *skip_rstr, CeedOperator op, CeedVector out_vec, 892*f8a0df59SJeremy L Thompson CeedVector point_coords_elem, CeedOperator_Ref *impl, CeedRequest *request) { 89348acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 89448acf710SJeremy L Thompson CeedRestrictionType rstr_type; 89548acf710SJeremy L Thompson CeedEvalMode eval_mode; 89648acf710SJeremy L Thompson CeedVector vec; 89748acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 89848acf710SJeremy L Thompson CeedBasis basis; 89948acf710SJeremy L Thompson 90048acf710SJeremy L Thompson // Get elem_size, eval_mode, size 90148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 90248acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 90348acf710SJeremy L Thompson // Basis action 90448acf710SJeremy L Thompson switch (eval_mode) { 90548acf710SJeremy L Thompson case CEED_EVAL_NONE: 90648acf710SJeremy L Thompson break; // No action 90748acf710SJeremy L Thompson case CEED_EVAL_INTERP: 90848acf710SJeremy L Thompson case CEED_EVAL_GRAD: 90948acf710SJeremy L Thompson case CEED_EVAL_DIV: 91048acf710SJeremy L Thompson case CEED_EVAL_CURL: 91148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 912*f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 913*f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAddAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], 914*f8a0df59SJeremy L Thompson impl->e_vecs_out[i])); 915*f8a0df59SJeremy L Thompson } else { 91648acf710SJeremy L Thompson CeedCallBackend( 917fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], impl->e_vecs_out[i])); 918*f8a0df59SJeremy L Thompson } 91948acf710SJeremy L Thompson break; 92048acf710SJeremy L Thompson // LCOV_EXCL_START 92148acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: { 9226e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 92348acf710SJeremy L Thompson // LCOV_EXCL_STOP 92448acf710SJeremy L Thompson } 92548acf710SJeremy L Thompson } 92648acf710SJeremy L Thompson // Restrict output block 927*f8a0df59SJeremy L Thompson if (skip_rstr[i]) continue; 92848acf710SJeremy L Thompson // Get output vector 92948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 93048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 93148acf710SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 93248acf710SJeremy L Thompson // Restrict 93348acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 93448acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 93548acf710SJeremy L Thompson } else { 93648acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 93748acf710SJeremy L Thompson } 93848acf710SJeremy L Thompson } 93948acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 94048acf710SJeremy L Thompson } 94148acf710SJeremy L Thompson 94248acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94348acf710SJeremy L Thompson // Operator Apply 94448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94548acf710SJeremy L Thompson static int CeedOperatorApplyAddAtPoints_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 94648acf710SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem; 94748acf710SJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 94848acf710SJeremy L Thompson CeedVector point_coords = NULL; 94948acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 95048acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 95148acf710SJeremy L Thompson CeedQFunction qf; 95248acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 95348acf710SJeremy L Thompson CeedOperator_Ref *impl; 95448acf710SJeremy L Thompson 95548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 95648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 95748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 95848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 95948acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 96048acf710SJeremy L Thompson 96148acf710SJeremy L Thompson // Setup 96248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 96348acf710SJeremy L Thompson 96448acf710SJeremy L Thompson // Point coordinates 96548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 96648acf710SJeremy L Thompson 96748acf710SJeremy L Thompson // Input Evecs and Restriction 9686cde1da6SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 96948acf710SJeremy L Thompson 97048acf710SJeremy L Thompson // Loop through elements 97148acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 97248acf710SJeremy L Thompson CeedInt num_points; 97348acf710SJeremy L Thompson 97448acf710SJeremy L Thompson // Setup points for element 97548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 97648acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 97748acf710SJeremy L Thompson 97848acf710SJeremy L Thompson // Input basis apply 97948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 98048acf710SJeremy L Thompson impl->point_coords_elem, false, e_data, impl, request)); 98148acf710SJeremy L Thompson 98248acf710SJeremy L Thompson // Q function 98348acf710SJeremy L Thompson if (!impl->is_identity_qf) { 98448acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 98548acf710SJeremy L Thompson } 98648acf710SJeremy L Thompson 98748acf710SJeremy L Thompson // Output basis apply and restriction 98848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 989*f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 990*f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 99148acf710SJeremy L Thompson 99248acf710SJeremy L Thompson num_points_offset += num_points; 99348acf710SJeremy L Thompson } 99448acf710SJeremy L Thompson 99548acf710SJeremy L Thompson // Restore input arrays 9966cde1da6SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 99748acf710SJeremy L Thompson 99848acf710SJeremy L Thompson // Cleanup point coordinates 99948acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 100048acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 100148acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 100248acf710SJeremy L Thompson } 100348acf710SJeremy L Thompson 100448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1005e13f2367SZach Atkins // Core code for assembling linear QFunction 1006e13f2367SZach Atkins //------------------------------------------------------------------------------ 1007e13f2367SZach Atkins static inline int CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, 1008e13f2367SZach Atkins CeedElemRestriction *rstr, CeedRequest *request) { 1009e13f2367SZach Atkins Ceed ceed; 1010ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, max_num_points, num_elem, num_input_fields, num_output_fields, num_points_offset = 0; 1011e13f2367SZach Atkins CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 1012c7b67790SJeremy L Thompson CeedVector point_coords = NULL; 1013e13f2367SZach Atkins CeedQFunctionField *qf_input_fields, *qf_output_fields; 1014e13f2367SZach Atkins CeedQFunction qf; 1015e13f2367SZach Atkins CeedOperatorField *op_input_fields, *op_output_fields; 1016e13f2367SZach Atkins CeedOperator_Ref *impl; 1017e13f2367SZach Atkins CeedElemRestriction rstr_points = NULL; 1018e13f2367SZach Atkins 1019e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1020e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetData(op, &impl)); 1021ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 1022ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 1023e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1024e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1025e13f2367SZach Atkins CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1026e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1027e13f2367SZach Atkins 1028e13f2367SZach Atkins // Setup 1029e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1030e13f2367SZach Atkins 1031e13f2367SZach Atkins // Check for restriction only operator 1032e13f2367SZach Atkins CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 1033e13f2367SZach Atkins 1034e13f2367SZach Atkins // Point coordinates 1035e13f2367SZach Atkins CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1036e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 1037e13f2367SZach Atkins 1038e13f2367SZach Atkins // Input Evecs and Restriction 1039e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 1040e13f2367SZach Atkins 1041e13f2367SZach Atkins // Count number of active input fields 1042ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 1043e13f2367SZach Atkins for (CeedInt i = 0; i < num_input_fields; i++) { 1044e13f2367SZach Atkins CeedInt field_size; 1045e13f2367SZach Atkins CeedVector vec; 1046e13f2367SZach Atkins 1047e13f2367SZach Atkins // Get input vector 1048e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1049e13f2367SZach Atkins // Check if active input 1050e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1051e13f2367SZach Atkins // Check that all active inputs are nodal fields 1052e13f2367SZach Atkins { 1053e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1054e13f2367SZach Atkins bool is_at_points = false; 1055e13f2367SZach Atkins 1056e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1057637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1058e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1059e13f2367SZach Atkins } 1060e13f2367SZach Atkins // Get size of active input 1061e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1062ff8551c5SJeremy L Thompson qf_size_in += field_size; 1063e13f2367SZach Atkins } 1064e13f2367SZach Atkins } 1065ff8551c5SJeremy L Thompson CeedCheck(qf_size_in, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1066ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 1067e13f2367SZach Atkins } 1068e13f2367SZach Atkins 1069e13f2367SZach Atkins // Count number of active output fields 1070ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 1071e13f2367SZach Atkins for (CeedInt i = 0; i < num_output_fields; i++) { 1072e13f2367SZach Atkins CeedInt field_size; 1073c7b67790SJeremy L Thompson CeedVector vec; 1074e13f2367SZach Atkins 1075e13f2367SZach Atkins // Get output vector 1076e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 1077e13f2367SZach Atkins // Check if active output 1078e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1079e13f2367SZach Atkins // Check that all active inputs are nodal fields 1080e13f2367SZach Atkins { 1081e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1082e13f2367SZach Atkins bool is_at_points = false; 1083e13f2367SZach Atkins 1084e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 1085637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1086e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1087e13f2367SZach Atkins } 1088e13f2367SZach Atkins // Get size of active output 1089e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 1090c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1091ff8551c5SJeremy L Thompson qf_size_out += field_size; 1092e13f2367SZach Atkins } 1093e13f2367SZach Atkins } 1094ff8551c5SJeremy L Thompson CeedCheck(qf_size_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1095ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 1096e13f2367SZach Atkins } 1097e13f2367SZach Atkins 1098e13f2367SZach Atkins // Build objects if needed 1099e13f2367SZach Atkins if (build_objects) { 1100e13f2367SZach Atkins CeedInt num_points_total; 1101e13f2367SZach Atkins const CeedInt *offsets; 1102e13f2367SZach Atkins 1103e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPoints(rstr_points, &num_points_total)); 1104e13f2367SZach Atkins 1105e13f2367SZach Atkins // Create output restriction (at points) 1106e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetOffsets(rstr_points, CEED_MEM_HOST, &offsets)); 1107ff8551c5SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateAtPoints(ceed, num_elem, num_points_total, qf_size_in * qf_size_out, 1108ff8551c5SJeremy L Thompson qf_size_in * qf_size_out * num_points_total, CEED_MEM_HOST, CEED_COPY_VALUES, offsets, rstr)); 1109e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionRestoreOffsets(rstr_points, &offsets)); 1110e13f2367SZach Atkins 1111e13f2367SZach Atkins // Create assembled vector 1112e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionCreateVector(*rstr, assembled, NULL)); 1113e13f2367SZach Atkins } 1114e13f2367SZach Atkins // Clear output vector 1115e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 1116e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 1117e13f2367SZach Atkins 1118e13f2367SZach Atkins // Loop through elements 1119e13f2367SZach Atkins for (CeedInt e = 0; e < num_elem; e++) { 1120e13f2367SZach Atkins CeedInt num_points; 1121e13f2367SZach Atkins 1122e13f2367SZach Atkins // Setup points for element 1123e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1124e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1125e13f2367SZach Atkins 1126e13f2367SZach Atkins // Input basis apply 1127e13f2367SZach Atkins CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, NULL, 1128e13f2367SZach Atkins impl->point_coords_elem, true, e_data_full, impl, request)); 1129e13f2367SZach Atkins 1130e13f2367SZach Atkins // Assemble QFunction 1131c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1132c7b67790SJeremy L Thompson CeedInt field_size; 1133c7b67790SJeremy L Thompson CeedVector vec; 1134c7b67790SJeremy L Thompson 1135c7b67790SJeremy L Thompson // Get input vector 1136c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1137c7b67790SJeremy L Thompson // Check if active input 1138c7b67790SJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) continue; 1139c7b67790SJeremy L Thompson // Get size of active input 1140c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1141c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 1142c7b67790SJeremy L Thompson // Set current portion of input to 1.0 1143c7b67790SJeremy L Thompson { 1144c7b67790SJeremy L Thompson CeedScalar *array; 1145c7b67790SJeremy L Thompson 1146c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1147c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 1.0; 1148c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1149e13f2367SZach Atkins } 1150c7b67790SJeremy L Thompson 1151e13f2367SZach Atkins if (!impl->is_identity_qf) { 1152e13f2367SZach Atkins // Set Outputs 1153e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1154e13f2367SZach Atkins CeedVector vec; 1155e13f2367SZach Atkins CeedInt field_size; 1156e13f2367SZach Atkins 1157e13f2367SZach Atkins // Get output vector 1158e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1159e13f2367SZach Atkins // Check if active output 1160e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1161e13f2367SZach Atkins CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 1162e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 1163e13f2367SZach Atkins assembled_array += field_size * num_points; // Advance the pointer by the size of the output 1164e13f2367SZach Atkins } 1165e13f2367SZach Atkins } 1166e13f2367SZach Atkins // Apply QFunction 1167e13f2367SZach Atkins CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1168e13f2367SZach Atkins } else { 1169c7b67790SJeremy L Thompson const CeedScalar *array; 1170e13f2367SZach Atkins CeedInt field_size; 1171e13f2367SZach Atkins 1172e13f2367SZach Atkins // Copy Identity Outputs 1173e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 1174c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 1175c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * num_points; j++) assembled_array[j] = array[j]; 1176c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 1177e13f2367SZach Atkins assembled_array += field_size * num_points; 1178e13f2367SZach Atkins } 1179c7b67790SJeremy L Thompson // Reset input to 0.0 1180c7b67790SJeremy L Thompson { 1181c7b67790SJeremy L Thompson CeedScalar *array; 1182c7b67790SJeremy L Thompson 1183c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1184c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 0.0; 1185c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1186c7b67790SJeremy L Thompson } 1187c7b67790SJeremy L Thompson } 1188e13f2367SZach Atkins } 1189e13f2367SZach Atkins num_points_offset += num_points; 1190e13f2367SZach Atkins } 1191e13f2367SZach Atkins 1192e13f2367SZach Atkins // Un-set output Qvecs to prevent accidental overwrite of Assembled 1193e13f2367SZach Atkins if (!impl->is_identity_qf) { 1194e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1195e13f2367SZach Atkins CeedVector vec; 1196e13f2367SZach Atkins 1197e13f2367SZach Atkins // Get output vector 1198e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1199e13f2367SZach Atkins // Check if active output 1200e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 1201e13f2367SZach Atkins CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 1202e13f2367SZach Atkins } 1203e13f2367SZach Atkins } 1204e13f2367SZach Atkins } 1205e13f2367SZach Atkins 1206e13f2367SZach Atkins // Restore input arrays 1207e13f2367SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 1208e13f2367SZach Atkins 1209e13f2367SZach Atkins // Restore output 1210e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 1211e13f2367SZach Atkins 1212e13f2367SZach Atkins // Cleanup 1213e13f2367SZach Atkins CeedCallBackend(CeedVectorDestroy(&point_coords)); 1214e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1215e13f2367SZach Atkins return CEED_ERROR_SUCCESS; 1216e13f2367SZach Atkins } 1217e13f2367SZach Atkins 1218e13f2367SZach Atkins //------------------------------------------------------------------------------ 1219e13f2367SZach Atkins // Assemble Linear QFunction 1220e13f2367SZach Atkins //------------------------------------------------------------------------------ 1221e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPoints_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1222e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, true, assembled, rstr, request); 1223e13f2367SZach Atkins } 1224e13f2367SZach Atkins 1225e13f2367SZach Atkins //------------------------------------------------------------------------------ 1226e13f2367SZach Atkins // Update Assembled Linear QFunction 1227e13f2367SZach Atkins //------------------------------------------------------------------------------ 1228e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, 1229e13f2367SZach Atkins CeedRequest *request) { 1230e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, false, &assembled, &rstr, request); 1231e13f2367SZach Atkins } 1232e13f2367SZach Atkins 1233e13f2367SZach Atkins //------------------------------------------------------------------------------ 1234fb133d4bSJeremy L Thompson // Assemble Operator Diagonal AtPoints 1235e13f2367SZach Atkins //------------------------------------------------------------------------------ 1236fb133d4bSJeremy L Thompson static int CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1237382e9c83SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem, num_comp_active = 1; 1238fb133d4bSJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 1239fb133d4bSJeremy L Thompson Ceed ceed; 1240fb133d4bSJeremy L Thompson CeedVector point_coords = NULL, in_vec, out_vec; 1241fb133d4bSJeremy L Thompson CeedElemRestriction rstr_points = NULL; 1242fb133d4bSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 1243fb133d4bSJeremy L Thompson CeedQFunction qf; 1244fb133d4bSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 1245fb133d4bSJeremy L Thompson CeedOperator_Ref *impl; 1246fb133d4bSJeremy L Thompson 1247fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1248fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1249fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1250fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1251fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1252fb133d4bSJeremy L Thompson 1253fb133d4bSJeremy L Thompson // Setup 1254fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1255fb133d4bSJeremy L Thompson 1256fb133d4bSJeremy L Thompson // Ceed 1257fb133d4bSJeremy L Thompson { 1258fb133d4bSJeremy L Thompson Ceed ceed_parent; 1259fb133d4bSJeremy L Thompson 1260fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1261fb133d4bSJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 1262fb133d4bSJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 1263fb133d4bSJeremy L Thompson } 1264fb133d4bSJeremy L Thompson 1265fb133d4bSJeremy L Thompson // Point coordinates 1266fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1267fb133d4bSJeremy L Thompson 1268fb133d4bSJeremy L Thompson // Input and output vectors 1269fb133d4bSJeremy L Thompson { 1270fb133d4bSJeremy L Thompson CeedSize input_size, output_size; 1271fb133d4bSJeremy L Thompson 1272fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1273fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, input_size, &in_vec)); 1274fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, output_size, &out_vec)); 1275fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(out_vec, 0.0)); 1276fb133d4bSJeremy L Thompson } 1277fb133d4bSJeremy L Thompson 1278382e9c83SJeremy L Thompson // Clear input Qvecs 127986e10729SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 128086e10729SJeremy L Thompson CeedVector vec; 128186e10729SJeremy L Thompson 128286e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 128386e10729SJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) continue; 128486e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 128586e10729SJeremy L Thompson } 1286382e9c83SJeremy L Thompson 1287fb133d4bSJeremy L Thompson // Input Evecs and Restriction 1288fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 1289fb133d4bSJeremy L Thompson 1290fb133d4bSJeremy L Thompson // Loop through elements 1291fb133d4bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 1292fb133d4bSJeremy L Thompson CeedInt num_points, e_vec_size = 0; 1293fb133d4bSJeremy L Thompson 1294fb133d4bSJeremy L Thompson // Setup points for element 1295fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1296fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1297fb133d4bSJeremy L Thompson 1298fb133d4bSJeremy L Thompson // Input basis apply for non-active bases 1299fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 1300fb133d4bSJeremy L Thompson impl->point_coords_elem, true, e_data, impl, request)); 1301fb133d4bSJeremy L Thompson 1302fb133d4bSJeremy L Thompson // Loop over points on element 1303fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1304382e9c83SJeremy L Thompson bool is_active_at_points = true; 1305382e9c83SJeremy L Thompson CeedInt elem_size_active = 1; 1306382e9c83SJeremy L Thompson CeedRestrictionType rstr_type; 1307fb133d4bSJeremy L Thompson CeedVector vec; 1308382e9c83SJeremy L Thompson CeedElemRestriction elem_rstr; 1309fb133d4bSJeremy L Thompson 1310fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1311382e9c83SJeremy L Thompson // -- Skip non-active input 1312382e9c83SJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) continue; 1313fb133d4bSJeremy L Thompson 1314382e9c83SJeremy L Thompson // -- Get active restriction type 1315382e9c83SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1316382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1317382e9c83SJeremy L Thompson is_active_at_points = rstr_type == CEED_RESTRICTION_POINTS; 1318382e9c83SJeremy L Thompson if (!is_active_at_points) CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size_active)); 1319382e9c83SJeremy L Thompson else elem_size_active = num_points; 1320382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp_active)); 1321382e9c83SJeremy L Thompson 1322382e9c83SJeremy L Thompson e_vec_size = elem_size_active * num_comp_active; 1323382e9c83SJeremy L Thompson for (CeedInt s = 0; s < e_vec_size; s++) { 1324382e9c83SJeremy L Thompson CeedEvalMode eval_mode; 1325382e9c83SJeremy L Thompson CeedBasis basis; 1326382e9c83SJeremy L Thompson 1327382e9c83SJeremy L Thompson // -- Update unit vector 1328fb133d4bSJeremy L Thompson { 1329fb133d4bSJeremy L Thompson CeedScalar *array; 1330fb133d4bSJeremy L Thompson 133113062808SJeremy L Thompson if (s == 0) CeedCallBackend(CeedVectorSetValue(impl->e_vecs_in[i], 0.0)); 1332fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_in[i], CEED_MEM_HOST, &array)); 1333fb133d4bSJeremy L Thompson array[s] = 1.0; 1334fb133d4bSJeremy L Thompson if (s > 0) array[s - 1] = 0.0; 1335fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_in[i], &array)); 1336fb133d4bSJeremy L Thompson } 1337382e9c83SJeremy L Thompson // -- Basis action 1338958e607dSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1339fb133d4bSJeremy L Thompson switch (eval_mode) { 1340fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1341fb133d4bSJeremy L Thompson break; 1342fb133d4bSJeremy L Thompson // Note - these basis eval modes require FEM fields 1343fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1344fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1345fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1346fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 1347fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 1348fc0f7cc6SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, impl->point_coords_elem, impl->e_vecs_in[i], 1349fb133d4bSJeremy L Thompson impl->q_vecs_in[i])); 1350fb133d4bSJeremy L Thompson break; 1351fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: 1352fb133d4bSJeremy L Thompson break; // No action 1353fb133d4bSJeremy L Thompson } 1354fb133d4bSJeremy L Thompson 1355fb133d4bSJeremy L Thompson // -- Q function 1356fb133d4bSJeremy L Thompson if (!impl->is_identity_qf) { 1357fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1358fb133d4bSJeremy L Thompson } 1359fb133d4bSJeremy L Thompson 1360fb133d4bSJeremy L Thompson // -- Output basis apply and restriction 1361fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1362*f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 1363*f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 1364fb133d4bSJeremy L Thompson 1365fb133d4bSJeremy L Thompson // -- Grab diagonal value 136686e10729SJeremy L Thompson for (CeedInt j = 0; j < num_output_fields; j++) { 136764a7ec2fSZach Atkins bool is_active_output = false; 1368382e9c83SJeremy L Thompson CeedInt elem_size = 0; 1369fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1370fb133d4bSJeremy L Thompson CeedEvalMode eval_mode; 1371fb133d4bSJeremy L Thompson CeedVector vec; 1372fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1373fb133d4bSJeremy L Thompson CeedBasis basis; 1374fb133d4bSJeremy L Thompson 137586e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[j], &vec)); 13760c7f167fSZach Atkins // ---- Skip non-active output 137764a7ec2fSZach Atkins is_active_output = vec == CEED_VECTOR_ACTIVE; 137864a7ec2fSZach Atkins if (!is_active_output) continue; 1379fb133d4bSJeremy L Thompson 1380382e9c83SJeremy L Thompson // ---- Check if elem size matches 138186e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[j], &elem_rstr)); 1382382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1383382e9c83SJeremy L Thompson if (is_active_at_points && rstr_type != CEED_RESTRICTION_POINTS) continue; 1384382e9c83SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 1385382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(elem_rstr, e, &elem_size)); 1386382e9c83SJeremy L Thompson } else { 1387382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 1388382e9c83SJeremy L Thompson } 1389382e9c83SJeremy L Thompson { 1390382e9c83SJeremy L Thompson CeedInt num_comp = 0; 1391382e9c83SJeremy L Thompson 1392382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp)); 1393382e9c83SJeremy L Thompson if (e_vec_size != num_comp * elem_size) continue; 1394382e9c83SJeremy L Thompson } 1395382e9c83SJeremy L Thompson 1396fb133d4bSJeremy L Thompson // ---- Basis action 139786e10729SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[j], &eval_mode)); 1398fb133d4bSJeremy L Thompson switch (eval_mode) { 1399fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1400fb133d4bSJeremy L Thompson break; // No action 1401fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1402fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1403fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1404fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 140586e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[j], &basis)); 140686e10729SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, impl->point_coords_elem, impl->q_vecs_out[j], 140786e10729SJeremy L Thompson impl->e_vecs_out[j])); 1408fb133d4bSJeremy L Thompson break; 1409fb133d4bSJeremy L Thompson // LCOV_EXCL_START 1410fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: { 1411fb133d4bSJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 1412fb133d4bSJeremy L Thompson // LCOV_EXCL_STOP 1413fb133d4bSJeremy L Thompson } 1414fb133d4bSJeremy L Thompson } 1415fb133d4bSJeremy L Thompson // ---- Update output vector 1416fb133d4bSJeremy L Thompson { 1417fb133d4bSJeremy L Thompson CeedScalar *array, current_value = 0.0; 1418fb133d4bSJeremy L Thompson 141986e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1420fb133d4bSJeremy L Thompson current_value = array[s]; 142186e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 142286e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->e_vecs_out[j], 0.0)); 142386e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1424fb133d4bSJeremy L Thompson array[s] = current_value; 142586e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 1426fb133d4bSJeremy L Thompson } 1427fb133d4bSJeremy L Thompson // ---- Restrict output block 1428fb133d4bSJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 142986e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1430fb133d4bSJeremy L Thompson } else { 143186e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1432fb133d4bSJeremy L Thompson } 1433fb133d4bSJeremy L Thompson } 1434382e9c83SJeremy L Thompson // -- Reset unit vector 143513062808SJeremy L Thompson if (s == e_vec_size - 1) CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1436382e9c83SJeremy L Thompson } 1437fb133d4bSJeremy L Thompson } 1438fb133d4bSJeremy L Thompson num_points_offset += num_points; 1439fb133d4bSJeremy L Thompson } 1440fb133d4bSJeremy L Thompson 1441fb133d4bSJeremy L Thompson // Restore input arrays 1442fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 1443fb133d4bSJeremy L Thompson 1444fb133d4bSJeremy L Thompson // Cleanup 1445fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&in_vec)); 1446fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&out_vec)); 1447fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 1448fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1449fb133d4bSJeremy L Thompson return CEED_ERROR_SUCCESS; 1450fb133d4bSJeremy L Thompson } 1451e13f2367SZach Atkins 1452e13f2367SZach Atkins //------------------------------------------------------------------------------ 1453f10650afSjeremylt // Operator Destroy 1454f10650afSjeremylt //------------------------------------------------------------------------------ 1455f10650afSjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) { 1456f10650afSjeremylt CeedOperator_Ref *impl; 1457f10650afSjeremylt 1458ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 14593aab95c0SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_in)); 1460*f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_out)); 1461*f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_data_out_indices)); 1462*f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->apply_add_basis_out)); 14634fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs + impl->num_outputs; i++) { 14642b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_full[i])); 1465f10650afSjeremylt } 14662b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_full)); 14672b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->input_states)); 1468f10650afSjeremylt 14694fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs; i++) { 14702b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_in[i])); 14712b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_in[i])); 1472f10650afSjeremylt } 14732b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_in)); 14742b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_in)); 1475f10650afSjeremylt 14764fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_outputs; i++) { 14772b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_out[i])); 14782b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_out[i])); 1479f10650afSjeremylt } 14802b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_out)); 14812b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_out)); 148248acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->point_coords_elem)); 1483f10650afSjeremylt 14842b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl)); 1485e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 1486f10650afSjeremylt } 1487f10650afSjeremylt 1488f10650afSjeremylt //------------------------------------------------------------------------------ 1489713f43c3Sjeremylt // Operator Create 1490f10650afSjeremylt //------------------------------------------------------------------------------ 149121617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) { 1492fe2413ffSjeremylt Ceed ceed; 14934ce2993fSjeremylt CeedOperator_Ref *impl; 149421617c04Sjeremylt 1495ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 14962b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 14972b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 14982b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunction_Ref)); 14992b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionUpdate_Ref)); 15002b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAdd_Ref)); 15012b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1502e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 150321617c04Sjeremylt } 15042a86cc9dSSebastian Grimberg 15052a86cc9dSSebastian Grimberg //------------------------------------------------------------------------------ 150648acf710SJeremy L Thompson // Operator Create At Points 150748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 150848acf710SJeremy L Thompson int CeedOperatorCreateAtPoints_Ref(CeedOperator op) { 150948acf710SJeremy L Thompson Ceed ceed; 151048acf710SJeremy L Thompson CeedOperator_Ref *impl; 151148acf710SJeremy L Thompson 151248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 151348acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 151448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 1515e13f2367SZach Atkins CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunctionAtPoints_Ref)); 1516e13f2367SZach Atkins CeedCallBackend( 1517e13f2367SZach Atkins CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref)); 1518fb133d4bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleAddDiagonal", CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref)); 151948acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAddAtPoints_Ref)); 152048acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 152148acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 152248acf710SJeremy L Thompson } 152348acf710SJeremy L Thompson 152448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1525