15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 321617c04Sjeremylt // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 521617c04Sjeremylt // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 721617c04Sjeremylt 849aac155SJeremy L Thompson #include <ceed.h> 9ec3da8bcSJed Brown #include <ceed/backend.h> 103d576824SJeremy L Thompson #include <stdbool.h> 113d576824SJeremy L Thompson #include <stddef.h> 123d576824SJeremy L Thompson #include <stdint.h> 132b730f8bSJeremy L Thompson 1421617c04Sjeremylt #include "ceed-ref.h" 1521617c04Sjeremylt 16f10650afSjeremylt //------------------------------------------------------------------------------ 17f10650afSjeremylt // Setup Input/Output Fields 18f10650afSjeremylt //------------------------------------------------------------------------------ 19f8a0df59SJeremy L Thompson static int CeedOperatorSetupFields_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, CeedInt *e_data_out_indices, 20f8a0df59SJeremy L Thompson bool *apply_add_basis, CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, 21f8a0df59SJeremy L Thompson CeedInt num_fields, CeedInt Q) { 22aedaa0e5Sjeremylt Ceed ceed; 236efa0d72SZach Atkins CeedSize e_size, q_size; 24ad70ee2cSJeremy L Thompson CeedInt num_comp, size, P; 25d1d35e2fSjeremylt CeedQFunctionField *qf_fields; 26ad70ee2cSJeremy L Thompson CeedOperatorField *op_fields; 27ad70ee2cSJeremy L Thompson 28e910d748SJeremy L Thompson { 29e910d748SJeremy L Thompson Ceed ceed_parent; 30e910d748SJeremy L Thompson 31ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 32e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 33e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 34e910d748SJeremy L Thompson } 354fc1f125SJeremy L Thompson if (is_input) { 362b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 372b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 384fc1f125SJeremy L Thompson } else { 392b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 402b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 41fe2413ffSjeremylt } 4221617c04Sjeremylt 43885ac19cSjeremylt // Loop over fields 44d1d35e2fSjeremylt for (CeedInt i = 0; i < num_fields; i++) { 45d1d35e2fSjeremylt CeedEvalMode eval_mode; 46edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 47ad70ee2cSJeremy L Thompson CeedBasis basis; 48d1d35e2fSjeremylt 49ad70ee2cSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 50d1d35e2fSjeremylt if (eval_mode != CEED_EVAL_WEIGHT) { 51edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 52edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 53*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 54135a076eSjeremylt } 55135a076eSjeremylt 56d1d35e2fSjeremylt switch (eval_mode) { 57885ac19cSjeremylt case CEED_EVAL_NONE: 582b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 59d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 602b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 61aedaa0e5Sjeremylt break; 62aedaa0e5Sjeremylt case CEED_EVAL_INTERP: 63885ac19cSjeremylt case CEED_EVAL_GRAD: 64a915a514Srezgarshakeri case CEED_EVAL_DIV: 65c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 662b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 672b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 682b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 692b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 70d2643443SJeremy L Thompson e_size = (CeedSize)P * num_comp; 712b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 72d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 732b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 74*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 75885ac19cSjeremylt break; 76885ac19cSjeremylt case CEED_EVAL_WEIGHT: // Only on input fields 772b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 78d2643443SJeremy L Thompson q_size = (CeedSize)Q; 792b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 802b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_vecs[i])); 81*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 82885ac19cSjeremylt break; 8321617c04Sjeremylt } 84885ac19cSjeremylt } 85f8a0df59SJeremy L Thompson // Drop duplicate restrictions 863aab95c0SJeremy L Thompson if (is_input) { 873aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 883aab95c0SJeremy L Thompson CeedVector vec_i; 893aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 903aab95c0SJeremy L Thompson 913aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 923aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 933aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 943aab95c0SJeremy L Thompson CeedVector vec_j; 953aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 963aab95c0SJeremy L Thompson 973aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 983aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 993aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 1003aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 101f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 1023aab95c0SJeremy L Thompson skip_rstr[j] = true; 1033aab95c0SJeremy L Thompson } 104*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 105*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 1063aab95c0SJeremy L Thompson } 107*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 108*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 1093aab95c0SJeremy L Thompson } 110f8a0df59SJeremy L Thompson } else { 111f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 112f8a0df59SJeremy L Thompson CeedVector vec_i; 113f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 114f8a0df59SJeremy L Thompson 115f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 116f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 117f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 118f8a0df59SJeremy L Thompson CeedVector vec_j; 119f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 120f8a0df59SJeremy L Thompson 121f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 122f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 123f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 124f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 125f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 126f8a0df59SJeremy L Thompson skip_rstr[j] = true; 127f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 128f8a0df59SJeremy L Thompson e_data_out_indices[j] = i; 129f8a0df59SJeremy L Thompson } 130*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 131*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 132f8a0df59SJeremy L Thompson } 133*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 134*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 135f8a0df59SJeremy L Thompson } 1363aab95c0SJeremy L Thompson } 137e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 13821617c04Sjeremylt } 13921617c04Sjeremylt 140f10650afSjeremylt //------------------------------------------------------------------------------ 141f10650afSjeremylt // Setup Operator 142f10650afSjeremylt //------------------------------------------------------------------------------/* 143885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) { 1448c1105f8SJeremy L Thompson bool is_setup_done; 145ad70ee2cSJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 146ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 147ad70ee2cSJeremy L Thompson CeedQFunction qf; 148ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 149ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 150ad70ee2cSJeremy L Thompson 1512b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 1528c1105f8SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 153ad70ee2cSJeremy L Thompson 1542b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1552b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1562b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 1572b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 1582b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1592b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 160885ac19cSjeremylt 161885ac19cSjeremylt // Allocate 1622b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 163885ac19cSjeremylt 1643aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 165f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 166f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_data_out_indices)); 167f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 1682b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 1692b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 1702b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 1712b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 1722b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 173885ac19cSjeremylt 1744fc1f125SJeremy L Thompson impl->num_inputs = num_input_fields; 1754fc1f125SJeremy L Thompson impl->num_outputs = num_output_fields; 176885ac19cSjeremylt 177d1d35e2fSjeremylt // Set up infield and outfield e_vecs and q_vecs 178885ac19cSjeremylt // Infields 179f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, true, impl->skip_rstr_in, NULL, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 180f8a0df59SJeremy L Thompson num_input_fields, Q)); 1813aab95c0SJeremy L Thompson // Outfields 182f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, false, impl->skip_rstr_out, impl->e_data_out_indices, impl->apply_add_basis_out, 183f8a0df59SJeremy L Thompson impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 184885ac19cSjeremylt 18516911fdaSjeremylt // Identity QFunctions 1860b454692Sjeremylt if (impl->is_identity_qf) { 187d1d35e2fSjeremylt CeedEvalMode in_mode, out_mode; 188d1d35e2fSjeremylt CeedQFunctionField *in_fields, *out_fields; 189ad70ee2cSJeremy L Thompson 1902b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 1912b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 1922b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 193d1d35e2fSjeremylt 1940b454692Sjeremylt if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 195edb2538eSJeremy L Thompson impl->is_identity_rstr_op = true; 1960b454692Sjeremylt } else { 197db002c03SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 19816911fdaSjeremylt } 19916911fdaSjeremylt } 20016911fdaSjeremylt 2012b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 202e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 203885ac19cSjeremylt } 204885ac19cSjeremylt 205f10650afSjeremylt //------------------------------------------------------------------------------ 206f10650afSjeremylt // Setup Operator Inputs 207f10650afSjeremylt //------------------------------------------------------------------------------ 2082b730f8bSJeremy L Thompson static inline int CeedOperatorSetupInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2092b730f8bSJeremy L Thompson CeedVector in_vec, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 210a0162de9SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 211ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 212*681d0ea7SJeremy L Thompson bool is_active; 213ad70ee2cSJeremy L Thompson uint64_t state; 214d1d35e2fSjeremylt CeedEvalMode eval_mode; 215d1bcdac9Sjeremylt CeedVector vec; 216885ac19cSjeremylt 217d1bcdac9Sjeremylt // Get input vector 2182b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 219*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 220*681d0ea7SJeremy L Thompson if (is_active) { 2212b730f8bSJeremy L Thompson if (skip_active) continue; 2222b730f8bSJeremy L Thompson else vec = in_vec; 2231d102b48SJeremy L Thompson } 2241d102b48SJeremy L Thompson 2252b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2261d102b48SJeremy L Thompson // Restrict and Evec 227d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 2281d102b48SJeremy L Thompson } else { 229668048e2SJed Brown // Restrict 2302b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 2318d713cf6Sjeremylt // Skip restriction if input is unchanged 2323aab95c0SJeremy L Thompson if ((state != impl->input_states[i] || vec == in_vec) && !impl->skip_rstr_in[i]) { 233*681d0ea7SJeremy L Thompson CeedElemRestriction elem_rstr; 234*681d0ea7SJeremy L Thompson 235edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 236edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 237*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 2388d713cf6Sjeremylt } 2393aab95c0SJeremy L Thompson impl->input_states[i] = state; 240668048e2SJed Brown // Get evec 2412b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data_full[i])); 242885ac19cSjeremylt } 243*681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 244885ac19cSjeremylt } 245e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 246885ac19cSjeremylt } 247885ac19cSjeremylt 248f10650afSjeremylt //------------------------------------------------------------------------------ 249f10650afSjeremylt // Input Basis Action 250f10650afSjeremylt //------------------------------------------------------------------------------ 2512b730f8bSJeremy L Thompson static inline int CeedOperatorInputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2522b730f8bSJeremy L Thompson CeedInt num_input_fields, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 2532b730f8bSJeremy L Thompson CeedOperator_Ref *impl) { 254ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 255a915a514Srezgarshakeri CeedInt elem_size, size, num_comp; 256d1d35e2fSjeremylt CeedEvalMode eval_mode; 257edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2581d102b48SJeremy L Thompson CeedBasis basis; 2591d102b48SJeremy L Thompson 2601d102b48SJeremy L Thompson // Skip active input 261d1d35e2fSjeremylt if (skip_active) { 262*681d0ea7SJeremy L Thompson bool is_active; 2631d102b48SJeremy L Thompson CeedVector vec; 264ad70ee2cSJeremy L Thompson 2652b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 266*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 267*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 268*681d0ea7SJeremy L Thompson if (is_active) continue; 2691d102b48SJeremy L Thompson } 270d1d35e2fSjeremylt // Get elem_size, eval_mode, size 271edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 272edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 273*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 2742b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2752b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 276885ac19cSjeremylt // Basis action 277d1d35e2fSjeremylt switch (eval_mode) { 278885ac19cSjeremylt case CEED_EVAL_NONE: 27981670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * Q * size])); 280885ac19cSjeremylt break; 281885ac19cSjeremylt case CEED_EVAL_INTERP: 282885ac19cSjeremylt case CEED_EVAL_GRAD: 283a915a514Srezgarshakeri case CEED_EVAL_DIV: 284c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 285a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 286a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 28781670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * elem_size * num_comp])); 288c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, eval_mode, impl->e_vecs_in[i], impl->q_vecs_in[i])); 289*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 290a915a514Srezgarshakeri break; 291885ac19cSjeremylt case CEED_EVAL_WEIGHT: 292885ac19cSjeremylt break; // No action 293885ac19cSjeremylt } 294885ac19cSjeremylt } 295e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 296885ac19cSjeremylt } 297885ac19cSjeremylt 298f10650afSjeremylt //------------------------------------------------------------------------------ 299f10650afSjeremylt // Output Basis Action 300f10650afSjeremylt //------------------------------------------------------------------------------ 3012b730f8bSJeremy L Thompson static inline int CeedOperatorOutputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_output_fields, CeedOperatorField *op_output_fields, 302f8a0df59SJeremy L Thompson CeedInt num_input_fields, CeedInt num_output_fields, bool *apply_add_basis, CeedOperator op, 3034fc1f125SJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 304ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 305a915a514Srezgarshakeri CeedInt elem_size, num_comp; 306d1d35e2fSjeremylt CeedEvalMode eval_mode; 307edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 3081d102b48SJeremy L Thompson CeedBasis basis; 3091d102b48SJeremy L Thompson 310a915a514Srezgarshakeri // Get elem_size, eval_mode 311edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 312edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 313*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 3142b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 315885ac19cSjeremylt // Basis action 316d1d35e2fSjeremylt switch (eval_mode) { 317885ac19cSjeremylt case CEED_EVAL_NONE: 318885ac19cSjeremylt break; // No action 319885ac19cSjeremylt case CEED_EVAL_INTERP: 320885ac19cSjeremylt case CEED_EVAL_GRAD: 321a915a514Srezgarshakeri case CEED_EVAL_DIV: 322c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 323a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 324a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 32581670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, 32681670346SSebastian Grimberg &e_data_full[i + num_input_fields][(CeedSize)e * elem_size * num_comp])); 327f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 328f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAdd(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 329f8a0df59SJeremy L Thompson } else { 330c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 331f8a0df59SJeremy L Thompson } 332*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 333a915a514Srezgarshakeri break; 334c042f62fSJeremy L Thompson // LCOV_EXCL_START 335bbfacfcdSjeremylt case CEED_EVAL_WEIGHT: { 3366e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 3371d102b48SJeremy L Thompson // LCOV_EXCL_STOP 338885ac19cSjeremylt } 339885ac19cSjeremylt } 340885ac19cSjeremylt } 341e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3421d102b48SJeremy L Thompson } 3431d102b48SJeremy L Thompson 344f10650afSjeremylt //------------------------------------------------------------------------------ 345f10650afSjeremylt // Restore Input Vectors 346f10650afSjeremylt //------------------------------------------------------------------------------ 3472b730f8bSJeremy L Thompson static inline int CeedOperatorRestoreInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 3482b730f8bSJeremy L Thompson const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 349ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 350d1d35e2fSjeremylt CeedEvalMode eval_mode; 3511d102b48SJeremy L Thompson 3521d102b48SJeremy L Thompson // Skip active inputs 353d1d35e2fSjeremylt if (skip_active) { 354*681d0ea7SJeremy L Thompson bool is_active; 3551d102b48SJeremy L Thompson CeedVector vec; 356ad70ee2cSJeremy L Thompson 3572b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 358*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 359*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 360*681d0ea7SJeremy L Thompson if (is_active) continue; 3611d102b48SJeremy L Thompson } 3621d102b48SJeremy L Thompson // Restore input 3632b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 364d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 3651d102b48SJeremy L Thompson } else { 3662b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data_full[i])); 3671d102b48SJeremy L Thompson } 3681d102b48SJeremy L Thompson } 369e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3701d102b48SJeremy L Thompson } 3711d102b48SJeremy L Thompson 372f10650afSjeremylt //------------------------------------------------------------------------------ 373f10650afSjeremylt // Operator Apply 374f10650afSjeremylt //------------------------------------------------------------------------------ 3752b730f8bSJeremy L Thompson static int CeedOperatorApplyAdd_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 376d1d35e2fSjeremylt CeedInt Q, num_elem, num_input_fields, num_output_fields, size; 377ad70ee2cSJeremy L Thompson CeedEvalMode eval_mode; 378ad70ee2cSJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 379ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 380ad70ee2cSJeremy L Thompson CeedQFunction qf; 381ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 382ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 383ad70ee2cSJeremy L Thompson 384ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 385ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 3862b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 3872b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 3882b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 3892b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 3901d102b48SJeremy L Thompson 3911d102b48SJeremy L Thompson // Setup 3922b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 3931d102b48SJeremy L Thompson 3940b454692Sjeremylt // Restriction only operator 395edb2538eSJeremy L Thompson if (impl->is_identity_rstr_op) { 396edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 397ad70ee2cSJeremy L Thompson 398edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[0], &elem_rstr)); 399edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_full[0], request)); 400*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 401edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[0], &elem_rstr)); 402edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[0], out_vec, request)); 403*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 4040b454692Sjeremylt return CEED_ERROR_SUCCESS; 4050b454692Sjeremylt } 4060b454692Sjeremylt 4071d102b48SJeremy L Thompson // Input Evecs and Restriction 4082b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, false, e_data_full, impl, request)); 4091d102b48SJeremy L Thompson 4101d102b48SJeremy L Thompson // Output Evecs 411f8a0df59SJeremy L Thompson for (CeedInt i = num_output_fields - 1; i >= 0; i--) { 412f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) { 413f8a0df59SJeremy L Thompson e_data_full[i + num_input_fields] = e_data_full[impl->e_data_out_indices[i] + num_input_fields]; 414f8a0df59SJeremy L Thompson } else { 4152b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_full[i + impl->num_inputs], CEED_MEM_HOST, &e_data_full[i + num_input_fields])); 4161d102b48SJeremy L Thompson } 417f8a0df59SJeremy L Thompson } 4181d102b48SJeremy L Thompson 4191d102b48SJeremy L Thompson // Loop through elements 420d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 4211d102b48SJeremy L Thompson // Output pointers 422d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 4232b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 424d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_NONE) { 4252b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 42681670346SSebastian Grimberg CeedCallBackend( 42781670346SSebastian Grimberg CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][(CeedSize)e * Q * size])); 4281d102b48SJeremy L Thompson } 4291d102b48SJeremy L Thompson } 4301d102b48SJeremy L Thompson 43116911fdaSjeremylt // Input basis apply 4322b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, false, e_data_full, impl)); 43316911fdaSjeremylt 4341d102b48SJeremy L Thompson // Q function 4350b454692Sjeremylt if (!impl->is_identity_qf) { 4362b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 43716911fdaSjeremylt } 4381d102b48SJeremy L Thompson 4391d102b48SJeremy L Thompson // Output basis apply 440f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasis_Ref(e, Q, qf_output_fields, op_output_fields, num_input_fields, num_output_fields, 441f8a0df59SJeremy L Thompson impl->apply_add_basis_out, op, e_data_full, impl)); 4421d102b48SJeremy L Thompson } 443885ac19cSjeremylt 444885ac19cSjeremylt // Output restriction 445d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 446*681d0ea7SJeremy L Thompson bool is_active; 447ad70ee2cSJeremy L Thompson CeedVector vec; 448edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 449ad70ee2cSJeremy L Thompson 450f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) continue; 451d1d35e2fSjeremylt // Restore Evec 4522b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_full[i + impl->num_inputs], &e_data_full[i + num_input_fields])); 453d1bcdac9Sjeremylt // Get output vector 4542b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 455668048e2SJed Brown // Active 456*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 457*681d0ea7SJeremy L Thompson if (is_active) vec = out_vec; 4587ca8db16Sjeremylt // Restrict 459edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 460edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[i + impl->num_inputs], vec, request)); 461*681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 462*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 463885ac19cSjeremylt } 464885ac19cSjeremylt 4657ca8db16Sjeremylt // Restore input arrays 4662b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, false, e_data_full, impl)); 467e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 46821617c04Sjeremylt } 46921617c04Sjeremylt 470f10650afSjeremylt //------------------------------------------------------------------------------ 47170a7ffb3SJeremy L Thompson // Core code for assembling linear QFunction 472f10650afSjeremylt //------------------------------------------------------------------------------ 4732b730f8bSJeremy L Thompson static inline int CeedOperatorLinearAssembleQFunctionCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, CeedElemRestriction *rstr, 47470a7ffb3SJeremy L Thompson CeedRequest *request) { 475e910d748SJeremy L Thompson Ceed ceed, ceed_parent; 476ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, Q, num_elem, num_input_fields, num_output_fields; 477ad70ee2cSJeremy L Thompson CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 478ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 479ad70ee2cSJeremy L Thompson CeedQFunction qf; 480ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 481ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 482ad70ee2cSJeremy L Thompson 4832b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 484e910d748SJeremy L Thompson CeedCallBackend(CeedOperatorGetFallbackParentCeed(op, &ceed_parent)); 485e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 486ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 487ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 488e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 489e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 490e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 491e984cf9aSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 492e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 4931d102b48SJeremy L Thompson 4941d102b48SJeremy L Thompson // Setup 4952b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 4961d102b48SJeremy L Thompson 497506b1a0cSSebastian Grimberg // Check for restriction only operator 498506b1a0cSSebastian Grimberg CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 49916911fdaSjeremylt 5001d102b48SJeremy L Thompson // Input Evecs and Restriction 5012b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 5021d102b48SJeremy L Thompson 5031d102b48SJeremy L Thompson // Count number of active input fields 504ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 505d1d35e2fSjeremylt for (CeedInt i = 0; i < num_input_fields; i++) { 506c7b67790SJeremy L Thompson CeedInt field_size; 507ad70ee2cSJeremy L Thompson CeedVector vec; 508ad70ee2cSJeremy L Thompson 5091d102b48SJeremy L Thompson // Get input vector 5102b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 5111d102b48SJeremy L Thompson // Check if active input 5121d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 513c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 5142b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 515ff8551c5SJeremy L Thompson qf_size_in += field_size; 5161d102b48SJeremy L Thompson } 517*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 5181d102b48SJeremy L Thompson } 519ff8551c5SJeremy L Thompson CeedCheck(qf_size_in > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 520ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 521bb219a0fSJeremy L Thompson } 5221d102b48SJeremy L Thompson 5231d102b48SJeremy L Thompson // Count number of active output fields 524ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 525d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 526c7b67790SJeremy L Thompson CeedInt field_size; 527ad70ee2cSJeremy L Thompson CeedVector vec; 528ad70ee2cSJeremy L Thompson 5291d102b48SJeremy L Thompson // Get output vector 5302b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 5311d102b48SJeremy L Thompson // Check if active output 5321d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 533c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 534ff8551c5SJeremy L Thompson qf_size_out += field_size; 5351d102b48SJeremy L Thompson } 536*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 5371d102b48SJeremy L Thompson } 538ff8551c5SJeremy L Thompson CeedCheck(qf_size_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 539ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 540bb219a0fSJeremy L Thompson } 5411d102b48SJeremy L Thompson 54270a7ffb3SJeremy L Thompson // Build objects if needed 54370a7ffb3SJeremy L Thompson if (build_objects) { 544ff8551c5SJeremy L Thompson const CeedSize l_size = (CeedSize)num_elem * Q * qf_size_in * qf_size_out; 545ff8551c5SJeremy L Thompson CeedInt strides[3] = {1, Q, qf_size_in * qf_size_out * Q}; /* *NOPAD* */ 546ad70ee2cSJeremy L Thompson 547ad70ee2cSJeremy L Thompson // Create output restriction 5480a5597ceSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, Q, qf_size_in * qf_size_out, 5490a5597ceSJeremy L Thompson (CeedSize)qf_size_in * (CeedSize)qf_size_out * (CeedSize)num_elem * (CeedSize)Q, strides, rstr)); 5501d102b48SJeremy L Thompson // Create assembled vector 551e910d748SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_parent, l_size, assembled)); 55270a7ffb3SJeremy L Thompson } 55370a7ffb3SJeremy L Thompson // Clear output vector 5542b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 555ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 5561d102b48SJeremy L Thompson 5571d102b48SJeremy L Thompson // Loop through elements 558d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 5591d102b48SJeremy L Thompson // Input basis apply 5602b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, true, e_data_full, impl)); 5611d102b48SJeremy L Thompson 5621d102b48SJeremy L Thompson // Assemble QFunction 563c7b67790SJeremy L Thompson 564c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 565*681d0ea7SJeremy L Thompson bool is_active; 566c7b67790SJeremy L Thompson CeedInt field_size; 567c7b67790SJeremy L Thompson CeedVector vec; 568c7b67790SJeremy L Thompson 5691d102b48SJeremy L Thompson // Set Inputs 570c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 571*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 572*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 573*681d0ea7SJeremy L Thompson if (!is_active) continue; 574c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 575c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 576c7b67790SJeremy L Thompson // Set current portion of input to 1.0 577c7b67790SJeremy L Thompson { 578c7b67790SJeremy L Thompson CeedScalar *array; 579c7b67790SJeremy L Thompson 580c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 581c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 1.0; 582c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 58342ea3801Sjeremylt } 584c7b67790SJeremy L Thompson 585506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 5861d102b48SJeremy L Thompson // Set Outputs 587d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 588ad70ee2cSJeremy L Thompson CeedVector vec; 589ad70ee2cSJeremy L Thompson 5901d102b48SJeremy L Thompson // Get output vector 5912b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5921d102b48SJeremy L Thompson // Check if active output 5931d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 594c7b67790SJeremy L Thompson CeedInt field_size; 595c7b67790SJeremy L Thompson 596ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 597c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 598c7b67790SJeremy L Thompson assembled_array += field_size * Q; // Advance the pointer by the size of the output 5991d102b48SJeremy L Thompson } 600*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 6011d102b48SJeremy L Thompson } 6021d102b48SJeremy L Thompson // Apply QFunction 6032b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 604506b1a0cSSebastian Grimberg } else { 605c7b67790SJeremy L Thompson CeedInt field_size; 606c7b67790SJeremy L Thompson const CeedScalar *array; 607506b1a0cSSebastian Grimberg 608506b1a0cSSebastian Grimberg // Copy Identity Outputs 609c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 610c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 611c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * Q; j++) assembled_array[j] = array[j]; 612c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 613c7b67790SJeremy L Thompson assembled_array += field_size * Q; 614c7b67790SJeremy L Thompson } 615c7b67790SJeremy L Thompson // Reset input to 0.0 616c7b67790SJeremy L Thompson { 617c7b67790SJeremy L Thompson CeedScalar *array; 618c7b67790SJeremy L Thompson 619c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 620c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 0.0; 621c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 622c7b67790SJeremy L Thompson } 623506b1a0cSSebastian Grimberg } 6241d102b48SJeremy L Thompson } 6251d102b48SJeremy L Thompson } 6261d102b48SJeremy L Thompson 6271d102b48SJeremy L Thompson // Un-set output Qvecs to prevent accidental overwrite of Assembled 628506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 629d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 630ad70ee2cSJeremy L Thompson CeedVector vec; 631ad70ee2cSJeremy L Thompson 6321d102b48SJeremy L Thompson // Get output vector 6332b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 6341d102b48SJeremy L Thompson // Check if active output 635056ea4bdSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 6362b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 6371d102b48SJeremy L Thompson } 638*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 6391d102b48SJeremy L Thompson } 640506b1a0cSSebastian Grimberg } 6411d102b48SJeremy L Thompson 6421d102b48SJeremy L Thompson // Restore input arrays 6432b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 6441d102b48SJeremy L Thompson 6451d102b48SJeremy L Thompson // Restore output 646ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 647e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 6481d102b48SJeremy L Thompson } 6491d102b48SJeremy L Thompson 650f10650afSjeremylt //------------------------------------------------------------------------------ 65170a7ffb3SJeremy L Thompson // Assemble Linear QFunction 65270a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6532b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunction_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 6542b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, true, assembled, rstr, request); 65570a7ffb3SJeremy L Thompson } 65670a7ffb3SJeremy L Thompson 65770a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 65870a7ffb3SJeremy L Thompson // Update Assembled Linear QFunction 65970a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6602b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunctionUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, CeedRequest *request) { 6612b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, false, &assembled, &rstr, request); 66270a7ffb3SJeremy L Thompson } 66370a7ffb3SJeremy L Thompson 66470a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 66548acf710SJeremy L Thompson // Setup Input/Output Fields 66648acf710SJeremy L Thompson //------------------------------------------------------------------------------ 667f8a0df59SJeremy L Thompson static int CeedOperatorSetupFieldsAtPoints_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, bool *apply_add_basis, 668f8a0df59SJeremy L Thompson CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, 669f8a0df59SJeremy L Thompson CeedInt Q) { 67048acf710SJeremy L Thompson Ceed ceed; 67148acf710SJeremy L Thompson CeedSize e_size, q_size; 672ff1bc20eSJeremy L Thompson CeedInt max_num_points, num_comp, size, P; 67348acf710SJeremy L Thompson CeedQFunctionField *qf_fields; 67448acf710SJeremy L Thompson CeedOperatorField *op_fields; 67548acf710SJeremy L Thompson 676e910d748SJeremy L Thompson { 677e910d748SJeremy L Thompson Ceed ceed_parent; 678e910d748SJeremy L Thompson 67948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 680e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 681e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 682e910d748SJeremy L Thompson } 68348acf710SJeremy L Thompson if (is_input) { 68448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 68548acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 68648acf710SJeremy L Thompson } else { 68748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 68848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 68948acf710SJeremy L Thompson } 69048acf710SJeremy L Thompson 69148acf710SJeremy L Thompson // Get max number of points 69248acf710SJeremy L Thompson { 69348acf710SJeremy L Thompson CeedInt dim; 69448acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 69548acf710SJeremy L Thompson CeedOperator_Ref *impl; 69648acf710SJeremy L Thompson 69748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, NULL)); 69848acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 69948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(rstr_points, &dim)); 70048acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 70148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 702b37f8825SJeremy L Thompson if (is_input) { 703b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, dim * max_num_points, &impl->point_coords_elem)); 704b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->point_coords_elem, 0.0)); 705b37f8825SJeremy L Thompson } 70648acf710SJeremy L Thompson } 70748acf710SJeremy L Thompson 70848acf710SJeremy L Thompson // Loop over fields 70948acf710SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 71048acf710SJeremy L Thompson CeedEvalMode eval_mode; 71148acf710SJeremy L Thompson CeedBasis basis; 71248acf710SJeremy L Thompson 71348acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 71448acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) { 71548acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 71648acf710SJeremy L Thompson 71748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 71848acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 719*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 720ff1bc20eSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(e_vecs_full[i + start_e], 0.0)); 7216efa0d72SZach Atkins } 72248acf710SJeremy L Thompson 72348acf710SJeremy L Thompson switch (eval_mode) { 72438e83183SJeremy L Thompson case CEED_EVAL_NONE: { 72538e83183SJeremy L Thompson CeedVector vec; 72638e83183SJeremy L Thompson 72748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 72848acf710SJeremy L Thompson e_size = (CeedSize)max_num_points * size; 72948acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 73038e83183SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec)); 73138e83183SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE || !is_input) { 73238e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &q_vecs[i])); 73338e83183SJeremy L Thompson } else { 73448acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 73548acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 73638e83183SJeremy L Thompson } 737*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 73848acf710SJeremy L Thompson break; 73938e83183SJeremy L Thompson } 74048acf710SJeremy L Thompson case CEED_EVAL_INTERP: 74148acf710SJeremy L Thompson case CEED_EVAL_GRAD: 74248acf710SJeremy L Thompson case CEED_EVAL_DIV: 74348acf710SJeremy L Thompson case CEED_EVAL_CURL: 74448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 74548acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 74648acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 74748acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 74848acf710SJeremy L Thompson e_size = (CeedSize)P * num_comp; 74948acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 75048acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 75148acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 752*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 75348acf710SJeremy L Thompson break; 75448acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: // Only on input fields 75548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 75648acf710SJeremy L Thompson q_size = (CeedSize)max_num_points; 75748acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 75848acf710SJeremy L Thompson CeedCallBackend( 759fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &max_num_points, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, CEED_VECTOR_NONE, q_vecs[i])); 760*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 76148acf710SJeremy L Thompson break; 76248acf710SJeremy L Thompson } 763ecc797dfSJeremy L Thompson // Initialize full arrays for E-vectors and Q-vectors 764297a0f46SJeremy L Thompson if (e_vecs[i]) CeedCallBackend(CeedVectorSetValue(e_vecs[i], 0.0)); 765297a0f46SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) CeedCallBackend(CeedVectorSetValue(q_vecs[i], 0.0)); 76648acf710SJeremy L Thompson } 767f8a0df59SJeremy L Thompson // Drop duplicate restrictions 7683aab95c0SJeremy L Thompson if (is_input) { 7693aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 7703aab95c0SJeremy L Thompson CeedVector vec_i; 7713aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 7723aab95c0SJeremy L Thompson 7733aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 7743aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 7753aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 7763aab95c0SJeremy L Thompson CeedVector vec_j; 7773aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 7783aab95c0SJeremy L Thompson 7793aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 7803aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 7813aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 7823aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 783f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 7843aab95c0SJeremy L Thompson skip_rstr[j] = true; 7853aab95c0SJeremy L Thompson } 786*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 787*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 7883aab95c0SJeremy L Thompson } 789*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 790*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 7913aab95c0SJeremy L Thompson } 792f8a0df59SJeremy L Thompson } else { 793f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 794f8a0df59SJeremy L Thompson CeedVector vec_i; 795f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 796f8a0df59SJeremy L Thompson 797f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 798f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 799f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 800f8a0df59SJeremy L Thompson CeedVector vec_j; 801f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 802f8a0df59SJeremy L Thompson 803f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 804f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 805f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 806f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 807f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 808f8a0df59SJeremy L Thompson skip_rstr[j] = true; 809f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 810f8a0df59SJeremy L Thompson } 811*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 812*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 813f8a0df59SJeremy L Thompson } 814*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 815*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 816f8a0df59SJeremy L Thompson } 8173aab95c0SJeremy L Thompson } 81848acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 81948acf710SJeremy L Thompson } 82048acf710SJeremy L Thompson 82148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82248acf710SJeremy L Thompson // Setup Operator 82348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82448acf710SJeremy L Thompson static int CeedOperatorSetupAtPoints_Ref(CeedOperator op) { 82548acf710SJeremy L Thompson bool is_setup_done; 82648acf710SJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 82748acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 82848acf710SJeremy L Thompson CeedQFunction qf; 82948acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 83048acf710SJeremy L Thompson CeedOperator_Ref *impl; 83148acf710SJeremy L Thompson 83248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 83348acf710SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 83448acf710SJeremy L Thompson 83548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 83648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 83748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 83848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 83948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 84048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 84148acf710SJeremy L Thompson 84248acf710SJeremy L Thompson // Allocate 84348acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 84448acf710SJeremy L Thompson 8453aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 846f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 847f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 84848acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 84948acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 85048acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 85148acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 85248acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 85348acf710SJeremy L Thompson 85448acf710SJeremy L Thompson impl->num_inputs = num_input_fields; 85548acf710SJeremy L Thompson impl->num_outputs = num_output_fields; 85648acf710SJeremy L Thompson 85748acf710SJeremy L Thompson // Set up infield and outfield pointer arrays 85848acf710SJeremy L Thompson // Infields 859f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, true, impl->skip_rstr_in, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 8603aab95c0SJeremy L Thompson num_input_fields, Q)); 86148acf710SJeremy L Thompson // Outfields 862f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, false, impl->skip_rstr_out, impl->apply_add_basis_out, impl->e_vecs_full, 863f8a0df59SJeremy L Thompson impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 86448acf710SJeremy L Thompson 86548acf710SJeremy L Thompson // Identity QFunctions 86648acf710SJeremy L Thompson if (impl->is_identity_qf) { 86748acf710SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 86838e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->e_vecs_out[0])); 86948acf710SJeremy L Thompson } 87048acf710SJeremy L Thompson 87148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 87248acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 87348acf710SJeremy L Thompson } 87448acf710SJeremy L Thompson 87548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 87648acf710SJeremy L Thompson // Input Basis Action 87748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 87848acf710SJeremy L Thompson static inline int CeedOperatorInputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_input_fields, 87948acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedInt num_input_fields, CeedVector in_vec, 88048acf710SJeremy L Thompson CeedVector point_coords_elem, bool skip_active, CeedScalar *e_data[2 * CEED_FIELD_MAX], 88148acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 88248acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 883*681d0ea7SJeremy L Thompson bool is_active; 88448acf710SJeremy L Thompson CeedInt elem_size, size, num_comp; 88548acf710SJeremy L Thompson CeedRestrictionType rstr_type; 88648acf710SJeremy L Thompson CeedEvalMode eval_mode; 88748acf710SJeremy L Thompson CeedVector vec; 88848acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 88948acf710SJeremy L Thompson CeedBasis basis; 89048acf710SJeremy L Thompson 89148acf710SJeremy L Thompson // Skip active input 892*681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 893*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 894*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 895*681d0ea7SJeremy L Thompson if (skip_active && is_active) continue; 89648acf710SJeremy L Thompson 89748acf710SJeremy L Thompson // Get elem_size, eval_mode, size 89848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 89948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 90048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 90148acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 90248acf710SJeremy L Thompson // Restrict block active input 903*681d0ea7SJeremy L Thompson if (is_active && !impl->skip_rstr_in[i]) { 90448acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 90548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 90648acf710SJeremy L Thompson } else { 90748acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 90848acf710SJeremy L Thompson } 90948acf710SJeremy L Thompson } 91048acf710SJeremy L Thompson // Basis action 91148acf710SJeremy L Thompson switch (eval_mode) { 91248acf710SJeremy L Thompson case CEED_EVAL_NONE: 913*681d0ea7SJeremy L Thompson if (!is_active) { 91448acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][num_points_offset * size])); 91548acf710SJeremy L Thompson } 91648acf710SJeremy L Thompson break; 91748acf710SJeremy L Thompson // Note - these basis eval modes require FEM fields 91848acf710SJeremy L Thompson case CEED_EVAL_INTERP: 91948acf710SJeremy L Thompson case CEED_EVAL_GRAD: 92048acf710SJeremy L Thompson case CEED_EVAL_DIV: 92148acf710SJeremy L Thompson case CEED_EVAL_CURL: 92248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 923*681d0ea7SJeremy L Thompson if (!is_active) { 92448acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 92548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 92681670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][(CeedSize)e * elem_size * num_comp])); 92748acf710SJeremy L Thompson } 92848acf710SJeremy L Thompson CeedCallBackend( 929fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, point_coords_elem, impl->e_vecs_in[i], impl->q_vecs_in[i])); 930*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 93148acf710SJeremy L Thompson break; 93248acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: 93348acf710SJeremy L Thompson break; // No action 93448acf710SJeremy L Thompson } 935*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 93648acf710SJeremy L Thompson } 93748acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 93848acf710SJeremy L Thompson } 93948acf710SJeremy L Thompson 94048acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94148acf710SJeremy L Thompson // Output Basis Action 94248acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94348acf710SJeremy L Thompson static inline int CeedOperatorOutputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_output_fields, 94448acf710SJeremy L Thompson CeedOperatorField *op_output_fields, CeedInt num_input_fields, CeedInt num_output_fields, 945f8a0df59SJeremy L Thompson bool *apply_add_basis, bool *skip_rstr, CeedOperator op, CeedVector out_vec, 946f8a0df59SJeremy L Thompson CeedVector point_coords_elem, CeedOperator_Ref *impl, CeedRequest *request) { 94748acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 948*681d0ea7SJeremy L Thompson bool is_active; 94948acf710SJeremy L Thompson CeedRestrictionType rstr_type; 95048acf710SJeremy L Thompson CeedEvalMode eval_mode; 95148acf710SJeremy L Thompson CeedVector vec; 95248acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 95348acf710SJeremy L Thompson CeedBasis basis; 95448acf710SJeremy L Thompson 95548acf710SJeremy L Thompson // Get elem_size, eval_mode, size 95648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 95748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 95848acf710SJeremy L Thompson // Basis action 95948acf710SJeremy L Thompson switch (eval_mode) { 96048acf710SJeremy L Thompson case CEED_EVAL_NONE: 96148acf710SJeremy L Thompson break; // No action 96248acf710SJeremy L Thompson case CEED_EVAL_INTERP: 96348acf710SJeremy L Thompson case CEED_EVAL_GRAD: 96448acf710SJeremy L Thompson case CEED_EVAL_DIV: 96548acf710SJeremy L Thompson case CEED_EVAL_CURL: 96648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 967f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 968f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAddAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], 969f8a0df59SJeremy L Thompson impl->e_vecs_out[i])); 970f8a0df59SJeremy L Thompson } else { 97148acf710SJeremy L Thompson CeedCallBackend( 972fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], impl->e_vecs_out[i])); 973f8a0df59SJeremy L Thompson } 974*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 97548acf710SJeremy L Thompson break; 97648acf710SJeremy L Thompson // LCOV_EXCL_START 97748acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: { 9786e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 97948acf710SJeremy L Thompson // LCOV_EXCL_STOP 98048acf710SJeremy L Thompson } 98148acf710SJeremy L Thompson } 98248acf710SJeremy L Thompson // Restrict output block 983f8a0df59SJeremy L Thompson if (skip_rstr[i]) continue; 98448acf710SJeremy L Thompson // Get output vector 98548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 98648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 987*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 988*681d0ea7SJeremy L Thompson if (is_active) vec = out_vec; 98948acf710SJeremy L Thompson // Restrict 99048acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 99148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 99248acf710SJeremy L Thompson } else { 99348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 99448acf710SJeremy L Thompson } 995*681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 996*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 99748acf710SJeremy L Thompson } 99848acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 99948acf710SJeremy L Thompson } 100048acf710SJeremy L Thompson 100148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 100248acf710SJeremy L Thompson // Operator Apply 100348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 100448acf710SJeremy L Thompson static int CeedOperatorApplyAddAtPoints_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 100548acf710SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem; 100648acf710SJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 100748acf710SJeremy L Thompson CeedVector point_coords = NULL; 100848acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 100948acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 101048acf710SJeremy L Thompson CeedQFunction qf; 101148acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 101248acf710SJeremy L Thompson CeedOperator_Ref *impl; 101348acf710SJeremy L Thompson 101448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 101548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 101648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 101748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 101848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 101948acf710SJeremy L Thompson 102048acf710SJeremy L Thompson // Setup 102148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 102248acf710SJeremy L Thompson 102348acf710SJeremy L Thompson // Point coordinates 102448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 102548acf710SJeremy L Thompson 102648acf710SJeremy L Thompson // Input Evecs and Restriction 10276cde1da6SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 102848acf710SJeremy L Thompson 102948acf710SJeremy L Thompson // Loop through elements 103048acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 103148acf710SJeremy L Thompson CeedInt num_points; 103248acf710SJeremy L Thompson 103348acf710SJeremy L Thompson // Setup points for element 103448acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 103548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 103648acf710SJeremy L Thompson 103748acf710SJeremy L Thompson // Input basis apply 103848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 103948acf710SJeremy L Thompson impl->point_coords_elem, false, e_data, impl, request)); 104048acf710SJeremy L Thompson 104148acf710SJeremy L Thompson // Q function 104248acf710SJeremy L Thompson if (!impl->is_identity_qf) { 104348acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 104448acf710SJeremy L Thompson } 104548acf710SJeremy L Thompson 104648acf710SJeremy L Thompson // Output basis apply and restriction 104748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1048f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 1049f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 105048acf710SJeremy L Thompson 105148acf710SJeremy L Thompson num_points_offset += num_points; 105248acf710SJeremy L Thompson } 105348acf710SJeremy L Thompson 105448acf710SJeremy L Thompson // Restore input arrays 10556cde1da6SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 105648acf710SJeremy L Thompson 105748acf710SJeremy L Thompson // Cleanup point coordinates 105848acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 105948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 106048acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 106148acf710SJeremy L Thompson } 106248acf710SJeremy L Thompson 106348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1064e13f2367SZach Atkins // Core code for assembling linear QFunction 1065e13f2367SZach Atkins //------------------------------------------------------------------------------ 1066e13f2367SZach Atkins static inline int CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, 1067e13f2367SZach Atkins CeedElemRestriction *rstr, CeedRequest *request) { 1068e13f2367SZach Atkins Ceed ceed; 1069ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, max_num_points, num_elem, num_input_fields, num_output_fields, num_points_offset = 0; 1070e13f2367SZach Atkins CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 1071c7b67790SJeremy L Thompson CeedVector point_coords = NULL; 1072e13f2367SZach Atkins CeedQFunctionField *qf_input_fields, *qf_output_fields; 1073e13f2367SZach Atkins CeedQFunction qf; 1074e13f2367SZach Atkins CeedOperatorField *op_input_fields, *op_output_fields; 1075e13f2367SZach Atkins CeedOperator_Ref *impl; 1076e13f2367SZach Atkins CeedElemRestriction rstr_points = NULL; 1077e13f2367SZach Atkins 1078e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1079e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetData(op, &impl)); 1080ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 1081ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 1082e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1083e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1084e13f2367SZach Atkins CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1085e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1086e13f2367SZach Atkins 1087e13f2367SZach Atkins // Setup 1088e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1089e13f2367SZach Atkins 1090e13f2367SZach Atkins // Check for restriction only operator 1091e13f2367SZach Atkins CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 1092e13f2367SZach Atkins 1093e13f2367SZach Atkins // Point coordinates 1094e13f2367SZach Atkins CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1095e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 1096e13f2367SZach Atkins 1097e13f2367SZach Atkins // Input Evecs and Restriction 1098e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 1099e13f2367SZach Atkins 1100e13f2367SZach Atkins // Count number of active input fields 1101ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 1102e13f2367SZach Atkins for (CeedInt i = 0; i < num_input_fields; i++) { 1103e13f2367SZach Atkins CeedInt field_size; 1104e13f2367SZach Atkins CeedVector vec; 1105e13f2367SZach Atkins 1106e13f2367SZach Atkins // Get input vector 1107e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1108e13f2367SZach Atkins // Check if active input 1109e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1110e13f2367SZach Atkins // Check that all active inputs are nodal fields 1111e13f2367SZach Atkins { 1112e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1113e13f2367SZach Atkins bool is_at_points = false; 1114e13f2367SZach Atkins 1115e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1116637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1117*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1118e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1119e13f2367SZach Atkins } 1120e13f2367SZach Atkins // Get size of active input 1121e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1122ff8551c5SJeremy L Thompson qf_size_in += field_size; 1123e13f2367SZach Atkins } 1124*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1125e13f2367SZach Atkins } 1126ff8551c5SJeremy L Thompson CeedCheck(qf_size_in, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1127ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 1128e13f2367SZach Atkins } 1129e13f2367SZach Atkins 1130e13f2367SZach Atkins // Count number of active output fields 1131ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 1132e13f2367SZach Atkins for (CeedInt i = 0; i < num_output_fields; i++) { 1133e13f2367SZach Atkins CeedInt field_size; 1134c7b67790SJeremy L Thompson CeedVector vec; 1135e13f2367SZach Atkins 1136e13f2367SZach Atkins // Get output vector 1137e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 1138e13f2367SZach Atkins // Check if active output 1139e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1140e13f2367SZach Atkins // Check that all active inputs are nodal fields 1141e13f2367SZach Atkins { 1142e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1143e13f2367SZach Atkins bool is_at_points = false; 1144e13f2367SZach Atkins 1145e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 1146637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1147*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1148e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1149e13f2367SZach Atkins } 1150e13f2367SZach Atkins // Get size of active output 1151e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 1152c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1153ff8551c5SJeremy L Thompson qf_size_out += field_size; 1154e13f2367SZach Atkins } 1155*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1156e13f2367SZach Atkins } 1157ff8551c5SJeremy L Thompson CeedCheck(qf_size_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1158ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 1159e13f2367SZach Atkins } 1160e13f2367SZach Atkins 1161e13f2367SZach Atkins // Build objects if needed 1162e13f2367SZach Atkins if (build_objects) { 1163e13f2367SZach Atkins CeedInt num_points_total; 1164e13f2367SZach Atkins const CeedInt *offsets; 1165e13f2367SZach Atkins 1166e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPoints(rstr_points, &num_points_total)); 1167e13f2367SZach Atkins 1168e13f2367SZach Atkins // Create output restriction (at points) 1169e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetOffsets(rstr_points, CEED_MEM_HOST, &offsets)); 1170ff8551c5SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateAtPoints(ceed, num_elem, num_points_total, qf_size_in * qf_size_out, 1171ff8551c5SJeremy L Thompson qf_size_in * qf_size_out * num_points_total, CEED_MEM_HOST, CEED_COPY_VALUES, offsets, rstr)); 1172e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionRestoreOffsets(rstr_points, &offsets)); 1173e13f2367SZach Atkins 1174e13f2367SZach Atkins // Create assembled vector 1175e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionCreateVector(*rstr, assembled, NULL)); 1176e13f2367SZach Atkins } 1177e13f2367SZach Atkins // Clear output vector 1178e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 1179e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 1180e13f2367SZach Atkins 1181e13f2367SZach Atkins // Loop through elements 1182e13f2367SZach Atkins for (CeedInt e = 0; e < num_elem; e++) { 1183e13f2367SZach Atkins CeedInt num_points; 1184e13f2367SZach Atkins 1185e13f2367SZach Atkins // Setup points for element 1186e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1187e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1188e13f2367SZach Atkins 1189e13f2367SZach Atkins // Input basis apply 1190e13f2367SZach Atkins CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, NULL, 1191e13f2367SZach Atkins impl->point_coords_elem, true, e_data_full, impl, request)); 1192e13f2367SZach Atkins 1193e13f2367SZach Atkins // Assemble QFunction 1194c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1195*681d0ea7SJeremy L Thompson bool is_active; 1196c7b67790SJeremy L Thompson CeedInt field_size; 1197c7b67790SJeremy L Thompson CeedVector vec; 1198c7b67790SJeremy L Thompson 1199c7b67790SJeremy L Thompson // Get input vector 1200c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1201*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1202*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1203c7b67790SJeremy L Thompson // Check if active input 1204*681d0ea7SJeremy L Thompson if (!is_active) continue; 1205c7b67790SJeremy L Thompson // Get size of active input 1206c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1207c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 1208c7b67790SJeremy L Thompson // Set current portion of input to 1.0 1209c7b67790SJeremy L Thompson { 1210c7b67790SJeremy L Thompson CeedScalar *array; 1211c7b67790SJeremy L Thompson 1212c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1213c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 1.0; 1214c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1215e13f2367SZach Atkins } 1216c7b67790SJeremy L Thompson 1217e13f2367SZach Atkins if (!impl->is_identity_qf) { 1218e13f2367SZach Atkins // Set Outputs 1219e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1220e13f2367SZach Atkins CeedVector vec; 1221e13f2367SZach Atkins CeedInt field_size; 1222e13f2367SZach Atkins 1223e13f2367SZach Atkins // Get output vector 1224e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1225e13f2367SZach Atkins // Check if active output 1226e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1227e13f2367SZach Atkins CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 1228e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 1229e13f2367SZach Atkins assembled_array += field_size * num_points; // Advance the pointer by the size of the output 1230e13f2367SZach Atkins } 1231*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1232e13f2367SZach Atkins } 1233e13f2367SZach Atkins // Apply QFunction 1234e13f2367SZach Atkins CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1235e13f2367SZach Atkins } else { 1236c7b67790SJeremy L Thompson const CeedScalar *array; 1237e13f2367SZach Atkins CeedInt field_size; 1238e13f2367SZach Atkins 1239e13f2367SZach Atkins // Copy Identity Outputs 1240e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 1241c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 1242c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * num_points; j++) assembled_array[j] = array[j]; 1243c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 1244e13f2367SZach Atkins assembled_array += field_size * num_points; 1245e13f2367SZach Atkins } 1246c7b67790SJeremy L Thompson // Reset input to 0.0 1247c7b67790SJeremy L Thompson { 1248c7b67790SJeremy L Thompson CeedScalar *array; 1249c7b67790SJeremy L Thompson 1250c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1251c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 0.0; 1252c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1253c7b67790SJeremy L Thompson } 1254c7b67790SJeremy L Thompson } 1255e13f2367SZach Atkins } 1256e13f2367SZach Atkins num_points_offset += num_points; 1257e13f2367SZach Atkins } 1258e13f2367SZach Atkins 1259e13f2367SZach Atkins // Un-set output Qvecs to prevent accidental overwrite of Assembled 1260e13f2367SZach Atkins if (!impl->is_identity_qf) { 1261e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1262e13f2367SZach Atkins CeedVector vec; 1263e13f2367SZach Atkins 1264e13f2367SZach Atkins // Get output vector 1265e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1266e13f2367SZach Atkins // Check if active output 1267e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 1268e13f2367SZach Atkins CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 1269e13f2367SZach Atkins } 1270*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1271e13f2367SZach Atkins } 1272e13f2367SZach Atkins } 1273e13f2367SZach Atkins 1274e13f2367SZach Atkins // Restore input arrays 1275e13f2367SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 1276e13f2367SZach Atkins 1277e13f2367SZach Atkins // Restore output 1278e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 1279e13f2367SZach Atkins 1280e13f2367SZach Atkins // Cleanup 1281e13f2367SZach Atkins CeedCallBackend(CeedVectorDestroy(&point_coords)); 1282e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1283e13f2367SZach Atkins return CEED_ERROR_SUCCESS; 1284e13f2367SZach Atkins } 1285e13f2367SZach Atkins 1286e13f2367SZach Atkins //------------------------------------------------------------------------------ 1287e13f2367SZach Atkins // Assemble Linear QFunction 1288e13f2367SZach Atkins //------------------------------------------------------------------------------ 1289e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPoints_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1290e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, true, assembled, rstr, request); 1291e13f2367SZach Atkins } 1292e13f2367SZach Atkins 1293e13f2367SZach Atkins //------------------------------------------------------------------------------ 1294e13f2367SZach Atkins // Update Assembled Linear QFunction 1295e13f2367SZach Atkins //------------------------------------------------------------------------------ 1296e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, 1297e13f2367SZach Atkins CeedRequest *request) { 1298e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, false, &assembled, &rstr, request); 1299e13f2367SZach Atkins } 1300e13f2367SZach Atkins 1301e13f2367SZach Atkins //------------------------------------------------------------------------------ 1302fb133d4bSJeremy L Thompson // Assemble Operator Diagonal AtPoints 1303e13f2367SZach Atkins //------------------------------------------------------------------------------ 1304fb133d4bSJeremy L Thompson static int CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1305382e9c83SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem, num_comp_active = 1; 1306fb133d4bSJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 1307fb133d4bSJeremy L Thompson Ceed ceed; 1308fb133d4bSJeremy L Thompson CeedVector point_coords = NULL, in_vec, out_vec; 1309fb133d4bSJeremy L Thompson CeedElemRestriction rstr_points = NULL; 1310fb133d4bSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 1311fb133d4bSJeremy L Thompson CeedQFunction qf; 1312fb133d4bSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 1313fb133d4bSJeremy L Thompson CeedOperator_Ref *impl; 1314fb133d4bSJeremy L Thompson 1315fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1316fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1317fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1318fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1319fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1320fb133d4bSJeremy L Thompson 1321fb133d4bSJeremy L Thompson // Setup 1322fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1323fb133d4bSJeremy L Thompson 1324fb133d4bSJeremy L Thompson // Ceed 1325fb133d4bSJeremy L Thompson { 1326fb133d4bSJeremy L Thompson Ceed ceed_parent; 1327fb133d4bSJeremy L Thompson 1328fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1329fb133d4bSJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 1330fb133d4bSJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 1331fb133d4bSJeremy L Thompson } 1332fb133d4bSJeremy L Thompson 1333fb133d4bSJeremy L Thompson // Point coordinates 1334fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1335fb133d4bSJeremy L Thompson 1336fb133d4bSJeremy L Thompson // Input and output vectors 1337fb133d4bSJeremy L Thompson { 1338fb133d4bSJeremy L Thompson CeedSize input_size, output_size; 1339fb133d4bSJeremy L Thompson 1340fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1341fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, input_size, &in_vec)); 1342fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, output_size, &out_vec)); 1343fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(out_vec, 0.0)); 1344fb133d4bSJeremy L Thompson } 1345fb133d4bSJeremy L Thompson 1346382e9c83SJeremy L Thompson // Clear input Qvecs 134786e10729SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1348*681d0ea7SJeremy L Thompson bool is_active; 134986e10729SJeremy L Thompson CeedVector vec; 135086e10729SJeremy L Thompson 135186e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1352*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1353*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1354*681d0ea7SJeremy L Thompson if (!is_active) continue; 135586e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 135686e10729SJeremy L Thompson } 1357382e9c83SJeremy L Thompson 1358fb133d4bSJeremy L Thompson // Input Evecs and Restriction 1359fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 1360fb133d4bSJeremy L Thompson 1361fb133d4bSJeremy L Thompson // Loop through elements 1362fb133d4bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 1363fb133d4bSJeremy L Thompson CeedInt num_points, e_vec_size = 0; 1364fb133d4bSJeremy L Thompson 1365fb133d4bSJeremy L Thompson // Setup points for element 1366fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1367fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1368fb133d4bSJeremy L Thompson 1369fb133d4bSJeremy L Thompson // Input basis apply for non-active bases 1370fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 1371fb133d4bSJeremy L Thompson impl->point_coords_elem, true, e_data, impl, request)); 1372fb133d4bSJeremy L Thompson 1373fb133d4bSJeremy L Thompson // Loop over points on element 1374fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1375*681d0ea7SJeremy L Thompson bool is_active_at_points = true, is_active; 1376382e9c83SJeremy L Thompson CeedInt elem_size_active = 1; 1377382e9c83SJeremy L Thompson CeedRestrictionType rstr_type; 1378fb133d4bSJeremy L Thompson CeedVector vec; 1379382e9c83SJeremy L Thompson CeedElemRestriction elem_rstr; 1380fb133d4bSJeremy L Thompson 1381382e9c83SJeremy L Thompson // -- Skip non-active input 1382*681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1383*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1384*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1385*681d0ea7SJeremy L Thompson if (!is_active) continue; 1386fb133d4bSJeremy L Thompson 1387382e9c83SJeremy L Thompson // -- Get active restriction type 1388382e9c83SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1389382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1390382e9c83SJeremy L Thompson is_active_at_points = rstr_type == CEED_RESTRICTION_POINTS; 1391382e9c83SJeremy L Thompson if (!is_active_at_points) CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size_active)); 1392382e9c83SJeremy L Thompson else elem_size_active = num_points; 1393382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp_active)); 1394*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1395382e9c83SJeremy L Thompson 1396382e9c83SJeremy L Thompson e_vec_size = elem_size_active * num_comp_active; 1397382e9c83SJeremy L Thompson for (CeedInt s = 0; s < e_vec_size; s++) { 1398382e9c83SJeremy L Thompson CeedEvalMode eval_mode; 1399382e9c83SJeremy L Thompson CeedBasis basis; 1400382e9c83SJeremy L Thompson 1401382e9c83SJeremy L Thompson // -- Update unit vector 1402fb133d4bSJeremy L Thompson { 1403fb133d4bSJeremy L Thompson CeedScalar *array; 1404fb133d4bSJeremy L Thompson 140513062808SJeremy L Thompson if (s == 0) CeedCallBackend(CeedVectorSetValue(impl->e_vecs_in[i], 0.0)); 1406fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_in[i], CEED_MEM_HOST, &array)); 1407fb133d4bSJeremy L Thompson array[s] = 1.0; 1408fb133d4bSJeremy L Thompson if (s > 0) array[s - 1] = 0.0; 1409fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_in[i], &array)); 1410fb133d4bSJeremy L Thompson } 1411382e9c83SJeremy L Thompson // -- Basis action 1412958e607dSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1413fb133d4bSJeremy L Thompson switch (eval_mode) { 1414fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1415fb133d4bSJeremy L Thompson break; 1416fb133d4bSJeremy L Thompson // Note - these basis eval modes require FEM fields 1417fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1418fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1419fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1420fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 1421fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 1422fc0f7cc6SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, impl->point_coords_elem, impl->e_vecs_in[i], 1423fb133d4bSJeremy L Thompson impl->q_vecs_in[i])); 1424*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 1425fb133d4bSJeremy L Thompson break; 1426fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: 1427fb133d4bSJeremy L Thompson break; // No action 1428fb133d4bSJeremy L Thompson } 1429fb133d4bSJeremy L Thompson 1430fb133d4bSJeremy L Thompson // -- Q function 1431fb133d4bSJeremy L Thompson if (!impl->is_identity_qf) { 1432fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1433fb133d4bSJeremy L Thompson } 1434fb133d4bSJeremy L Thompson 1435fb133d4bSJeremy L Thompson // -- Output basis apply and restriction 1436fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1437f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 1438f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 1439fb133d4bSJeremy L Thompson 1440fb133d4bSJeremy L Thompson // -- Grab diagonal value 144186e10729SJeremy L Thompson for (CeedInt j = 0; j < num_output_fields; j++) { 1442*681d0ea7SJeremy L Thompson bool is_active; 1443382e9c83SJeremy L Thompson CeedInt elem_size = 0; 1444fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1445fb133d4bSJeremy L Thompson CeedEvalMode eval_mode; 1446fb133d4bSJeremy L Thompson CeedVector vec; 1447fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1448fb133d4bSJeremy L Thompson CeedBasis basis; 1449fb133d4bSJeremy L Thompson 14500c7f167fSZach Atkins // ---- Skip non-active output 1451*681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[j], &vec)); 1452*681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1453*681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1454*681d0ea7SJeremy L Thompson if (!is_active) continue; 1455fb133d4bSJeremy L Thompson 1456382e9c83SJeremy L Thompson // ---- Check if elem size matches 145786e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[j], &elem_rstr)); 1458382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1459382e9c83SJeremy L Thompson if (is_active_at_points && rstr_type != CEED_RESTRICTION_POINTS) continue; 1460382e9c83SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 1461382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(elem_rstr, e, &elem_size)); 1462382e9c83SJeremy L Thompson } else { 1463382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 1464382e9c83SJeremy L Thompson } 1465382e9c83SJeremy L Thompson { 1466382e9c83SJeremy L Thompson CeedInt num_comp = 0; 1467382e9c83SJeremy L Thompson 1468382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp)); 1469382e9c83SJeremy L Thompson if (e_vec_size != num_comp * elem_size) continue; 1470382e9c83SJeremy L Thompson } 1471382e9c83SJeremy L Thompson 1472fb133d4bSJeremy L Thompson // ---- Basis action 147386e10729SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[j], &eval_mode)); 1474fb133d4bSJeremy L Thompson switch (eval_mode) { 1475fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1476fb133d4bSJeremy L Thompson break; // No action 1477fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1478fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1479fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1480fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 148186e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[j], &basis)); 148286e10729SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, impl->point_coords_elem, impl->q_vecs_out[j], 148386e10729SJeremy L Thompson impl->e_vecs_out[j])); 1484*681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 1485fb133d4bSJeremy L Thompson break; 1486fb133d4bSJeremy L Thompson // LCOV_EXCL_START 1487fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: { 1488fb133d4bSJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 1489fb133d4bSJeremy L Thompson // LCOV_EXCL_STOP 1490fb133d4bSJeremy L Thompson } 1491fb133d4bSJeremy L Thompson } 1492fb133d4bSJeremy L Thompson // ---- Update output vector 1493fb133d4bSJeremy L Thompson { 1494fb133d4bSJeremy L Thompson CeedScalar *array, current_value = 0.0; 1495fb133d4bSJeremy L Thompson 149686e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1497fb133d4bSJeremy L Thompson current_value = array[s]; 149886e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 149986e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->e_vecs_out[j], 0.0)); 150086e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1501fb133d4bSJeremy L Thompson array[s] = current_value; 150286e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 1503fb133d4bSJeremy L Thompson } 1504fb133d4bSJeremy L Thompson // ---- Restrict output block 1505fb133d4bSJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 150686e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1507fb133d4bSJeremy L Thompson } else { 150886e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1509fb133d4bSJeremy L Thompson } 1510*681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1511fb133d4bSJeremy L Thompson } 1512382e9c83SJeremy L Thompson // -- Reset unit vector 151313062808SJeremy L Thompson if (s == e_vec_size - 1) CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1514382e9c83SJeremy L Thompson } 1515fb133d4bSJeremy L Thompson } 1516fb133d4bSJeremy L Thompson num_points_offset += num_points; 1517fb133d4bSJeremy L Thompson } 1518fb133d4bSJeremy L Thompson 1519fb133d4bSJeremy L Thompson // Restore input arrays 1520fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 1521fb133d4bSJeremy L Thompson 1522fb133d4bSJeremy L Thompson // Cleanup 1523fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&in_vec)); 1524fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&out_vec)); 1525fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 1526fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1527fb133d4bSJeremy L Thompson return CEED_ERROR_SUCCESS; 1528fb133d4bSJeremy L Thompson } 1529e13f2367SZach Atkins 1530e13f2367SZach Atkins //------------------------------------------------------------------------------ 1531f10650afSjeremylt // Operator Destroy 1532f10650afSjeremylt //------------------------------------------------------------------------------ 1533f10650afSjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) { 1534f10650afSjeremylt CeedOperator_Ref *impl; 1535f10650afSjeremylt 1536ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 15373aab95c0SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_in)); 1538f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_out)); 1539f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_data_out_indices)); 1540f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->apply_add_basis_out)); 15414fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs + impl->num_outputs; i++) { 15422b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_full[i])); 1543f10650afSjeremylt } 15442b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_full)); 15452b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->input_states)); 1546f10650afSjeremylt 15474fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs; i++) { 15482b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_in[i])); 15492b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_in[i])); 1550f10650afSjeremylt } 15512b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_in)); 15522b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_in)); 1553f10650afSjeremylt 15544fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_outputs; i++) { 15552b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_out[i])); 15562b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_out[i])); 1557f10650afSjeremylt } 15582b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_out)); 15592b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_out)); 156048acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->point_coords_elem)); 1561f10650afSjeremylt 15622b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl)); 1563e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 1564f10650afSjeremylt } 1565f10650afSjeremylt 1566f10650afSjeremylt //------------------------------------------------------------------------------ 1567713f43c3Sjeremylt // Operator Create 1568f10650afSjeremylt //------------------------------------------------------------------------------ 156921617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) { 1570fe2413ffSjeremylt Ceed ceed; 15714ce2993fSjeremylt CeedOperator_Ref *impl; 157221617c04Sjeremylt 1573ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 15742b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 15752b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 15762b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunction_Ref)); 15772b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionUpdate_Ref)); 15782b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAdd_Ref)); 15792b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1580e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 158121617c04Sjeremylt } 15822a86cc9dSSebastian Grimberg 15832a86cc9dSSebastian Grimberg //------------------------------------------------------------------------------ 158448acf710SJeremy L Thompson // Operator Create At Points 158548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 158648acf710SJeremy L Thompson int CeedOperatorCreateAtPoints_Ref(CeedOperator op) { 158748acf710SJeremy L Thompson Ceed ceed; 158848acf710SJeremy L Thompson CeedOperator_Ref *impl; 158948acf710SJeremy L Thompson 159048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 159148acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 159248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 1593e13f2367SZach Atkins CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunctionAtPoints_Ref)); 1594e13f2367SZach Atkins CeedCallBackend( 1595e13f2367SZach Atkins CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref)); 1596fb133d4bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleAddDiagonal", CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref)); 159748acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAddAtPoints_Ref)); 159848acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 159948acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 160048acf710SJeremy L Thompson } 160148acf710SJeremy L Thompson 160248acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1603