15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 321617c04Sjeremylt // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 521617c04Sjeremylt // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 721617c04Sjeremylt 849aac155SJeremy L Thompson #include <ceed.h> 9ec3da8bcSJed Brown #include <ceed/backend.h> 103d576824SJeremy L Thompson #include <stdbool.h> 113d576824SJeremy L Thompson #include <stddef.h> 123d576824SJeremy L Thompson #include <stdint.h> 132b730f8bSJeremy L Thompson 1421617c04Sjeremylt #include "ceed-ref.h" 1521617c04Sjeremylt 16f10650afSjeremylt //------------------------------------------------------------------------------ 17f10650afSjeremylt // Setup Input/Output Fields 18f10650afSjeremylt //------------------------------------------------------------------------------ 19f8a0df59SJeremy L Thompson static int CeedOperatorSetupFields_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, CeedInt *e_data_out_indices, 20f8a0df59SJeremy L Thompson bool *apply_add_basis, CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, 21f8a0df59SJeremy L Thompson CeedInt num_fields, CeedInt Q) { 22aedaa0e5Sjeremylt Ceed ceed; 236efa0d72SZach Atkins CeedSize e_size, q_size; 24ad70ee2cSJeremy L Thompson CeedInt num_comp, size, P; 25d1d35e2fSjeremylt CeedQFunctionField *qf_fields; 26ad70ee2cSJeremy L Thompson CeedOperatorField *op_fields; 27ad70ee2cSJeremy L Thompson 28e910d748SJeremy L Thompson { 29e910d748SJeremy L Thompson Ceed ceed_parent; 30e910d748SJeremy L Thompson 31ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 32e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 33*9bc66399SJeremy L Thompson CeedCallBackend(CeedReferenceCopy(ceed_parent, &ceed)); 34*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed_parent)); 35e910d748SJeremy L Thompson } 364fc1f125SJeremy L Thompson if (is_input) { 372b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 382b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 394fc1f125SJeremy L Thompson } else { 402b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 412b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 42fe2413ffSjeremylt } 4321617c04Sjeremylt 44885ac19cSjeremylt // Loop over fields 45d1d35e2fSjeremylt for (CeedInt i = 0; i < num_fields; i++) { 46d1d35e2fSjeremylt CeedEvalMode eval_mode; 47edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 48ad70ee2cSJeremy L Thompson CeedBasis basis; 49d1d35e2fSjeremylt 50ad70ee2cSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 51d1d35e2fSjeremylt if (eval_mode != CEED_EVAL_WEIGHT) { 52edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 53edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 54681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 55135a076eSjeremylt } 56135a076eSjeremylt 57d1d35e2fSjeremylt switch (eval_mode) { 58885ac19cSjeremylt case CEED_EVAL_NONE: 592b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 60d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 612b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 62aedaa0e5Sjeremylt break; 63aedaa0e5Sjeremylt case CEED_EVAL_INTERP: 64885ac19cSjeremylt case CEED_EVAL_GRAD: 65a915a514Srezgarshakeri case CEED_EVAL_DIV: 66c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 672b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 682b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 692b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 702b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 71d2643443SJeremy L Thompson e_size = (CeedSize)P * num_comp; 722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 73d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 742b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 75681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 76885ac19cSjeremylt break; 77885ac19cSjeremylt case CEED_EVAL_WEIGHT: // Only on input fields 782b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 79d2643443SJeremy L Thompson q_size = (CeedSize)Q; 802b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 812b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_vecs[i])); 82681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 83885ac19cSjeremylt break; 8421617c04Sjeremylt } 85885ac19cSjeremylt } 86f8a0df59SJeremy L Thompson // Drop duplicate restrictions 873aab95c0SJeremy L Thompson if (is_input) { 883aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 893aab95c0SJeremy L Thompson CeedVector vec_i; 903aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 913aab95c0SJeremy L Thompson 923aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 933aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 943aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 953aab95c0SJeremy L Thompson CeedVector vec_j; 963aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 973aab95c0SJeremy L Thompson 983aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 993aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 1003aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 1013aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 102f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 1033aab95c0SJeremy L Thompson skip_rstr[j] = true; 1043aab95c0SJeremy L Thompson } 105681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 106681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 1073aab95c0SJeremy L Thompson } 108681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 109681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 1103aab95c0SJeremy L Thompson } 111f8a0df59SJeremy L Thompson } else { 112f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 113f8a0df59SJeremy L Thompson CeedVector vec_i; 114f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 115f8a0df59SJeremy L Thompson 116f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 117f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 118f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 119f8a0df59SJeremy L Thompson CeedVector vec_j; 120f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 121f8a0df59SJeremy L Thompson 122f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 123f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 124f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 125f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 126f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 127f8a0df59SJeremy L Thompson skip_rstr[j] = true; 128f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 129f8a0df59SJeremy L Thompson e_data_out_indices[j] = i; 130f8a0df59SJeremy L Thompson } 131681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 132681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 133f8a0df59SJeremy L Thompson } 134681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 135681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 136f8a0df59SJeremy L Thompson } 1373aab95c0SJeremy L Thompson } 138*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 139e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 14021617c04Sjeremylt } 14121617c04Sjeremylt 142f10650afSjeremylt //------------------------------------------------------------------------------ 143f10650afSjeremylt // Setup Operator 144f10650afSjeremylt //------------------------------------------------------------------------------/* 145885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) { 1468c1105f8SJeremy L Thompson bool is_setup_done; 147ad70ee2cSJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 148ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 149ad70ee2cSJeremy L Thompson CeedQFunction qf; 150ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 151ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 152ad70ee2cSJeremy L Thompson 1532b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 1548c1105f8SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 155ad70ee2cSJeremy L Thompson 1562b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1572b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1582b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 1592b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 1602b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1612b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 162885ac19cSjeremylt 163885ac19cSjeremylt // Allocate 1642b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 165885ac19cSjeremylt 1663aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 167f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 168f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_data_out_indices)); 169f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 1702b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 1712b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 1722b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 1732b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 1742b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 175885ac19cSjeremylt 1764fc1f125SJeremy L Thompson impl->num_inputs = num_input_fields; 1774fc1f125SJeremy L Thompson impl->num_outputs = num_output_fields; 178885ac19cSjeremylt 179d1d35e2fSjeremylt // Set up infield and outfield e_vecs and q_vecs 180885ac19cSjeremylt // Infields 181f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, true, impl->skip_rstr_in, NULL, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 182f8a0df59SJeremy L Thompson num_input_fields, Q)); 1833aab95c0SJeremy L Thompson // Outfields 184f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, false, impl->skip_rstr_out, impl->e_data_out_indices, impl->apply_add_basis_out, 185f8a0df59SJeremy L Thompson impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 186885ac19cSjeremylt 18716911fdaSjeremylt // Identity QFunctions 1880b454692Sjeremylt if (impl->is_identity_qf) { 189d1d35e2fSjeremylt CeedEvalMode in_mode, out_mode; 190d1d35e2fSjeremylt CeedQFunctionField *in_fields, *out_fields; 191ad70ee2cSJeremy L Thompson 1922b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 1932b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 1942b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 195d1d35e2fSjeremylt 1960b454692Sjeremylt if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 197edb2538eSJeremy L Thompson impl->is_identity_rstr_op = true; 1980b454692Sjeremylt } else { 199db002c03SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 20016911fdaSjeremylt } 20116911fdaSjeremylt } 20216911fdaSjeremylt 2032b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 204e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 205885ac19cSjeremylt } 206885ac19cSjeremylt 207f10650afSjeremylt //------------------------------------------------------------------------------ 208f10650afSjeremylt // Setup Operator Inputs 209f10650afSjeremylt //------------------------------------------------------------------------------ 2102b730f8bSJeremy L Thompson static inline int CeedOperatorSetupInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2112b730f8bSJeremy L Thompson CeedVector in_vec, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 212a0162de9SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 213ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 214681d0ea7SJeremy L Thompson bool is_active; 215ad70ee2cSJeremy L Thompson uint64_t state; 216d1d35e2fSjeremylt CeedEvalMode eval_mode; 217d1bcdac9Sjeremylt CeedVector vec; 218885ac19cSjeremylt 219d1bcdac9Sjeremylt // Get input vector 2202b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 221681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 222681d0ea7SJeremy L Thompson if (is_active) { 2232b730f8bSJeremy L Thompson if (skip_active) continue; 2242b730f8bSJeremy L Thompson else vec = in_vec; 2251d102b48SJeremy L Thompson } 2261d102b48SJeremy L Thompson 2272b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2281d102b48SJeremy L Thompson // Restrict and Evec 229d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 2301d102b48SJeremy L Thompson } else { 231668048e2SJed Brown // Restrict 2322b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 2338d713cf6Sjeremylt // Skip restriction if input is unchanged 2343aab95c0SJeremy L Thompson if ((state != impl->input_states[i] || vec == in_vec) && !impl->skip_rstr_in[i]) { 235681d0ea7SJeremy L Thompson CeedElemRestriction elem_rstr; 236681d0ea7SJeremy L Thompson 237edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 238edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 239681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 2408d713cf6Sjeremylt } 2413aab95c0SJeremy L Thompson impl->input_states[i] = state; 242668048e2SJed Brown // Get evec 2432b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data_full[i])); 244885ac19cSjeremylt } 245681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 246885ac19cSjeremylt } 247e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 248885ac19cSjeremylt } 249885ac19cSjeremylt 250f10650afSjeremylt //------------------------------------------------------------------------------ 251f10650afSjeremylt // Input Basis Action 252f10650afSjeremylt //------------------------------------------------------------------------------ 2532b730f8bSJeremy L Thompson static inline int CeedOperatorInputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2542b730f8bSJeremy L Thompson CeedInt num_input_fields, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 2552b730f8bSJeremy L Thompson CeedOperator_Ref *impl) { 256ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 257a915a514Srezgarshakeri CeedInt elem_size, size, num_comp; 258d1d35e2fSjeremylt CeedEvalMode eval_mode; 259edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2601d102b48SJeremy L Thompson CeedBasis basis; 2611d102b48SJeremy L Thompson 2621d102b48SJeremy L Thompson // Skip active input 263d1d35e2fSjeremylt if (skip_active) { 264681d0ea7SJeremy L Thompson bool is_active; 2651d102b48SJeremy L Thompson CeedVector vec; 266ad70ee2cSJeremy L Thompson 2672b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 268681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 269681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 270681d0ea7SJeremy L Thompson if (is_active) continue; 2711d102b48SJeremy L Thompson } 272d1d35e2fSjeremylt // Get elem_size, eval_mode, size 273edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 274edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 275681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 2762b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2772b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 278885ac19cSjeremylt // Basis action 279d1d35e2fSjeremylt switch (eval_mode) { 280885ac19cSjeremylt case CEED_EVAL_NONE: 28181670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * Q * size])); 282885ac19cSjeremylt break; 283885ac19cSjeremylt case CEED_EVAL_INTERP: 284885ac19cSjeremylt case CEED_EVAL_GRAD: 285a915a514Srezgarshakeri case CEED_EVAL_DIV: 286c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 287a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 288a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 28981670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * elem_size * num_comp])); 290c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, eval_mode, impl->e_vecs_in[i], impl->q_vecs_in[i])); 291681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 292a915a514Srezgarshakeri break; 293885ac19cSjeremylt case CEED_EVAL_WEIGHT: 294885ac19cSjeremylt break; // No action 295885ac19cSjeremylt } 296885ac19cSjeremylt } 297e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 298885ac19cSjeremylt } 299885ac19cSjeremylt 300f10650afSjeremylt //------------------------------------------------------------------------------ 301f10650afSjeremylt // Output Basis Action 302f10650afSjeremylt //------------------------------------------------------------------------------ 3032b730f8bSJeremy L Thompson static inline int CeedOperatorOutputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_output_fields, CeedOperatorField *op_output_fields, 304f8a0df59SJeremy L Thompson CeedInt num_input_fields, CeedInt num_output_fields, bool *apply_add_basis, CeedOperator op, 3054fc1f125SJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 306ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 307a915a514Srezgarshakeri CeedInt elem_size, num_comp; 308d1d35e2fSjeremylt CeedEvalMode eval_mode; 309edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 3101d102b48SJeremy L Thompson CeedBasis basis; 3111d102b48SJeremy L Thompson 312a915a514Srezgarshakeri // Get elem_size, eval_mode 313edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 314edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 315681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 3162b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 317885ac19cSjeremylt // Basis action 318d1d35e2fSjeremylt switch (eval_mode) { 319885ac19cSjeremylt case CEED_EVAL_NONE: 320885ac19cSjeremylt break; // No action 321885ac19cSjeremylt case CEED_EVAL_INTERP: 322885ac19cSjeremylt case CEED_EVAL_GRAD: 323a915a514Srezgarshakeri case CEED_EVAL_DIV: 324c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 325a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 326a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 32781670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, 32881670346SSebastian Grimberg &e_data_full[i + num_input_fields][(CeedSize)e * elem_size * num_comp])); 329f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 330f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAdd(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 331f8a0df59SJeremy L Thompson } else { 332c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 333f8a0df59SJeremy L Thompson } 334681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 335a915a514Srezgarshakeri break; 336c042f62fSJeremy L Thompson // LCOV_EXCL_START 337bbfacfcdSjeremylt case CEED_EVAL_WEIGHT: { 3386e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 3391d102b48SJeremy L Thompson // LCOV_EXCL_STOP 340885ac19cSjeremylt } 341885ac19cSjeremylt } 342885ac19cSjeremylt } 343e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3441d102b48SJeremy L Thompson } 3451d102b48SJeremy L Thompson 346f10650afSjeremylt //------------------------------------------------------------------------------ 347f10650afSjeremylt // Restore Input Vectors 348f10650afSjeremylt //------------------------------------------------------------------------------ 3492b730f8bSJeremy L Thompson static inline int CeedOperatorRestoreInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 3502b730f8bSJeremy L Thompson const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 351ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 352d1d35e2fSjeremylt CeedEvalMode eval_mode; 3531d102b48SJeremy L Thompson 3541d102b48SJeremy L Thompson // Skip active inputs 355d1d35e2fSjeremylt if (skip_active) { 356681d0ea7SJeremy L Thompson bool is_active; 3571d102b48SJeremy L Thompson CeedVector vec; 358ad70ee2cSJeremy L Thompson 3592b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 360681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 361681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 362681d0ea7SJeremy L Thompson if (is_active) continue; 3631d102b48SJeremy L Thompson } 3641d102b48SJeremy L Thompson // Restore input 3652b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 366d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 3671d102b48SJeremy L Thompson } else { 3682b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data_full[i])); 3691d102b48SJeremy L Thompson } 3701d102b48SJeremy L Thompson } 371e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 3721d102b48SJeremy L Thompson } 3731d102b48SJeremy L Thompson 374f10650afSjeremylt //------------------------------------------------------------------------------ 375f10650afSjeremylt // Operator Apply 376f10650afSjeremylt //------------------------------------------------------------------------------ 3772b730f8bSJeremy L Thompson static int CeedOperatorApplyAdd_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 378d1d35e2fSjeremylt CeedInt Q, num_elem, num_input_fields, num_output_fields, size; 379ad70ee2cSJeremy L Thompson CeedEvalMode eval_mode; 380ad70ee2cSJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 381ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 382ad70ee2cSJeremy L Thompson CeedQFunction qf; 383ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 384ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 385ad70ee2cSJeremy L Thompson 386ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 387ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 3882b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 3892b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 3902b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 3912b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 3921d102b48SJeremy L Thompson 3931d102b48SJeremy L Thompson // Setup 3942b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 3951d102b48SJeremy L Thompson 3960b454692Sjeremylt // Restriction only operator 397edb2538eSJeremy L Thompson if (impl->is_identity_rstr_op) { 398edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 399ad70ee2cSJeremy L Thompson 400edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[0], &elem_rstr)); 401edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_full[0], request)); 402681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 403edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[0], &elem_rstr)); 404edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[0], out_vec, request)); 405681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 4060b454692Sjeremylt return CEED_ERROR_SUCCESS; 4070b454692Sjeremylt } 4080b454692Sjeremylt 4091d102b48SJeremy L Thompson // Input Evecs and Restriction 4102b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, false, e_data_full, impl, request)); 4111d102b48SJeremy L Thompson 4121d102b48SJeremy L Thompson // Output Evecs 413f8a0df59SJeremy L Thompson for (CeedInt i = num_output_fields - 1; i >= 0; i--) { 414f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) { 415f8a0df59SJeremy L Thompson e_data_full[i + num_input_fields] = e_data_full[impl->e_data_out_indices[i] + num_input_fields]; 416f8a0df59SJeremy L Thompson } else { 4172b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_full[i + impl->num_inputs], CEED_MEM_HOST, &e_data_full[i + num_input_fields])); 4181d102b48SJeremy L Thompson } 419f8a0df59SJeremy L Thompson } 4201d102b48SJeremy L Thompson 4211d102b48SJeremy L Thompson // Loop through elements 422d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 4231d102b48SJeremy L Thompson // Output pointers 424d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 4252b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 426d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_NONE) { 4272b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 42881670346SSebastian Grimberg CeedCallBackend( 42981670346SSebastian Grimberg CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][(CeedSize)e * Q * size])); 4301d102b48SJeremy L Thompson } 4311d102b48SJeremy L Thompson } 4321d102b48SJeremy L Thompson 43316911fdaSjeremylt // Input basis apply 4342b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, false, e_data_full, impl)); 43516911fdaSjeremylt 4361d102b48SJeremy L Thompson // Q function 4370b454692Sjeremylt if (!impl->is_identity_qf) { 4382b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 43916911fdaSjeremylt } 4401d102b48SJeremy L Thompson 4411d102b48SJeremy L Thompson // Output basis apply 442f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasis_Ref(e, Q, qf_output_fields, op_output_fields, num_input_fields, num_output_fields, 443f8a0df59SJeremy L Thompson impl->apply_add_basis_out, op, e_data_full, impl)); 4441d102b48SJeremy L Thompson } 445885ac19cSjeremylt 446885ac19cSjeremylt // Output restriction 447d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 448681d0ea7SJeremy L Thompson bool is_active; 449ad70ee2cSJeremy L Thompson CeedVector vec; 450edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 451ad70ee2cSJeremy L Thompson 452f8a0df59SJeremy L Thompson if (impl->skip_rstr_out[i]) continue; 453d1d35e2fSjeremylt // Restore Evec 4542b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_full[i + impl->num_inputs], &e_data_full[i + num_input_fields])); 455d1bcdac9Sjeremylt // Get output vector 4562b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 457668048e2SJed Brown // Active 458681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 459681d0ea7SJeremy L Thompson if (is_active) vec = out_vec; 4607ca8db16Sjeremylt // Restrict 461edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 462edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[i + impl->num_inputs], vec, request)); 463681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 464681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 465885ac19cSjeremylt } 466885ac19cSjeremylt 4677ca8db16Sjeremylt // Restore input arrays 4682b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, false, e_data_full, impl)); 469e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 47021617c04Sjeremylt } 47121617c04Sjeremylt 472f10650afSjeremylt //------------------------------------------------------------------------------ 47370a7ffb3SJeremy L Thompson // Core code for assembling linear QFunction 474f10650afSjeremylt //------------------------------------------------------------------------------ 4752b730f8bSJeremy L Thompson static inline int CeedOperatorLinearAssembleQFunctionCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, CeedElemRestriction *rstr, 47670a7ffb3SJeremy L Thompson CeedRequest *request) { 477*9bc66399SJeremy L Thompson Ceed ceed_parent; 478ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, Q, num_elem, num_input_fields, num_output_fields; 479ad70ee2cSJeremy L Thompson CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 480ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 481ad70ee2cSJeremy L Thompson CeedQFunction qf; 482ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 483ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 484ad70ee2cSJeremy L Thompson 485e910d748SJeremy L Thompson CeedCallBackend(CeedOperatorGetFallbackParentCeed(op, &ceed_parent)); 486e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 487ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 488ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 489e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 490e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 491e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 492e984cf9aSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 493e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 4941d102b48SJeremy L Thompson 4951d102b48SJeremy L Thompson // Setup 4962b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 4971d102b48SJeremy L Thompson 498506b1a0cSSebastian Grimberg // Check for restriction only operator 499*9bc66399SJeremy L Thompson CeedCheck(!impl->is_identity_rstr_op, CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 50016911fdaSjeremylt 5011d102b48SJeremy L Thompson // Input Evecs and Restriction 5022b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 5031d102b48SJeremy L Thompson 5041d102b48SJeremy L Thompson // Count number of active input fields 505ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 506d1d35e2fSjeremylt for (CeedInt i = 0; i < num_input_fields; i++) { 507c7b67790SJeremy L Thompson CeedInt field_size; 508ad70ee2cSJeremy L Thompson CeedVector vec; 509ad70ee2cSJeremy L Thompson 5101d102b48SJeremy L Thompson // Get input vector 5112b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 5121d102b48SJeremy L Thompson // Check if active input 5131d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 514c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 5152b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 516ff8551c5SJeremy L Thompson qf_size_in += field_size; 5171d102b48SJeremy L Thompson } 518681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 5191d102b48SJeremy L Thompson } 520*9bc66399SJeremy L Thompson CeedCheck(qf_size_in > 0, CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 521ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 522bb219a0fSJeremy L Thompson } 5231d102b48SJeremy L Thompson 5241d102b48SJeremy L Thompson // Count number of active output fields 525ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 526d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 527c7b67790SJeremy L Thompson CeedInt field_size; 528ad70ee2cSJeremy L Thompson CeedVector vec; 529ad70ee2cSJeremy L Thompson 5301d102b48SJeremy L Thompson // Get output vector 5312b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 5321d102b48SJeremy L Thompson // Check if active output 5331d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 534c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 535ff8551c5SJeremy L Thompson qf_size_out += field_size; 5361d102b48SJeremy L Thompson } 537681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 5381d102b48SJeremy L Thompson } 539*9bc66399SJeremy L Thompson CeedCheck(qf_size_out > 0, CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 540ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 541bb219a0fSJeremy L Thompson } 5421d102b48SJeremy L Thompson 54370a7ffb3SJeremy L Thompson // Build objects if needed 54470a7ffb3SJeremy L Thompson if (build_objects) { 545ff8551c5SJeremy L Thompson const CeedSize l_size = (CeedSize)num_elem * Q * qf_size_in * qf_size_out; 546ff8551c5SJeremy L Thompson CeedInt strides[3] = {1, Q, qf_size_in * qf_size_out * Q}; /* *NOPAD* */ 547ad70ee2cSJeremy L Thompson 548ad70ee2cSJeremy L Thompson // Create output restriction 5490a5597ceSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, Q, qf_size_in * qf_size_out, 5500a5597ceSJeremy L Thompson (CeedSize)qf_size_in * (CeedSize)qf_size_out * (CeedSize)num_elem * (CeedSize)Q, strides, rstr)); 5511d102b48SJeremy L Thompson // Create assembled vector 552e910d748SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_parent, l_size, assembled)); 55370a7ffb3SJeremy L Thompson } 55470a7ffb3SJeremy L Thompson // Clear output vector 5552b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 556ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 5571d102b48SJeremy L Thompson 5581d102b48SJeremy L Thompson // Loop through elements 559d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 5601d102b48SJeremy L Thompson // Input basis apply 5612b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, true, e_data_full, impl)); 5621d102b48SJeremy L Thompson 5631d102b48SJeremy L Thompson // Assemble QFunction 564c7b67790SJeremy L Thompson 565c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 566681d0ea7SJeremy L Thompson bool is_active; 567c7b67790SJeremy L Thompson CeedInt field_size; 568c7b67790SJeremy L Thompson CeedVector vec; 569c7b67790SJeremy L Thompson 5701d102b48SJeremy L Thompson // Set Inputs 571c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 572681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 573681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 574681d0ea7SJeremy L Thompson if (!is_active) continue; 575c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 576c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 577c7b67790SJeremy L Thompson // Set current portion of input to 1.0 578c7b67790SJeremy L Thompson { 579c7b67790SJeremy L Thompson CeedScalar *array; 580c7b67790SJeremy L Thompson 581c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 582c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 1.0; 583c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 58442ea3801Sjeremylt } 585c7b67790SJeremy L Thompson 586506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 5871d102b48SJeremy L Thompson // Set Outputs 588d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 589ad70ee2cSJeremy L Thompson CeedVector vec; 590ad70ee2cSJeremy L Thompson 5911d102b48SJeremy L Thompson // Get output vector 5922b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5931d102b48SJeremy L Thompson // Check if active output 5941d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 595c7b67790SJeremy L Thompson CeedInt field_size; 596c7b67790SJeremy L Thompson 597ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 598c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 599c7b67790SJeremy L Thompson assembled_array += field_size * Q; // Advance the pointer by the size of the output 6001d102b48SJeremy L Thompson } 601681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 6021d102b48SJeremy L Thompson } 6031d102b48SJeremy L Thompson // Apply QFunction 6042b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 605506b1a0cSSebastian Grimberg } else { 606c7b67790SJeremy L Thompson CeedInt field_size; 607c7b67790SJeremy L Thompson const CeedScalar *array; 608506b1a0cSSebastian Grimberg 609506b1a0cSSebastian Grimberg // Copy Identity Outputs 610c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 611c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 612c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * Q; j++) assembled_array[j] = array[j]; 613c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 614c7b67790SJeremy L Thompson assembled_array += field_size * Q; 615c7b67790SJeremy L Thompson } 616c7b67790SJeremy L Thompson // Reset input to 0.0 617c7b67790SJeremy L Thompson { 618c7b67790SJeremy L Thompson CeedScalar *array; 619c7b67790SJeremy L Thompson 620c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 621c7b67790SJeremy L Thompson for (CeedInt j = 0; j < Q; j++) array[field * Q + j] = 0.0; 622c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 623c7b67790SJeremy L Thompson } 624506b1a0cSSebastian Grimberg } 6251d102b48SJeremy L Thompson } 6261d102b48SJeremy L Thompson } 6271d102b48SJeremy L Thompson 6281d102b48SJeremy L Thompson // Un-set output Qvecs to prevent accidental overwrite of Assembled 629506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 630d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 631ad70ee2cSJeremy L Thompson CeedVector vec; 632ad70ee2cSJeremy L Thompson 6331d102b48SJeremy L Thompson // Get output vector 6342b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 6351d102b48SJeremy L Thompson // Check if active output 636056ea4bdSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 6372b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 6381d102b48SJeremy L Thompson } 639681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 6401d102b48SJeremy L Thompson } 641506b1a0cSSebastian Grimberg } 6421d102b48SJeremy L Thompson 6431d102b48SJeremy L Thompson // Restore input arrays 6442b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 6451d102b48SJeremy L Thompson 6461d102b48SJeremy L Thompson // Restore output 647ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 648*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed_parent)); 649e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 6501d102b48SJeremy L Thompson } 6511d102b48SJeremy L Thompson 652f10650afSjeremylt //------------------------------------------------------------------------------ 65370a7ffb3SJeremy L Thompson // Assemble Linear QFunction 65470a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6552b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunction_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 6562b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, true, assembled, rstr, request); 65770a7ffb3SJeremy L Thompson } 65870a7ffb3SJeremy L Thompson 65970a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 66070a7ffb3SJeremy L Thompson // Update Assembled Linear QFunction 66170a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 6622b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunctionUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, CeedRequest *request) { 6632b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, false, &assembled, &rstr, request); 66470a7ffb3SJeremy L Thompson } 66570a7ffb3SJeremy L Thompson 66670a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 66748acf710SJeremy L Thompson // Setup Input/Output Fields 66848acf710SJeremy L Thompson //------------------------------------------------------------------------------ 669f8a0df59SJeremy L Thompson static int CeedOperatorSetupFieldsAtPoints_Ref(CeedQFunction qf, CeedOperator op, bool is_input, bool *skip_rstr, bool *apply_add_basis, 670f8a0df59SJeremy L Thompson CeedVector *e_vecs_full, CeedVector *e_vecs, CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, 671f8a0df59SJeremy L Thompson CeedInt Q) { 67248acf710SJeremy L Thompson Ceed ceed; 67348acf710SJeremy L Thompson CeedSize e_size, q_size; 674ff1bc20eSJeremy L Thompson CeedInt max_num_points, num_comp, size, P; 67548acf710SJeremy L Thompson CeedQFunctionField *qf_fields; 67648acf710SJeremy L Thompson CeedOperatorField *op_fields; 67748acf710SJeremy L Thompson 678e910d748SJeremy L Thompson { 679e910d748SJeremy L Thompson Ceed ceed_parent; 680e910d748SJeremy L Thompson 68148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 682e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 683*9bc66399SJeremy L Thompson CeedCallBackend(CeedReferenceCopy(ceed_parent, &ceed)); 684*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed_parent)); 685e910d748SJeremy L Thompson } 68648acf710SJeremy L Thompson if (is_input) { 68748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 68848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 68948acf710SJeremy L Thompson } else { 69048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 69148acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 69248acf710SJeremy L Thompson } 69348acf710SJeremy L Thompson 69448acf710SJeremy L Thompson // Get max number of points 69548acf710SJeremy L Thompson { 69648acf710SJeremy L Thompson CeedInt dim; 69748acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 69848acf710SJeremy L Thompson CeedOperator_Ref *impl; 69948acf710SJeremy L Thompson 70048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, NULL)); 70148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 70248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(rstr_points, &dim)); 70348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 70448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 705b37f8825SJeremy L Thompson if (is_input) { 706b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, dim * max_num_points, &impl->point_coords_elem)); 707b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->point_coords_elem, 0.0)); 708b37f8825SJeremy L Thompson } 70948acf710SJeremy L Thompson } 71048acf710SJeremy L Thompson 71148acf710SJeremy L Thompson // Loop over fields 71248acf710SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 71348acf710SJeremy L Thompson CeedEvalMode eval_mode; 71448acf710SJeremy L Thompson CeedBasis basis; 71548acf710SJeremy L Thompson 71648acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 71748acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) { 71848acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 71948acf710SJeremy L Thompson 72048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 72148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 722681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 723ff1bc20eSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(e_vecs_full[i + start_e], 0.0)); 7246efa0d72SZach Atkins } 72548acf710SJeremy L Thompson 72648acf710SJeremy L Thompson switch (eval_mode) { 72738e83183SJeremy L Thompson case CEED_EVAL_NONE: { 72838e83183SJeremy L Thompson CeedVector vec; 72938e83183SJeremy L Thompson 73048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 73148acf710SJeremy L Thompson e_size = (CeedSize)max_num_points * size; 73248acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 73338e83183SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec)); 73438e83183SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE || !is_input) { 73538e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &q_vecs[i])); 73638e83183SJeremy L Thompson } else { 73748acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 73848acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 73938e83183SJeremy L Thompson } 740681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 74148acf710SJeremy L Thompson break; 74238e83183SJeremy L Thompson } 74348acf710SJeremy L Thompson case CEED_EVAL_INTERP: 74448acf710SJeremy L Thompson case CEED_EVAL_GRAD: 74548acf710SJeremy L Thompson case CEED_EVAL_DIV: 74648acf710SJeremy L Thompson case CEED_EVAL_CURL: 74748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 74848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 74948acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 75048acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 75148acf710SJeremy L Thompson e_size = (CeedSize)P * num_comp; 75248acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 75348acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 75448acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 755681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 75648acf710SJeremy L Thompson break; 75748acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: // Only on input fields 75848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 75948acf710SJeremy L Thompson q_size = (CeedSize)max_num_points; 76048acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 76148acf710SJeremy L Thompson CeedCallBackend( 762fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &max_num_points, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, CEED_VECTOR_NONE, q_vecs[i])); 763681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 76448acf710SJeremy L Thompson break; 76548acf710SJeremy L Thompson } 766ecc797dfSJeremy L Thompson // Initialize full arrays for E-vectors and Q-vectors 767297a0f46SJeremy L Thompson if (e_vecs[i]) CeedCallBackend(CeedVectorSetValue(e_vecs[i], 0.0)); 768297a0f46SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) CeedCallBackend(CeedVectorSetValue(q_vecs[i], 0.0)); 76948acf710SJeremy L Thompson } 770f8a0df59SJeremy L Thompson // Drop duplicate restrictions 7713aab95c0SJeremy L Thompson if (is_input) { 7723aab95c0SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 7733aab95c0SJeremy L Thompson CeedVector vec_i; 7743aab95c0SJeremy L Thompson CeedElemRestriction rstr_i; 7753aab95c0SJeremy L Thompson 7763aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 7773aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 7783aab95c0SJeremy L Thompson for (CeedInt j = i + 1; j < num_fields; j++) { 7793aab95c0SJeremy L Thompson CeedVector vec_j; 7803aab95c0SJeremy L Thompson CeedElemRestriction rstr_j; 7813aab95c0SJeremy L Thompson 7823aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 7833aab95c0SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 7843aab95c0SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 7853aab95c0SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 786f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 7873aab95c0SJeremy L Thompson skip_rstr[j] = true; 7883aab95c0SJeremy L Thompson } 789681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 790681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 7913aab95c0SJeremy L Thompson } 792681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 793681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 7943aab95c0SJeremy L Thompson } 795f8a0df59SJeremy L Thompson } else { 796f8a0df59SJeremy L Thompson for (CeedInt i = num_fields - 1; i >= 0; i--) { 797f8a0df59SJeremy L Thompson CeedVector vec_i; 798f8a0df59SJeremy L Thompson CeedElemRestriction rstr_i; 799f8a0df59SJeremy L Thompson 800f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec_i)); 801f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr_i)); 802f8a0df59SJeremy L Thompson for (CeedInt j = i - 1; j >= 0; j--) { 803f8a0df59SJeremy L Thompson CeedVector vec_j; 804f8a0df59SJeremy L Thompson CeedElemRestriction rstr_j; 805f8a0df59SJeremy L Thompson 806f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[j], &vec_j)); 807f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[j], &rstr_j)); 808f8a0df59SJeremy L Thompson if (vec_i == vec_j && rstr_i == rstr_j) { 809f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &e_vecs[j])); 810f8a0df59SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs_full[i + start_e], &e_vecs_full[j + start_e])); 811f8a0df59SJeremy L Thompson skip_rstr[j] = true; 812f8a0df59SJeremy L Thompson apply_add_basis[i] = true; 813f8a0df59SJeremy L Thompson } 814681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_j)); 815681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_j)); 816f8a0df59SJeremy L Thompson } 817681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec_i)); 818681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_i)); 819f8a0df59SJeremy L Thompson } 8203aab95c0SJeremy L Thompson } 821*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 82248acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 82348acf710SJeremy L Thompson } 82448acf710SJeremy L Thompson 82548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82648acf710SJeremy L Thompson // Setup Operator 82748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 82848acf710SJeremy L Thompson static int CeedOperatorSetupAtPoints_Ref(CeedOperator op) { 82948acf710SJeremy L Thompson bool is_setup_done; 83048acf710SJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 83148acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 83248acf710SJeremy L Thompson CeedQFunction qf; 83348acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 83448acf710SJeremy L Thompson CeedOperator_Ref *impl; 83548acf710SJeremy L Thompson 83648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 83748acf710SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 83848acf710SJeremy L Thompson 83948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 84048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 84148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 84248acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 84348acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 84448acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 84548acf710SJeremy L Thompson 84648acf710SJeremy L Thompson // Allocate 84748acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 84848acf710SJeremy L Thompson 8493aab95c0SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_in)); 850f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->skip_rstr_out)); 851f8a0df59SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->apply_add_basis_out)); 85248acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 85348acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 85448acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 85548acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 85648acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 85748acf710SJeremy L Thompson 85848acf710SJeremy L Thompson impl->num_inputs = num_input_fields; 85948acf710SJeremy L Thompson impl->num_outputs = num_output_fields; 86048acf710SJeremy L Thompson 86148acf710SJeremy L Thompson // Set up infield and outfield pointer arrays 86248acf710SJeremy L Thompson // Infields 863f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, true, impl->skip_rstr_in, NULL, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, 8643aab95c0SJeremy L Thompson num_input_fields, Q)); 86548acf710SJeremy L Thompson // Outfields 866f8a0df59SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, false, impl->skip_rstr_out, impl->apply_add_basis_out, impl->e_vecs_full, 867f8a0df59SJeremy L Thompson impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 86848acf710SJeremy L Thompson 86948acf710SJeremy L Thompson // Identity QFunctions 87048acf710SJeremy L Thompson if (impl->is_identity_qf) { 87148acf710SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 87238e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->e_vecs_out[0])); 87348acf710SJeremy L Thompson } 87448acf710SJeremy L Thompson 87548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 87648acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 87748acf710SJeremy L Thompson } 87848acf710SJeremy L Thompson 87948acf710SJeremy L Thompson //------------------------------------------------------------------------------ 88048acf710SJeremy L Thompson // Input Basis Action 88148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 88248acf710SJeremy L Thompson static inline int CeedOperatorInputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_input_fields, 88348acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedInt num_input_fields, CeedVector in_vec, 88448acf710SJeremy L Thompson CeedVector point_coords_elem, bool skip_active, CeedScalar *e_data[2 * CEED_FIELD_MAX], 88548acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 88648acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 887681d0ea7SJeremy L Thompson bool is_active; 88848acf710SJeremy L Thompson CeedInt elem_size, size, num_comp; 88948acf710SJeremy L Thompson CeedRestrictionType rstr_type; 89048acf710SJeremy L Thompson CeedEvalMode eval_mode; 89148acf710SJeremy L Thompson CeedVector vec; 89248acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 89348acf710SJeremy L Thompson CeedBasis basis; 89448acf710SJeremy L Thompson 89548acf710SJeremy L Thompson // Skip active input 896681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 897681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 898681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 899681d0ea7SJeremy L Thompson if (skip_active && is_active) continue; 90048acf710SJeremy L Thompson 90148acf710SJeremy L Thompson // Get elem_size, eval_mode, size 90248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 90348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 90448acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 90548acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 90648acf710SJeremy L Thompson // Restrict block active input 907681d0ea7SJeremy L Thompson if (is_active && !impl->skip_rstr_in[i]) { 90848acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 90948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 91048acf710SJeremy L Thompson } else { 91148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 91248acf710SJeremy L Thompson } 91348acf710SJeremy L Thompson } 91448acf710SJeremy L Thompson // Basis action 91548acf710SJeremy L Thompson switch (eval_mode) { 91648acf710SJeremy L Thompson case CEED_EVAL_NONE: 917681d0ea7SJeremy L Thompson if (!is_active) { 91848acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][num_points_offset * size])); 91948acf710SJeremy L Thompson } 92048acf710SJeremy L Thompson break; 92148acf710SJeremy L Thompson // Note - these basis eval modes require FEM fields 92248acf710SJeremy L Thompson case CEED_EVAL_INTERP: 92348acf710SJeremy L Thompson case CEED_EVAL_GRAD: 92448acf710SJeremy L Thompson case CEED_EVAL_DIV: 92548acf710SJeremy L Thompson case CEED_EVAL_CURL: 92648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 927681d0ea7SJeremy L Thompson if (!is_active) { 92848acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 92948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 93081670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][(CeedSize)e * elem_size * num_comp])); 93148acf710SJeremy L Thompson } 93248acf710SJeremy L Thompson CeedCallBackend( 933fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, point_coords_elem, impl->e_vecs_in[i], impl->q_vecs_in[i])); 934681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 93548acf710SJeremy L Thompson break; 93648acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: 93748acf710SJeremy L Thompson break; // No action 93848acf710SJeremy L Thompson } 939681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 94048acf710SJeremy L Thompson } 94148acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 94248acf710SJeremy L Thompson } 94348acf710SJeremy L Thompson 94448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94548acf710SJeremy L Thompson // Output Basis Action 94648acf710SJeremy L Thompson //------------------------------------------------------------------------------ 94748acf710SJeremy L Thompson static inline int CeedOperatorOutputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_output_fields, 94848acf710SJeremy L Thompson CeedOperatorField *op_output_fields, CeedInt num_input_fields, CeedInt num_output_fields, 949f8a0df59SJeremy L Thompson bool *apply_add_basis, bool *skip_rstr, CeedOperator op, CeedVector out_vec, 950f8a0df59SJeremy L Thompson CeedVector point_coords_elem, CeedOperator_Ref *impl, CeedRequest *request) { 95148acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 952681d0ea7SJeremy L Thompson bool is_active; 95348acf710SJeremy L Thompson CeedRestrictionType rstr_type; 95448acf710SJeremy L Thompson CeedEvalMode eval_mode; 95548acf710SJeremy L Thompson CeedVector vec; 95648acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 95748acf710SJeremy L Thompson CeedBasis basis; 95848acf710SJeremy L Thompson 95948acf710SJeremy L Thompson // Get elem_size, eval_mode, size 96048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 96148acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 96248acf710SJeremy L Thompson // Basis action 96348acf710SJeremy L Thompson switch (eval_mode) { 96448acf710SJeremy L Thompson case CEED_EVAL_NONE: 96548acf710SJeremy L Thompson break; // No action 96648acf710SJeremy L Thompson case CEED_EVAL_INTERP: 96748acf710SJeremy L Thompson case CEED_EVAL_GRAD: 96848acf710SJeremy L Thompson case CEED_EVAL_DIV: 96948acf710SJeremy L Thompson case CEED_EVAL_CURL: 97048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 971f8a0df59SJeremy L Thompson if (apply_add_basis[i]) { 972f8a0df59SJeremy L Thompson CeedCallBackend(CeedBasisApplyAddAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], 973f8a0df59SJeremy L Thompson impl->e_vecs_out[i])); 974f8a0df59SJeremy L Thompson } else { 97548acf710SJeremy L Thompson CeedCallBackend( 976fc0f7cc6SJeremy L Thompson CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], impl->e_vecs_out[i])); 977f8a0df59SJeremy L Thompson } 978681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 97948acf710SJeremy L Thompson break; 98048acf710SJeremy L Thompson // LCOV_EXCL_START 98148acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: { 9826e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 98348acf710SJeremy L Thompson // LCOV_EXCL_STOP 98448acf710SJeremy L Thompson } 98548acf710SJeremy L Thompson } 98648acf710SJeremy L Thompson // Restrict output block 987bbac207aSZach Atkins if (skip_rstr[i]) { 988bbac207aSZach Atkins CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 989bbac207aSZach Atkins continue; 990bbac207aSZach Atkins } 991bbac207aSZach Atkins 99248acf710SJeremy L Thompson // Get output vector 99348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 99448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 995681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 996681d0ea7SJeremy L Thompson if (is_active) vec = out_vec; 99748acf710SJeremy L Thompson // Restrict 99848acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 99948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 100048acf710SJeremy L Thompson } else { 100148acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 100248acf710SJeremy L Thompson } 1003681d0ea7SJeremy L Thompson if (!is_active) CeedCallBackend(CeedVectorDestroy(&vec)); 1004681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 100548acf710SJeremy L Thompson } 100648acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 100748acf710SJeremy L Thompson } 100848acf710SJeremy L Thompson 100948acf710SJeremy L Thompson //------------------------------------------------------------------------------ 101048acf710SJeremy L Thompson // Operator Apply 101148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 101248acf710SJeremy L Thompson static int CeedOperatorApplyAddAtPoints_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 101348acf710SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem; 101448acf710SJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 101548acf710SJeremy L Thompson CeedVector point_coords = NULL; 101648acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 101748acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 101848acf710SJeremy L Thompson CeedQFunction qf; 101948acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 102048acf710SJeremy L Thompson CeedOperator_Ref *impl; 102148acf710SJeremy L Thompson 102248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 102348acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 102448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 102548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 102648acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 102748acf710SJeremy L Thompson 102848acf710SJeremy L Thompson // Setup 102948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 103048acf710SJeremy L Thompson 103148acf710SJeremy L Thompson // Point coordinates 103248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 103348acf710SJeremy L Thompson 103448acf710SJeremy L Thompson // Input Evecs and Restriction 10356cde1da6SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 103648acf710SJeremy L Thompson 103748acf710SJeremy L Thompson // Loop through elements 103848acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 103948acf710SJeremy L Thompson CeedInt num_points; 104048acf710SJeremy L Thompson 104148acf710SJeremy L Thompson // Setup points for element 104248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 104348acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 104448acf710SJeremy L Thompson 104548acf710SJeremy L Thompson // Input basis apply 104648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 104748acf710SJeremy L Thompson impl->point_coords_elem, false, e_data, impl, request)); 104848acf710SJeremy L Thompson 104948acf710SJeremy L Thompson // Q function 105048acf710SJeremy L Thompson if (!impl->is_identity_qf) { 105148acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 105248acf710SJeremy L Thompson } 105348acf710SJeremy L Thompson 105448acf710SJeremy L Thompson // Output basis apply and restriction 105548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1056f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 1057f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 105848acf710SJeremy L Thompson 105948acf710SJeremy L Thompson num_points_offset += num_points; 106048acf710SJeremy L Thompson } 106148acf710SJeremy L Thompson 106248acf710SJeremy L Thompson // Restore input arrays 10636cde1da6SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 106448acf710SJeremy L Thompson 106548acf710SJeremy L Thompson // Cleanup point coordinates 106648acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 106748acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 106848acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 106948acf710SJeremy L Thompson } 107048acf710SJeremy L Thompson 107148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1072e13f2367SZach Atkins // Core code for assembling linear QFunction 1073e13f2367SZach Atkins //------------------------------------------------------------------------------ 1074e13f2367SZach Atkins static inline int CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, 1075e13f2367SZach Atkins CeedElemRestriction *rstr, CeedRequest *request) { 1076e13f2367SZach Atkins Ceed ceed; 1077ff8551c5SJeremy L Thompson CeedInt qf_size_in, qf_size_out, max_num_points, num_elem, num_input_fields, num_output_fields, num_points_offset = 0; 1078e13f2367SZach Atkins CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 1079c7b67790SJeremy L Thompson CeedVector point_coords = NULL; 1080e13f2367SZach Atkins CeedQFunctionField *qf_input_fields, *qf_output_fields; 1081e13f2367SZach Atkins CeedQFunction qf; 1082e13f2367SZach Atkins CeedOperatorField *op_input_fields, *op_output_fields; 1083e13f2367SZach Atkins CeedOperator_Ref *impl; 1084e13f2367SZach Atkins CeedElemRestriction rstr_points = NULL; 1085e13f2367SZach Atkins 1086e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1087e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetData(op, &impl)); 1088ff8551c5SJeremy L Thompson qf_size_in = impl->qf_size_in; 1089ff8551c5SJeremy L Thompson qf_size_out = impl->qf_size_out; 1090e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1091e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1092e13f2367SZach Atkins CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1093e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1094e13f2367SZach Atkins 1095e13f2367SZach Atkins // Setup 1096e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1097e13f2367SZach Atkins 1098e13f2367SZach Atkins // Check for restriction only operator 1099e13f2367SZach Atkins CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 1100e13f2367SZach Atkins 1101e13f2367SZach Atkins // Point coordinates 1102e13f2367SZach Atkins CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1103e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 1104e13f2367SZach Atkins 1105e13f2367SZach Atkins // Input Evecs and Restriction 1106e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 1107e13f2367SZach Atkins 1108e13f2367SZach Atkins // Count number of active input fields 1109ff8551c5SJeremy L Thompson if (qf_size_in == 0) { 1110e13f2367SZach Atkins for (CeedInt i = 0; i < num_input_fields; i++) { 1111e13f2367SZach Atkins CeedInt field_size; 1112e13f2367SZach Atkins CeedVector vec; 1113e13f2367SZach Atkins 1114e13f2367SZach Atkins // Get input vector 1115e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1116e13f2367SZach Atkins // Check if active input 1117e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1118e13f2367SZach Atkins // Check that all active inputs are nodal fields 1119e13f2367SZach Atkins { 1120e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1121e13f2367SZach Atkins bool is_at_points = false; 1122e13f2367SZach Atkins 1123e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1124637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1125681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1126e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1127e13f2367SZach Atkins } 1128e13f2367SZach Atkins // Get size of active input 1129e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1130ff8551c5SJeremy L Thompson qf_size_in += field_size; 1131e13f2367SZach Atkins } 1132681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1133e13f2367SZach Atkins } 1134ff8551c5SJeremy L Thompson CeedCheck(qf_size_in, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1135ff8551c5SJeremy L Thompson impl->qf_size_in = qf_size_in; 1136e13f2367SZach Atkins } 1137e13f2367SZach Atkins 1138e13f2367SZach Atkins // Count number of active output fields 1139ff8551c5SJeremy L Thompson if (qf_size_out == 0) { 1140e13f2367SZach Atkins for (CeedInt i = 0; i < num_output_fields; i++) { 1141e13f2367SZach Atkins CeedInt field_size; 1142c7b67790SJeremy L Thompson CeedVector vec; 1143e13f2367SZach Atkins 1144e13f2367SZach Atkins // Get output vector 1145e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 1146e13f2367SZach Atkins // Check if active output 1147e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1148e13f2367SZach Atkins // Check that all active inputs are nodal fields 1149e13f2367SZach Atkins { 1150e13f2367SZach Atkins CeedElemRestriction elem_rstr; 1151e13f2367SZach Atkins bool is_at_points = false; 1152e13f2367SZach Atkins 1153e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 1154637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 1155681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1156e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 1157e13f2367SZach Atkins } 1158e13f2367SZach Atkins // Get size of active output 1159e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 1160c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1161ff8551c5SJeremy L Thompson qf_size_out += field_size; 1162e13f2367SZach Atkins } 1163681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1164e13f2367SZach Atkins } 1165ff8551c5SJeremy L Thompson CeedCheck(qf_size_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 1166ff8551c5SJeremy L Thompson impl->qf_size_out = qf_size_out; 1167e13f2367SZach Atkins } 1168e13f2367SZach Atkins 1169e13f2367SZach Atkins // Build objects if needed 1170e13f2367SZach Atkins if (build_objects) { 1171e13f2367SZach Atkins CeedInt num_points_total; 1172e13f2367SZach Atkins const CeedInt *offsets; 1173e13f2367SZach Atkins 1174e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPoints(rstr_points, &num_points_total)); 1175e13f2367SZach Atkins 1176e13f2367SZach Atkins // Create output restriction (at points) 1177e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetOffsets(rstr_points, CEED_MEM_HOST, &offsets)); 1178ff8551c5SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateAtPoints(ceed, num_elem, num_points_total, qf_size_in * qf_size_out, 1179ff8551c5SJeremy L Thompson qf_size_in * qf_size_out * num_points_total, CEED_MEM_HOST, CEED_COPY_VALUES, offsets, rstr)); 1180e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionRestoreOffsets(rstr_points, &offsets)); 1181e13f2367SZach Atkins 1182e13f2367SZach Atkins // Create assembled vector 1183e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionCreateVector(*rstr, assembled, NULL)); 1184e13f2367SZach Atkins } 1185e13f2367SZach Atkins // Clear output vector 1186e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 1187e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 1188e13f2367SZach Atkins 1189e13f2367SZach Atkins // Loop through elements 1190e13f2367SZach Atkins for (CeedInt e = 0; e < num_elem; e++) { 1191e13f2367SZach Atkins CeedInt num_points; 1192e13f2367SZach Atkins 1193e13f2367SZach Atkins // Setup points for element 1194e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1195e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1196e13f2367SZach Atkins 1197e13f2367SZach Atkins // Input basis apply 1198e13f2367SZach Atkins CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, NULL, 1199e13f2367SZach Atkins impl->point_coords_elem, true, e_data_full, impl, request)); 1200e13f2367SZach Atkins 1201e13f2367SZach Atkins // Assemble QFunction 1202c7b67790SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1203681d0ea7SJeremy L Thompson bool is_active; 1204c7b67790SJeremy L Thompson CeedInt field_size; 1205c7b67790SJeremy L Thompson CeedVector vec; 1206c7b67790SJeremy L Thompson 1207c7b67790SJeremy L Thompson // Get input vector 1208c7b67790SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1209681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1210681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1211c7b67790SJeremy L Thompson // Check if active input 1212681d0ea7SJeremy L Thompson if (!is_active) continue; 1213c7b67790SJeremy L Thompson // Get size of active input 1214c7b67790SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 1215c7b67790SJeremy L Thompson for (CeedInt field = 0; field < field_size; field++) { 1216c7b67790SJeremy L Thompson // Set current portion of input to 1.0 1217c7b67790SJeremy L Thompson { 1218c7b67790SJeremy L Thompson CeedScalar *array; 1219c7b67790SJeremy L Thompson 1220c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1221c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 1.0; 1222c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1223e13f2367SZach Atkins } 1224c7b67790SJeremy L Thompson 1225e13f2367SZach Atkins if (!impl->is_identity_qf) { 1226e13f2367SZach Atkins // Set Outputs 1227e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1228e13f2367SZach Atkins CeedVector vec; 1229e13f2367SZach Atkins CeedInt field_size; 1230e13f2367SZach Atkins 1231e13f2367SZach Atkins // Get output vector 1232e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1233e13f2367SZach Atkins // Check if active output 1234e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1235e13f2367SZach Atkins CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 1236e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 1237e13f2367SZach Atkins assembled_array += field_size * num_points; // Advance the pointer by the size of the output 1238e13f2367SZach Atkins } 1239681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1240e13f2367SZach Atkins } 1241e13f2367SZach Atkins // Apply QFunction 1242e13f2367SZach Atkins CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1243e13f2367SZach Atkins } else { 1244c7b67790SJeremy L Thompson const CeedScalar *array; 1245e13f2367SZach Atkins CeedInt field_size; 1246e13f2367SZach Atkins 1247e13f2367SZach Atkins // Copy Identity Outputs 1248e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 1249c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &array)); 1250c7b67790SJeremy L Thompson for (CeedInt j = 0; j < field_size * num_points; j++) assembled_array[j] = array[j]; 1251c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &array)); 1252e13f2367SZach Atkins assembled_array += field_size * num_points; 1253e13f2367SZach Atkins } 1254c7b67790SJeremy L Thompson // Reset input to 0.0 1255c7b67790SJeremy L Thompson { 1256c7b67790SJeremy L Thompson CeedScalar *array; 1257c7b67790SJeremy L Thompson 1258c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &array)); 1259c7b67790SJeremy L Thompson for (CeedInt j = 0; j < num_points; j++) array[field * num_points + j] = 0.0; 1260c7b67790SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &array)); 1261c7b67790SJeremy L Thompson } 1262c7b67790SJeremy L Thompson } 1263e13f2367SZach Atkins } 1264e13f2367SZach Atkins num_points_offset += num_points; 1265e13f2367SZach Atkins } 1266e13f2367SZach Atkins 1267e13f2367SZach Atkins // Un-set output Qvecs to prevent accidental overwrite of Assembled 1268e13f2367SZach Atkins if (!impl->is_identity_qf) { 1269e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1270e13f2367SZach Atkins CeedVector vec; 1271e13f2367SZach Atkins 1272e13f2367SZach Atkins // Get output vector 1273e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1274e13f2367SZach Atkins // Check if active output 1275e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 1276e13f2367SZach Atkins CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 1277e13f2367SZach Atkins } 1278681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1279e13f2367SZach Atkins } 1280e13f2367SZach Atkins } 1281e13f2367SZach Atkins 1282e13f2367SZach Atkins // Restore input arrays 1283e13f2367SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 1284e13f2367SZach Atkins 1285e13f2367SZach Atkins // Restore output 1286e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 1287e13f2367SZach Atkins 1288e13f2367SZach Atkins // Cleanup 1289*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 1290e13f2367SZach Atkins CeedCallBackend(CeedVectorDestroy(&point_coords)); 1291e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1292e13f2367SZach Atkins return CEED_ERROR_SUCCESS; 1293e13f2367SZach Atkins } 1294e13f2367SZach Atkins 1295e13f2367SZach Atkins //------------------------------------------------------------------------------ 1296e13f2367SZach Atkins // Assemble Linear QFunction 1297e13f2367SZach Atkins //------------------------------------------------------------------------------ 1298e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPoints_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1299e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, true, assembled, rstr, request); 1300e13f2367SZach Atkins } 1301e13f2367SZach Atkins 1302e13f2367SZach Atkins //------------------------------------------------------------------------------ 1303e13f2367SZach Atkins // Update Assembled Linear QFunction 1304e13f2367SZach Atkins //------------------------------------------------------------------------------ 1305e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, 1306e13f2367SZach Atkins CeedRequest *request) { 1307e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, false, &assembled, &rstr, request); 1308e13f2367SZach Atkins } 1309e13f2367SZach Atkins 1310e13f2367SZach Atkins //------------------------------------------------------------------------------ 1311fb133d4bSJeremy L Thompson // Assemble Operator Diagonal AtPoints 1312e13f2367SZach Atkins //------------------------------------------------------------------------------ 1313fb133d4bSJeremy L Thompson static int CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1314382e9c83SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem, num_comp_active = 1; 1315fb133d4bSJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 1316fb133d4bSJeremy L Thompson Ceed ceed; 1317fb133d4bSJeremy L Thompson CeedVector point_coords = NULL, in_vec, out_vec; 1318fb133d4bSJeremy L Thompson CeedElemRestriction rstr_points = NULL; 1319fb133d4bSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 1320fb133d4bSJeremy L Thompson CeedQFunction qf; 1321fb133d4bSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 1322fb133d4bSJeremy L Thompson CeedOperator_Ref *impl; 1323fb133d4bSJeremy L Thompson 1324fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1325fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1326fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1327fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1328fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1329fb133d4bSJeremy L Thompson 1330fb133d4bSJeremy L Thompson // Setup 1331fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1332fb133d4bSJeremy L Thompson 1333fb133d4bSJeremy L Thompson // Ceed 1334fb133d4bSJeremy L Thompson { 1335fb133d4bSJeremy L Thompson Ceed ceed_parent; 1336fb133d4bSJeremy L Thompson 1337fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1338fb133d4bSJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 1339*9bc66399SJeremy L Thompson CeedCallBackend(CeedReferenceCopy(ceed_parent, &ceed)); 1340*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed_parent)); 1341fb133d4bSJeremy L Thompson } 1342fb133d4bSJeremy L Thompson 1343fb133d4bSJeremy L Thompson // Point coordinates 1344fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1345fb133d4bSJeremy L Thompson 1346fb133d4bSJeremy L Thompson // Input and output vectors 1347fb133d4bSJeremy L Thompson { 1348fb133d4bSJeremy L Thompson CeedSize input_size, output_size; 1349fb133d4bSJeremy L Thompson 1350fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1351fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, input_size, &in_vec)); 1352fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, output_size, &out_vec)); 1353fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(out_vec, 0.0)); 1354fb133d4bSJeremy L Thompson } 1355fb133d4bSJeremy L Thompson 1356382e9c83SJeremy L Thompson // Clear input Qvecs 135786e10729SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1358681d0ea7SJeremy L Thompson bool is_active; 135986e10729SJeremy L Thompson CeedVector vec; 136086e10729SJeremy L Thompson 136186e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1362681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1363681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1364681d0ea7SJeremy L Thompson if (!is_active) continue; 136586e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 136686e10729SJeremy L Thompson } 1367382e9c83SJeremy L Thompson 1368fb133d4bSJeremy L Thompson // Input Evecs and Restriction 1369fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 1370fb133d4bSJeremy L Thompson 1371fb133d4bSJeremy L Thompson // Loop through elements 1372fb133d4bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 1373fb133d4bSJeremy L Thompson CeedInt num_points, e_vec_size = 0; 1374fb133d4bSJeremy L Thompson 1375fb133d4bSJeremy L Thompson // Setup points for element 1376fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1377fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1378fb133d4bSJeremy L Thompson 1379fb133d4bSJeremy L Thompson // Input basis apply for non-active bases 1380fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 1381fb133d4bSJeremy L Thompson impl->point_coords_elem, true, e_data, impl, request)); 1382fb133d4bSJeremy L Thompson 1383fb133d4bSJeremy L Thompson // Loop over points on element 1384fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1385681d0ea7SJeremy L Thompson bool is_active_at_points = true, is_active; 1386382e9c83SJeremy L Thompson CeedInt elem_size_active = 1; 1387382e9c83SJeremy L Thompson CeedRestrictionType rstr_type; 1388fb133d4bSJeremy L Thompson CeedVector vec; 1389382e9c83SJeremy L Thompson CeedElemRestriction elem_rstr; 1390fb133d4bSJeremy L Thompson 1391382e9c83SJeremy L Thompson // -- Skip non-active input 1392681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1393681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1394681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1395681d0ea7SJeremy L Thompson if (!is_active) continue; 1396fb133d4bSJeremy L Thompson 1397382e9c83SJeremy L Thompson // -- Get active restriction type 1398382e9c83SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1399382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1400382e9c83SJeremy L Thompson is_active_at_points = rstr_type == CEED_RESTRICTION_POINTS; 1401382e9c83SJeremy L Thompson if (!is_active_at_points) CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size_active)); 1402382e9c83SJeremy L Thompson else elem_size_active = num_points; 1403382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp_active)); 1404681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1405382e9c83SJeremy L Thompson 1406382e9c83SJeremy L Thompson e_vec_size = elem_size_active * num_comp_active; 1407382e9c83SJeremy L Thompson for (CeedInt s = 0; s < e_vec_size; s++) { 1408382e9c83SJeremy L Thompson CeedEvalMode eval_mode; 1409382e9c83SJeremy L Thompson CeedBasis basis; 1410382e9c83SJeremy L Thompson 1411382e9c83SJeremy L Thompson // -- Update unit vector 1412fb133d4bSJeremy L Thompson { 1413fb133d4bSJeremy L Thompson CeedScalar *array; 1414fb133d4bSJeremy L Thompson 141513062808SJeremy L Thompson if (s == 0) CeedCallBackend(CeedVectorSetValue(impl->e_vecs_in[i], 0.0)); 1416fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_in[i], CEED_MEM_HOST, &array)); 1417fb133d4bSJeremy L Thompson array[s] = 1.0; 1418fb133d4bSJeremy L Thompson if (s > 0) array[s - 1] = 0.0; 1419fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_in[i], &array)); 1420fb133d4bSJeremy L Thompson } 1421382e9c83SJeremy L Thompson // -- Basis action 1422958e607dSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1423fb133d4bSJeremy L Thompson switch (eval_mode) { 1424fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1425fb133d4bSJeremy L Thompson break; 1426fb133d4bSJeremy L Thompson // Note - these basis eval modes require FEM fields 1427fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1428fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1429fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1430fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 1431fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 1432fc0f7cc6SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_NOTRANSPOSE, eval_mode, impl->point_coords_elem, impl->e_vecs_in[i], 1433fb133d4bSJeremy L Thompson impl->q_vecs_in[i])); 1434681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 1435fb133d4bSJeremy L Thompson break; 1436fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: 1437fb133d4bSJeremy L Thompson break; // No action 1438fb133d4bSJeremy L Thompson } 1439fb133d4bSJeremy L Thompson 1440fb133d4bSJeremy L Thompson // -- Q function 1441fb133d4bSJeremy L Thompson if (!impl->is_identity_qf) { 1442fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1443fb133d4bSJeremy L Thompson } 1444fb133d4bSJeremy L Thompson 1445fb133d4bSJeremy L Thompson // -- Output basis apply and restriction 1446fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1447f8a0df59SJeremy L Thompson num_output_fields, impl->apply_add_basis_out, impl->skip_rstr_out, op, out_vec, 1448f8a0df59SJeremy L Thompson impl->point_coords_elem, impl, request)); 1449fb133d4bSJeremy L Thompson 1450fb133d4bSJeremy L Thompson // -- Grab diagonal value 145186e10729SJeremy L Thompson for (CeedInt j = 0; j < num_output_fields; j++) { 1452681d0ea7SJeremy L Thompson bool is_active; 1453382e9c83SJeremy L Thompson CeedInt elem_size = 0; 1454fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1455fb133d4bSJeremy L Thompson CeedEvalMode eval_mode; 1456fb133d4bSJeremy L Thompson CeedVector vec; 1457fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1458fb133d4bSJeremy L Thompson CeedBasis basis; 1459fb133d4bSJeremy L Thompson 14600c7f167fSZach Atkins // ---- Skip non-active output 1461681d0ea7SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[j], &vec)); 1462681d0ea7SJeremy L Thompson is_active = vec == CEED_VECTOR_ACTIVE; 1463681d0ea7SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&vec)); 1464681d0ea7SJeremy L Thompson if (!is_active) continue; 1465fb133d4bSJeremy L Thompson 1466382e9c83SJeremy L Thompson // ---- Check if elem size matches 146786e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[j], &elem_rstr)); 1468382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 146969d19bacSJeremy L Thompson if (is_active_at_points && rstr_type != CEED_RESTRICTION_POINTS) { 147069d19bacSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 147169d19bacSJeremy L Thompson continue; 147269d19bacSJeremy L Thompson } 1473382e9c83SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 1474382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(elem_rstr, e, &elem_size)); 1475382e9c83SJeremy L Thompson } else { 1476382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 1477382e9c83SJeremy L Thompson } 1478382e9c83SJeremy L Thompson { 1479382e9c83SJeremy L Thompson CeedInt num_comp = 0; 1480382e9c83SJeremy L Thompson 1481382e9c83SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp)); 148269d19bacSJeremy L Thompson if (e_vec_size != num_comp * elem_size) { 148369d19bacSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 148469d19bacSJeremy L Thompson continue; 148569d19bacSJeremy L Thompson } 1486382e9c83SJeremy L Thompson } 1487382e9c83SJeremy L Thompson 1488fb133d4bSJeremy L Thompson // ---- Basis action 148986e10729SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[j], &eval_mode)); 1490fb133d4bSJeremy L Thompson switch (eval_mode) { 1491fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1492fb133d4bSJeremy L Thompson break; // No action 1493fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1494fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1495fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1496fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 149786e10729SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[j], &basis)); 149886e10729SJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, 1, &num_points, CEED_TRANSPOSE, eval_mode, impl->point_coords_elem, impl->q_vecs_out[j], 149986e10729SJeremy L Thompson impl->e_vecs_out[j])); 1500681d0ea7SJeremy L Thompson CeedCallBackend(CeedBasisDestroy(&basis)); 1501fb133d4bSJeremy L Thompson break; 1502fb133d4bSJeremy L Thompson // LCOV_EXCL_START 1503fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: { 1504fb133d4bSJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 1505fb133d4bSJeremy L Thompson // LCOV_EXCL_STOP 1506fb133d4bSJeremy L Thompson } 1507fb133d4bSJeremy L Thompson } 1508fb133d4bSJeremy L Thompson // ---- Update output vector 1509fb133d4bSJeremy L Thompson { 1510fb133d4bSJeremy L Thompson CeedScalar *array, current_value = 0.0; 1511fb133d4bSJeremy L Thompson 151286e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1513fb133d4bSJeremy L Thompson current_value = array[s]; 151486e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 151586e10729SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->e_vecs_out[j], 0.0)); 151686e10729SJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[j], CEED_MEM_HOST, &array)); 1517fb133d4bSJeremy L Thompson array[s] = current_value; 151886e10729SJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[j], &array)); 1519fb133d4bSJeremy L Thompson } 1520fb133d4bSJeremy L Thompson // ---- Restrict output block 1521fb133d4bSJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 152286e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1523fb133d4bSJeremy L Thompson } else { 152486e10729SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[j], assembled, request)); 1525fb133d4bSJeremy L Thompson } 1526681d0ea7SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&elem_rstr)); 1527fb133d4bSJeremy L Thompson } 1528382e9c83SJeremy L Thompson // -- Reset unit vector 152913062808SJeremy L Thompson if (s == e_vec_size - 1) CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 1530382e9c83SJeremy L Thompson } 1531fb133d4bSJeremy L Thompson } 1532fb133d4bSJeremy L Thompson num_points_offset += num_points; 1533fb133d4bSJeremy L Thompson } 1534fb133d4bSJeremy L Thompson 1535fb133d4bSJeremy L Thompson // Restore input arrays 1536fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 1537fb133d4bSJeremy L Thompson 1538fb133d4bSJeremy L Thompson // Cleanup 1539*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 1540fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&in_vec)); 1541fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&out_vec)); 1542fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 1543fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1544fb133d4bSJeremy L Thompson return CEED_ERROR_SUCCESS; 1545fb133d4bSJeremy L Thompson } 1546e13f2367SZach Atkins 1547e13f2367SZach Atkins //------------------------------------------------------------------------------ 1548f10650afSjeremylt // Operator Destroy 1549f10650afSjeremylt //------------------------------------------------------------------------------ 1550f10650afSjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) { 1551f10650afSjeremylt CeedOperator_Ref *impl; 1552f10650afSjeremylt 1553ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 15543aab95c0SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_in)); 1555f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->skip_rstr_out)); 1556f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_data_out_indices)); 1557f8a0df59SJeremy L Thompson CeedCallBackend(CeedFree(&impl->apply_add_basis_out)); 15584fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs + impl->num_outputs; i++) { 15592b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_full[i])); 1560f10650afSjeremylt } 15612b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_full)); 15622b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->input_states)); 1563f10650afSjeremylt 15644fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs; i++) { 15652b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_in[i])); 15662b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_in[i])); 1567f10650afSjeremylt } 15682b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_in)); 15692b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_in)); 1570f10650afSjeremylt 15714fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_outputs; i++) { 15722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_out[i])); 15732b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_out[i])); 1574f10650afSjeremylt } 15752b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_out)); 15762b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_out)); 157748acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->point_coords_elem)); 1578f10650afSjeremylt 15792b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl)); 1580e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 1581f10650afSjeremylt } 1582f10650afSjeremylt 1583f10650afSjeremylt //------------------------------------------------------------------------------ 1584713f43c3Sjeremylt // Operator Create 1585f10650afSjeremylt //------------------------------------------------------------------------------ 158621617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) { 1587fe2413ffSjeremylt Ceed ceed; 15884ce2993fSjeremylt CeedOperator_Ref *impl; 158921617c04Sjeremylt 1590ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 15912b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 15922b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 15932b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunction_Ref)); 15942b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionUpdate_Ref)); 15952b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAdd_Ref)); 15962b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1597*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 1598e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 159921617c04Sjeremylt } 16002a86cc9dSSebastian Grimberg 16012a86cc9dSSebastian Grimberg //------------------------------------------------------------------------------ 160248acf710SJeremy L Thompson // Operator Create At Points 160348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 160448acf710SJeremy L Thompson int CeedOperatorCreateAtPoints_Ref(CeedOperator op) { 160548acf710SJeremy L Thompson Ceed ceed; 160648acf710SJeremy L Thompson CeedOperator_Ref *impl; 160748acf710SJeremy L Thompson 160848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 160948acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 161048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 1611e13f2367SZach Atkins CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunctionAtPoints_Ref)); 1612e13f2367SZach Atkins CeedCallBackend( 1613e13f2367SZach Atkins CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref)); 1614fb133d4bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleAddDiagonal", CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref)); 161548acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAddAtPoints_Ref)); 161648acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1617*9bc66399SJeremy L Thompson CeedCallBackend(CeedDestroy(&ceed)); 161848acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 161948acf710SJeremy L Thompson } 162048acf710SJeremy L Thompson 162148acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1622