15aed82e4SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 321617c04Sjeremylt // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 521617c04Sjeremylt // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 721617c04Sjeremylt 849aac155SJeremy L Thompson #include <ceed.h> 9ec3da8bcSJed Brown #include <ceed/backend.h> 103d576824SJeremy L Thompson #include <stdbool.h> 113d576824SJeremy L Thompson #include <stddef.h> 123d576824SJeremy L Thompson #include <stdint.h> 132b730f8bSJeremy L Thompson 1421617c04Sjeremylt #include "ceed-ref.h" 1521617c04Sjeremylt 16f10650afSjeremylt //------------------------------------------------------------------------------ 17f10650afSjeremylt // Setup Input/Output Fields 18f10650afSjeremylt //------------------------------------------------------------------------------ 192b730f8bSJeremy L Thompson static int CeedOperatorSetupFields_Ref(CeedQFunction qf, CeedOperator op, bool is_input, CeedVector *e_vecs_full, CeedVector *e_vecs, 202b730f8bSJeremy L Thompson CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, CeedInt Q) { 21aedaa0e5Sjeremylt Ceed ceed; 226efa0d72SZach Atkins CeedSize e_size, q_size; 23ad70ee2cSJeremy L Thompson CeedInt num_comp, size, P; 24d1d35e2fSjeremylt CeedQFunctionField *qf_fields; 25ad70ee2cSJeremy L Thompson CeedOperatorField *op_fields; 26ad70ee2cSJeremy L Thompson 27e910d748SJeremy L Thompson { 28e910d748SJeremy L Thompson Ceed ceed_parent; 29e910d748SJeremy L Thompson 30ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 31e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 32e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 33e910d748SJeremy L Thompson } 344fc1f125SJeremy L Thompson if (is_input) { 352b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 362b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 374fc1f125SJeremy L Thompson } else { 382b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 392b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 40fe2413ffSjeremylt } 4121617c04Sjeremylt 42885ac19cSjeremylt // Loop over fields 43d1d35e2fSjeremylt for (CeedInt i = 0; i < num_fields; i++) { 44d1d35e2fSjeremylt CeedEvalMode eval_mode; 45edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 46ad70ee2cSJeremy L Thompson CeedBasis basis; 47d1d35e2fSjeremylt 48ad70ee2cSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 49d1d35e2fSjeremylt if (eval_mode != CEED_EVAL_WEIGHT) { 50edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 51edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 52135a076eSjeremylt } 53135a076eSjeremylt 54d1d35e2fSjeremylt switch (eval_mode) { 55885ac19cSjeremylt case CEED_EVAL_NONE: 562b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 57d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 582b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 59aedaa0e5Sjeremylt break; 60aedaa0e5Sjeremylt case CEED_EVAL_INTERP: 61885ac19cSjeremylt case CEED_EVAL_GRAD: 62a915a514Srezgarshakeri case CEED_EVAL_DIV: 63c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 642b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 652b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 662b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 672b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 68d2643443SJeremy L Thompson e_size = (CeedSize)P * num_comp; 692b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 70d2643443SJeremy L Thompson q_size = (CeedSize)Q * size; 712b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 72885ac19cSjeremylt break; 73885ac19cSjeremylt case CEED_EVAL_WEIGHT: // Only on input fields 742b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 75d2643443SJeremy L Thompson q_size = (CeedSize)Q; 762b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 772b730f8bSJeremy L Thompson CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_vecs[i])); 78885ac19cSjeremylt break; 7921617c04Sjeremylt } 80885ac19cSjeremylt } 81e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 8221617c04Sjeremylt } 8321617c04Sjeremylt 84f10650afSjeremylt //------------------------------------------------------------------------------ 85f10650afSjeremylt // Setup Operator 86f10650afSjeremylt //------------------------------------------------------------------------------/* 87885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) { 888c1105f8SJeremy L Thompson bool is_setup_done; 89ad70ee2cSJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 90ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 91ad70ee2cSJeremy L Thompson CeedQFunction qf; 92ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 93ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 94ad70ee2cSJeremy L Thompson 952b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 968c1105f8SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 97ad70ee2cSJeremy L Thompson 982b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 992b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1002b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 1012b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 1022b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1032b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 104885ac19cSjeremylt 105885ac19cSjeremylt // Allocate 1062b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 107885ac19cSjeremylt 1082b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 1092b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 1102b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 1112b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 1122b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 113885ac19cSjeremylt 1144fc1f125SJeremy L Thompson impl->num_inputs = num_input_fields; 1154fc1f125SJeremy L Thompson impl->num_outputs = num_output_fields; 116885ac19cSjeremylt 117d1d35e2fSjeremylt // Set up infield and outfield e_vecs and q_vecs 118885ac19cSjeremylt // Infields 1192b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupFields_Ref(qf, op, true, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, num_input_fields, Q)); 120885ac19cSjeremylt // Outfields 1212b730f8bSJeremy L Thompson CeedCallBackend( 1222b730f8bSJeremy L Thompson CeedOperatorSetupFields_Ref(qf, op, false, impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, num_output_fields, Q)); 123885ac19cSjeremylt 12416911fdaSjeremylt // Identity QFunctions 1250b454692Sjeremylt if (impl->is_identity_qf) { 126d1d35e2fSjeremylt CeedEvalMode in_mode, out_mode; 127d1d35e2fSjeremylt CeedQFunctionField *in_fields, *out_fields; 128ad70ee2cSJeremy L Thompson 1292b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &in_fields, NULL, &out_fields)); 1302b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(in_fields[0], &in_mode)); 1312b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(out_fields[0], &out_mode)); 132d1d35e2fSjeremylt 1330b454692Sjeremylt if (in_mode == CEED_EVAL_NONE && out_mode == CEED_EVAL_NONE) { 134edb2538eSJeremy L Thompson impl->is_identity_rstr_op = true; 1350b454692Sjeremylt } else { 136db002c03SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 13716911fdaSjeremylt } 13816911fdaSjeremylt } 13916911fdaSjeremylt 1402b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 141e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 142885ac19cSjeremylt } 143885ac19cSjeremylt 144f10650afSjeremylt //------------------------------------------------------------------------------ 145f10650afSjeremylt // Setup Operator Inputs 146f10650afSjeremylt //------------------------------------------------------------------------------ 1472b730f8bSJeremy L Thompson static inline int CeedOperatorSetupInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 1482b730f8bSJeremy L Thompson CeedVector in_vec, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 149a0162de9SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 150ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 151ad70ee2cSJeremy L Thompson uint64_t state; 152d1d35e2fSjeremylt CeedEvalMode eval_mode; 153d1bcdac9Sjeremylt CeedVector vec; 154edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 155885ac19cSjeremylt 156d1bcdac9Sjeremylt // Get input vector 1572b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1581d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1592b730f8bSJeremy L Thompson if (skip_active) continue; 1602b730f8bSJeremy L Thompson else vec = in_vec; 1611d102b48SJeremy L Thompson } 1621d102b48SJeremy L Thompson 1632b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1641d102b48SJeremy L Thompson // Restrict and Evec 165d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 1661d102b48SJeremy L Thompson } else { 167668048e2SJed Brown // Restrict 1682b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetState(vec, &state)); 1698d713cf6Sjeremylt // Skip restriction if input is unchanged 1704fc1f125SJeremy L Thompson if (state != impl->input_states[i] || vec == in_vec) { 171edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 172edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, vec, impl->e_vecs_full[i], request)); 1734fc1f125SJeremy L Thompson impl->input_states[i] = state; 1748d713cf6Sjeremylt } 175668048e2SJed Brown // Get evec 1762b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayRead(impl->e_vecs_full[i], CEED_MEM_HOST, (const CeedScalar **)&e_data_full[i])); 177885ac19cSjeremylt } 178885ac19cSjeremylt } 179e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 180885ac19cSjeremylt } 181885ac19cSjeremylt 182f10650afSjeremylt //------------------------------------------------------------------------------ 183f10650afSjeremylt // Input Basis Action 184f10650afSjeremylt //------------------------------------------------------------------------------ 1852b730f8bSJeremy L Thompson static inline int CeedOperatorInputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 1862b730f8bSJeremy L Thompson CeedInt num_input_fields, const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], 1872b730f8bSJeremy L Thompson CeedOperator_Ref *impl) { 188ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 189a915a514Srezgarshakeri CeedInt elem_size, size, num_comp; 190d1d35e2fSjeremylt CeedEvalMode eval_mode; 191edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 1921d102b48SJeremy L Thompson CeedBasis basis; 1931d102b48SJeremy L Thompson 1941d102b48SJeremy L Thompson // Skip active input 195d1d35e2fSjeremylt if (skip_active) { 1961d102b48SJeremy L Thompson CeedVector vec; 197ad70ee2cSJeremy L Thompson 1982b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1992b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 2001d102b48SJeremy L Thompson } 201d1d35e2fSjeremylt // Get elem_size, eval_mode, size 202edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 203edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2042b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 2052b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 206885ac19cSjeremylt // Basis action 207d1d35e2fSjeremylt switch (eval_mode) { 208885ac19cSjeremylt case CEED_EVAL_NONE: 20981670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * Q * size])); 210885ac19cSjeremylt break; 211885ac19cSjeremylt case CEED_EVAL_INTERP: 212885ac19cSjeremylt case CEED_EVAL_GRAD: 213a915a514Srezgarshakeri case CEED_EVAL_DIV: 214c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 215a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 216a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 21781670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i][(CeedSize)e * elem_size * num_comp])); 218c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, eval_mode, impl->e_vecs_in[i], impl->q_vecs_in[i])); 219a915a514Srezgarshakeri break; 220885ac19cSjeremylt case CEED_EVAL_WEIGHT: 221885ac19cSjeremylt break; // No action 222885ac19cSjeremylt } 223885ac19cSjeremylt } 224e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 225885ac19cSjeremylt } 226885ac19cSjeremylt 227f10650afSjeremylt //------------------------------------------------------------------------------ 228f10650afSjeremylt // Output Basis Action 229f10650afSjeremylt //------------------------------------------------------------------------------ 2302b730f8bSJeremy L Thompson static inline int CeedOperatorOutputBasis_Ref(CeedInt e, CeedInt Q, CeedQFunctionField *qf_output_fields, CeedOperatorField *op_output_fields, 231d1d35e2fSjeremylt CeedInt num_input_fields, CeedInt num_output_fields, CeedOperator op, 2324fc1f125SJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 233ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 234a915a514Srezgarshakeri CeedInt elem_size, num_comp; 235d1d35e2fSjeremylt CeedEvalMode eval_mode; 236edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 2371d102b48SJeremy L Thompson CeedBasis basis; 2381d102b48SJeremy L Thompson 239a915a514Srezgarshakeri // Get elem_size, eval_mode 240edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 241edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 2422b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 243885ac19cSjeremylt // Basis action 244d1d35e2fSjeremylt switch (eval_mode) { 245885ac19cSjeremylt case CEED_EVAL_NONE: 246885ac19cSjeremylt break; // No action 247885ac19cSjeremylt case CEED_EVAL_INTERP: 248885ac19cSjeremylt case CEED_EVAL_GRAD: 249a915a514Srezgarshakeri case CEED_EVAL_DIV: 250c4e3f59bSSebastian Grimberg case CEED_EVAL_CURL: 251a915a514Srezgarshakeri CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 252a915a514Srezgarshakeri CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 25381670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, 25481670346SSebastian Grimberg &e_data_full[i + num_input_fields][(CeedSize)e * elem_size * num_comp])); 255c4e3f59bSSebastian Grimberg CeedCallBackend(CeedBasisApply(basis, 1, CEED_TRANSPOSE, eval_mode, impl->q_vecs_out[i], impl->e_vecs_out[i])); 256a915a514Srezgarshakeri break; 257c042f62fSJeremy L Thompson // LCOV_EXCL_START 258bbfacfcdSjeremylt case CEED_EVAL_WEIGHT: { 2596e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 2601d102b48SJeremy L Thompson // LCOV_EXCL_STOP 261885ac19cSjeremylt } 262885ac19cSjeremylt } 263885ac19cSjeremylt } 264e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 2651d102b48SJeremy L Thompson } 2661d102b48SJeremy L Thompson 267f10650afSjeremylt //------------------------------------------------------------------------------ 268f10650afSjeremylt // Restore Input Vectors 269f10650afSjeremylt //------------------------------------------------------------------------------ 2702b730f8bSJeremy L Thompson static inline int CeedOperatorRestoreInputs_Ref(CeedInt num_input_fields, CeedQFunctionField *qf_input_fields, CeedOperatorField *op_input_fields, 2712b730f8bSJeremy L Thompson const bool skip_active, CeedScalar *e_data_full[2 * CEED_FIELD_MAX], CeedOperator_Ref *impl) { 272ad70ee2cSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 273d1d35e2fSjeremylt CeedEvalMode eval_mode; 2741d102b48SJeremy L Thompson 2751d102b48SJeremy L Thompson // Skip active inputs 276d1d35e2fSjeremylt if (skip_active) { 2771d102b48SJeremy L Thompson CeedVector vec; 278ad70ee2cSJeremy L Thompson 2792b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 2802b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) continue; 2811d102b48SJeremy L Thompson } 2821d102b48SJeremy L Thompson // Restore input 2832b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 284d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_WEIGHT) { // Skip 2851d102b48SJeremy L Thompson } else { 2862b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArrayRead(impl->e_vecs_full[i], (const CeedScalar **)&e_data_full[i])); 2871d102b48SJeremy L Thompson } 2881d102b48SJeremy L Thompson } 289e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 2901d102b48SJeremy L Thompson } 2911d102b48SJeremy L Thompson 292f10650afSjeremylt //------------------------------------------------------------------------------ 293f10650afSjeremylt // Operator Apply 294f10650afSjeremylt //------------------------------------------------------------------------------ 2952b730f8bSJeremy L Thompson static int CeedOperatorApplyAdd_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 296d1d35e2fSjeremylt CeedInt Q, num_elem, num_input_fields, num_output_fields, size; 297ad70ee2cSJeremy L Thompson CeedEvalMode eval_mode; 298ad70ee2cSJeremy L Thompson CeedScalar *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 299ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 300ad70ee2cSJeremy L Thompson CeedQFunction qf; 301ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 302ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 303ad70ee2cSJeremy L Thompson 304ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 305ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 3062b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 3072b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 3082b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 3092b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 3101d102b48SJeremy L Thompson 3111d102b48SJeremy L Thompson // Setup 3122b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 3131d102b48SJeremy L Thompson 3140b454692Sjeremylt // Restriction only operator 315edb2538eSJeremy L Thompson if (impl->is_identity_rstr_op) { 316edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 317ad70ee2cSJeremy L Thompson 318edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[0], &elem_rstr)); 319edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_full[0], request)); 320edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[0], &elem_rstr)); 321edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[0], out_vec, request)); 3220b454692Sjeremylt return CEED_ERROR_SUCCESS; 3230b454692Sjeremylt } 3240b454692Sjeremylt 3251d102b48SJeremy L Thompson // Input Evecs and Restriction 3262b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, in_vec, false, e_data_full, impl, request)); 3271d102b48SJeremy L Thompson 3281d102b48SJeremy L Thompson // Output Evecs 329d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 3302b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorGetArrayWrite(impl->e_vecs_full[i + impl->num_inputs], CEED_MEM_HOST, &e_data_full[i + num_input_fields])); 3311d102b48SJeremy L Thompson } 3321d102b48SJeremy L Thompson 3331d102b48SJeremy L Thompson // Loop through elements 334d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 3351d102b48SJeremy L Thompson // Output pointers 336d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 3372b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 338d1d35e2fSjeremylt if (eval_mode == CEED_EVAL_NONE) { 3392b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 34081670346SSebastian Grimberg CeedCallBackend( 34181670346SSebastian Grimberg CeedVectorSetArray(impl->q_vecs_out[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data_full[i + num_input_fields][(CeedSize)e * Q * size])); 3421d102b48SJeremy L Thompson } 3431d102b48SJeremy L Thompson } 3441d102b48SJeremy L Thompson 34516911fdaSjeremylt // Input basis apply 3462b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, false, e_data_full, impl)); 34716911fdaSjeremylt 3481d102b48SJeremy L Thompson // Q function 3490b454692Sjeremylt if (!impl->is_identity_qf) { 3502b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 35116911fdaSjeremylt } 3521d102b48SJeremy L Thompson 3531d102b48SJeremy L Thompson // Output basis apply 3542b730f8bSJeremy L Thompson CeedCallBackend( 3552b730f8bSJeremy L Thompson CeedOperatorOutputBasis_Ref(e, Q, qf_output_fields, op_output_fields, num_input_fields, num_output_fields, op, e_data_full, impl)); 3561d102b48SJeremy L Thompson } 357885ac19cSjeremylt 358885ac19cSjeremylt // Output restriction 359d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 360ad70ee2cSJeremy L Thompson CeedVector vec; 361edb2538eSJeremy L Thompson CeedElemRestriction elem_rstr; 362ad70ee2cSJeremy L Thompson 363d1d35e2fSjeremylt // Restore Evec 3642b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_full[i + impl->num_inputs], &e_data_full[i + num_input_fields])); 365d1bcdac9Sjeremylt // Get output vector 3662b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 367668048e2SJed Brown // Active 3682b730f8bSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 3697ca8db16Sjeremylt // Restrict 370edb2538eSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 371edb2538eSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, impl->e_vecs_full[i + impl->num_inputs], vec, request)); 372885ac19cSjeremylt } 373885ac19cSjeremylt 3747ca8db16Sjeremylt // Restore input arrays 3752b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, false, e_data_full, impl)); 376e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 37721617c04Sjeremylt } 37821617c04Sjeremylt 379f10650afSjeremylt //------------------------------------------------------------------------------ 38070a7ffb3SJeremy L Thompson // Core code for assembling linear QFunction 381f10650afSjeremylt //------------------------------------------------------------------------------ 3822b730f8bSJeremy L Thompson static inline int CeedOperatorLinearAssembleQFunctionCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, CeedElemRestriction *rstr, 38370a7ffb3SJeremy L Thompson CeedRequest *request) { 384e910d748SJeremy L Thompson Ceed ceed, ceed_parent; 385e984cf9aSJeremy L Thompson CeedSize q_size; 386ad70ee2cSJeremy L Thompson CeedInt num_active_in, num_active_out, Q, num_elem, num_input_fields, num_output_fields, size; 387ad70ee2cSJeremy L Thompson CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 388ad70ee2cSJeremy L Thompson CeedVector *active_in; 389ad70ee2cSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 390ad70ee2cSJeremy L Thompson CeedQFunction qf; 391ad70ee2cSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 392ad70ee2cSJeremy L Thompson CeedOperator_Ref *impl; 393ad70ee2cSJeremy L Thompson 3942b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 395e910d748SJeremy L Thompson CeedCallBackend(CeedOperatorGetFallbackParentCeed(op, &ceed_parent)); 396e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 397e984cf9aSJeremy L Thompson active_in = impl->qf_active_in; 398e984cf9aSJeremy L Thompson num_active_in = impl->num_active_in, num_active_out = impl->num_active_out; 399e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 400e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 401e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 402e984cf9aSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 403e984cf9aSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 4041d102b48SJeremy L Thompson 4051d102b48SJeremy L Thompson // Setup 4062b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetup_Ref(op)); 4071d102b48SJeremy L Thompson 408506b1a0cSSebastian Grimberg // Check for restriction only operator 409506b1a0cSSebastian Grimberg CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 41016911fdaSjeremylt 4111d102b48SJeremy L Thompson // Input Evecs and Restriction 4122b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 4131d102b48SJeremy L Thompson 4141d102b48SJeremy L Thompson // Count number of active input fields 415bb219a0fSJeremy L Thompson if (!num_active_in) { 416d1d35e2fSjeremylt for (CeedInt i = 0; i < num_input_fields; i++) { 417ad70ee2cSJeremy L Thompson CeedScalar *q_vec_array; 418ad70ee2cSJeremy L Thompson CeedVector vec; 419ad70ee2cSJeremy L Thompson 4201d102b48SJeremy L Thompson // Get input vector 4212b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 4221d102b48SJeremy L Thompson // Check if active input 4231d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 4242b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 4252b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 426ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &q_vec_array)); 4272b730f8bSJeremy L Thompson CeedCallBackend(CeedRealloc(num_active_in + size, &active_in)); 4281d102b48SJeremy L Thompson for (CeedInt field = 0; field < size; field++) { 429d2643443SJeremy L Thompson q_size = (CeedSize)Q; 430e910d748SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_parent, q_size, &active_in[num_active_in + field])); 431ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(active_in[num_active_in + field], CEED_MEM_HOST, CEED_USE_POINTER, &q_vec_array[field * Q])); 4321d102b48SJeremy L Thompson } 433d1d35e2fSjeremylt num_active_in += size; 434ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &q_vec_array)); 4351d102b48SJeremy L Thompson } 4361d102b48SJeremy L Thompson } 4374fc1f125SJeremy L Thompson impl->num_active_in = num_active_in; 438bb219a0fSJeremy L Thompson impl->qf_active_in = active_in; 439bb219a0fSJeremy L Thompson } 4401d102b48SJeremy L Thompson 4411d102b48SJeremy L Thompson // Count number of active output fields 442bb219a0fSJeremy L Thompson if (!num_active_out) { 443d1d35e2fSjeremylt for (CeedInt i = 0; i < num_output_fields; i++) { 444ad70ee2cSJeremy L Thompson CeedVector vec; 445ad70ee2cSJeremy L Thompson 4461d102b48SJeremy L Thompson // Get output vector 4472b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 4481d102b48SJeremy L Thompson // Check if active output 4491d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 4502b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &size)); 451d1d35e2fSjeremylt num_active_out += size; 4521d102b48SJeremy L Thompson } 4531d102b48SJeremy L Thompson } 4544fc1f125SJeremy L Thompson impl->num_active_out = num_active_out; 455bb219a0fSJeremy L Thompson } 4561d102b48SJeremy L Thompson 4571d102b48SJeremy L Thompson // Check sizes 4586574a04fSJeremy L Thompson CeedCheck(num_active_in > 0 && num_active_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 4591d102b48SJeremy L Thompson 46070a7ffb3SJeremy L Thompson // Build objects if needed 46170a7ffb3SJeremy L Thompson if (build_objects) { 462ad70ee2cSJeremy L Thompson const CeedSize l_size = (CeedSize)num_elem * Q * num_active_in * num_active_out; 463d1d35e2fSjeremylt CeedInt strides[3] = {1, Q, num_active_in * num_active_out * Q}; /* *NOPAD* */ 464ad70ee2cSJeremy L Thompson 465ad70ee2cSJeremy L Thompson // Create output restriction 466e910d748SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, Q, num_active_in * num_active_out, 4672b730f8bSJeremy L Thompson num_active_in * num_active_out * num_elem * Q, strides, rstr)); 4681d102b48SJeremy L Thompson // Create assembled vector 469e910d748SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed_parent, l_size, assembled)); 47070a7ffb3SJeremy L Thompson } 47170a7ffb3SJeremy L Thompson // Clear output vector 4722b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 473ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 4741d102b48SJeremy L Thompson 4751d102b48SJeremy L Thompson // Loop through elements 476d1d35e2fSjeremylt for (CeedInt e = 0; e < num_elem; e++) { 4771d102b48SJeremy L Thompson // Input basis apply 4782b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasis_Ref(e, Q, qf_input_fields, op_input_fields, num_input_fields, true, e_data_full, impl)); 4791d102b48SJeremy L Thompson 4801d102b48SJeremy L Thompson // Assemble QFunction 481d1d35e2fSjeremylt for (CeedInt in = 0; in < num_active_in; in++) { 4821d102b48SJeremy L Thompson // Set Inputs 4832b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(active_in[in], 1.0)); 484d1d35e2fSjeremylt if (num_active_in > 1) { 4852b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(active_in[(in + num_active_in - 1) % num_active_in], 0.0)); 48642ea3801Sjeremylt } 487506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 4881d102b48SJeremy L Thompson // Set Outputs 489d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 490ad70ee2cSJeremy L Thompson CeedVector vec; 491ad70ee2cSJeremy L Thompson 4921d102b48SJeremy L Thompson // Get output vector 4932b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 4941d102b48SJeremy L Thompson // Check if active output 4951d102b48SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 496ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 4972b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &size)); 498ad70ee2cSJeremy L Thompson assembled_array += size * Q; // Advance the pointer by the size of the output 4991d102b48SJeremy L Thompson } 5001d102b48SJeremy L Thompson } 5011d102b48SJeremy L Thompson // Apply QFunction 5022b730f8bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, Q, impl->q_vecs_in, impl->q_vecs_out)); 503506b1a0cSSebastian Grimberg } else { 504506b1a0cSSebastian Grimberg const CeedScalar *q_vec_array; 505506b1a0cSSebastian Grimberg 506506b1a0cSSebastian Grimberg // Copy Identity Outputs 507506b1a0cSSebastian Grimberg CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &size)); 508506b1a0cSSebastian Grimberg CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &q_vec_array)); 509506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < size * Q; i++) assembled_array[i] = q_vec_array[i]; 510506b1a0cSSebastian Grimberg CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &q_vec_array)); 511506b1a0cSSebastian Grimberg assembled_array += size * Q; 512506b1a0cSSebastian Grimberg } 5131d102b48SJeremy L Thompson } 5141d102b48SJeremy L Thompson } 5151d102b48SJeremy L Thompson 5161d102b48SJeremy L Thompson // Un-set output Qvecs to prevent accidental overwrite of Assembled 517506b1a0cSSebastian Grimberg if (!impl->is_identity_qf) { 518d1d35e2fSjeremylt for (CeedInt out = 0; out < num_output_fields; out++) { 519ad70ee2cSJeremy L Thompson CeedVector vec; 520ad70ee2cSJeremy L Thompson 5211d102b48SJeremy L Thompson // Get output vector 5222b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 5231d102b48SJeremy L Thompson // Check if active output 524056ea4bdSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 5252b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 5261d102b48SJeremy L Thompson } 5271d102b48SJeremy L Thompson } 528506b1a0cSSebastian Grimberg } 5291d102b48SJeremy L Thompson 5301d102b48SJeremy L Thompson // Restore input arrays 5312b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 5321d102b48SJeremy L Thompson 5331d102b48SJeremy L Thompson // Restore output 534ad70ee2cSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 535e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 5361d102b48SJeremy L Thompson } 5371d102b48SJeremy L Thompson 538f10650afSjeremylt //------------------------------------------------------------------------------ 53970a7ffb3SJeremy L Thompson // Assemble Linear QFunction 54070a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 5412b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunction_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 5422b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, true, assembled, rstr, request); 54370a7ffb3SJeremy L Thompson } 54470a7ffb3SJeremy L Thompson 54570a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 54670a7ffb3SJeremy L Thompson // Update Assembled Linear QFunction 54770a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 5482b730f8bSJeremy L Thompson static int CeedOperatorLinearAssembleQFunctionUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, CeedRequest *request) { 5492b730f8bSJeremy L Thompson return CeedOperatorLinearAssembleQFunctionCore_Ref(op, false, &assembled, &rstr, request); 55070a7ffb3SJeremy L Thompson } 55170a7ffb3SJeremy L Thompson 55270a7ffb3SJeremy L Thompson //------------------------------------------------------------------------------ 55348acf710SJeremy L Thompson // Setup Input/Output Fields 55448acf710SJeremy L Thompson //------------------------------------------------------------------------------ 55548acf710SJeremy L Thompson static int CeedOperatorSetupFieldsAtPoints_Ref(CeedQFunction qf, CeedOperator op, bool is_input, CeedVector *e_vecs_full, CeedVector *e_vecs, 55648acf710SJeremy L Thompson CeedVector *q_vecs, CeedInt start_e, CeedInt num_fields, CeedInt Q) { 55748acf710SJeremy L Thompson Ceed ceed; 55848acf710SJeremy L Thompson CeedSize e_size, q_size; 559ff1bc20eSJeremy L Thompson CeedInt max_num_points, num_comp, size, P; 56048acf710SJeremy L Thompson CeedQFunctionField *qf_fields; 56148acf710SJeremy L Thompson CeedOperatorField *op_fields; 56248acf710SJeremy L Thompson 563e910d748SJeremy L Thompson { 564e910d748SJeremy L Thompson Ceed ceed_parent; 565e910d748SJeremy L Thompson 56648acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 567e910d748SJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 568e910d748SJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 569e910d748SJeremy L Thompson } 57048acf710SJeremy L Thompson if (is_input) { 57148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 57248acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 57348acf710SJeremy L Thompson } else { 57448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 57548acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, NULL, NULL, &qf_fields)); 57648acf710SJeremy L Thompson } 57748acf710SJeremy L Thompson 57848acf710SJeremy L Thompson // Get max number of points 57948acf710SJeremy L Thompson { 58048acf710SJeremy L Thompson CeedInt dim; 58148acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 58248acf710SJeremy L Thompson CeedOperator_Ref *impl; 58348acf710SJeremy L Thompson 58448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, NULL)); 58548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 58648acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(rstr_points, &dim)); 58748acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 58848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 589b37f8825SJeremy L Thompson if (is_input) { 590b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, dim * max_num_points, &impl->point_coords_elem)); 591b37f8825SJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->point_coords_elem, 0.0)); 592b37f8825SJeremy L Thompson } 59348acf710SJeremy L Thompson } 59448acf710SJeremy L Thompson 59548acf710SJeremy L Thompson // Loop over fields 59648acf710SJeremy L Thompson for (CeedInt i = 0; i < num_fields; i++) { 59748acf710SJeremy L Thompson CeedEvalMode eval_mode; 59848acf710SJeremy L Thompson CeedBasis basis; 59948acf710SJeremy L Thompson 60048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 60148acf710SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) { 60248acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 60348acf710SJeremy L Thompson 60448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr)); 60548acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionCreateVector(elem_rstr, NULL, &e_vecs_full[i + start_e])); 606ff1bc20eSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(e_vecs_full[i + start_e], 0.0)); 6076efa0d72SZach Atkins } 60848acf710SJeremy L Thompson 60948acf710SJeremy L Thompson switch (eval_mode) { 61038e83183SJeremy L Thompson case CEED_EVAL_NONE: { 61138e83183SJeremy L Thompson CeedVector vec; 61238e83183SJeremy L Thompson 61348acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 61448acf710SJeremy L Thompson e_size = (CeedSize)max_num_points * size; 61548acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 61638e83183SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_fields[i], &vec)); 61738e83183SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE || !is_input) { 61838e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(e_vecs[i], &q_vecs[i])); 61938e83183SJeremy L Thompson } else { 62048acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 62148acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 62238e83183SJeremy L Thompson } 62348acf710SJeremy L Thompson break; 62438e83183SJeremy L Thompson } 62548acf710SJeremy L Thompson case CEED_EVAL_INTERP: 62648acf710SJeremy L Thompson case CEED_EVAL_GRAD: 62748acf710SJeremy L Thompson case CEED_EVAL_DIV: 62848acf710SJeremy L Thompson case CEED_EVAL_CURL: 62948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 63048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_fields[i], &size)); 63148acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumNodes(basis, &P)); 63248acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 63348acf710SJeremy L Thompson e_size = (CeedSize)P * num_comp; 63448acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, e_size, &e_vecs[i])); 63548acf710SJeremy L Thompson q_size = (CeedSize)max_num_points * size; 63648acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 63748acf710SJeremy L Thompson break; 63848acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: // Only on input fields 63948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 64048acf710SJeremy L Thompson q_size = (CeedSize)max_num_points; 64148acf710SJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, q_size, &q_vecs[i])); 64248acf710SJeremy L Thompson CeedCallBackend( 64348acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, max_num_points, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, CEED_VECTOR_NONE, q_vecs[i])); 64448acf710SJeremy L Thompson break; 64548acf710SJeremy L Thompson } 646ecc797dfSJeremy L Thompson // Initialize full arrays for E-vectors and Q-vectors 647297a0f46SJeremy L Thompson if (e_vecs[i]) CeedCallBackend(CeedVectorSetValue(e_vecs[i], 0.0)); 648297a0f46SJeremy L Thompson if (eval_mode != CEED_EVAL_WEIGHT) CeedCallBackend(CeedVectorSetValue(q_vecs[i], 0.0)); 64948acf710SJeremy L Thompson } 65048acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 65148acf710SJeremy L Thompson } 65248acf710SJeremy L Thompson 65348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 65448acf710SJeremy L Thompson // Setup Operator 65548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 65648acf710SJeremy L Thompson static int CeedOperatorSetupAtPoints_Ref(CeedOperator op) { 65748acf710SJeremy L Thompson bool is_setup_done; 65848acf710SJeremy L Thompson CeedInt Q, num_input_fields, num_output_fields; 65948acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 66048acf710SJeremy L Thompson CeedQFunction qf; 66148acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 66248acf710SJeremy L Thompson CeedOperator_Ref *impl; 66348acf710SJeremy L Thompson 66448acf710SJeremy L Thompson CeedCallBackend(CeedOperatorIsSetupDone(op, &is_setup_done)); 66548acf710SJeremy L Thompson if (is_setup_done) return CEED_ERROR_SUCCESS; 66648acf710SJeremy L Thompson 66748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 66848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 66948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumQuadraturePoints(op, &Q)); 67048acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionIsIdentity(qf, &impl->is_identity_qf)); 67148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 67248acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 67348acf710SJeremy L Thompson 67448acf710SJeremy L Thompson // Allocate 67548acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(num_input_fields + num_output_fields, &impl->e_vecs_full)); 67648acf710SJeremy L Thompson 67748acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->input_states)); 67848acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_in)); 67948acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->e_vecs_out)); 68048acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_in)); 68148acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(CEED_FIELD_MAX, &impl->q_vecs_out)); 68248acf710SJeremy L Thompson 68348acf710SJeremy L Thompson impl->num_inputs = num_input_fields; 68448acf710SJeremy L Thompson impl->num_outputs = num_output_fields; 68548acf710SJeremy L Thompson 68648acf710SJeremy L Thompson // Set up infield and outfield pointer arrays 68748acf710SJeremy L Thompson // Infields 68848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, true, impl->e_vecs_full, impl->e_vecs_in, impl->q_vecs_in, 0, num_input_fields, Q)); 68948acf710SJeremy L Thompson // Outfields 69048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupFieldsAtPoints_Ref(qf, op, false, impl->e_vecs_full, impl->e_vecs_out, impl->q_vecs_out, num_input_fields, 69148acf710SJeremy L Thompson num_output_fields, Q)); 69248acf710SJeremy L Thompson 69348acf710SJeremy L Thompson // Identity QFunctions 69448acf710SJeremy L Thompson if (impl->is_identity_qf) { 69548acf710SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->q_vecs_out[0])); 69638e83183SJeremy L Thompson CeedCallBackend(CeedVectorReferenceCopy(impl->q_vecs_in[0], &impl->e_vecs_out[0])); 69748acf710SJeremy L Thompson } 69848acf710SJeremy L Thompson 69948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetSetupDone(op)); 70048acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 70148acf710SJeremy L Thompson } 70248acf710SJeremy L Thompson 70348acf710SJeremy L Thompson //------------------------------------------------------------------------------ 70448acf710SJeremy L Thompson // Input Basis Action 70548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 70648acf710SJeremy L Thompson static inline int CeedOperatorInputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_input_fields, 70748acf710SJeremy L Thompson CeedOperatorField *op_input_fields, CeedInt num_input_fields, CeedVector in_vec, 70848acf710SJeremy L Thompson CeedVector point_coords_elem, bool skip_active, CeedScalar *e_data[2 * CEED_FIELD_MAX], 70948acf710SJeremy L Thompson CeedOperator_Ref *impl, CeedRequest *request) { 71048acf710SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 71148acf710SJeremy L Thompson bool is_active_input = false; 71248acf710SJeremy L Thompson CeedInt elem_size, size, num_comp; 71348acf710SJeremy L Thompson CeedRestrictionType rstr_type; 71448acf710SJeremy L Thompson CeedEvalMode eval_mode; 71548acf710SJeremy L Thompson CeedVector vec; 71648acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 71748acf710SJeremy L Thompson CeedBasis basis; 71848acf710SJeremy L Thompson 71948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 72048acf710SJeremy L Thompson // Skip active input 72148acf710SJeremy L Thompson is_active_input = vec == CEED_VECTOR_ACTIVE; 72248acf710SJeremy L Thompson if (skip_active && is_active_input) continue; 72348acf710SJeremy L Thompson 72448acf710SJeremy L Thompson // Get elem_size, eval_mode, size 72548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 72648acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 72748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 72848acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 72948acf710SJeremy L Thompson // Restrict block active input 73048acf710SJeremy L Thompson if (is_active_input) { 73148acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 73248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 73348acf710SJeremy L Thompson } else { 73448acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_NOTRANSPOSE, in_vec, impl->e_vecs_in[i], request)); 73548acf710SJeremy L Thompson } 73648acf710SJeremy L Thompson } 73748acf710SJeremy L Thompson // Basis action 73848acf710SJeremy L Thompson switch (eval_mode) { 73948acf710SJeremy L Thompson case CEED_EVAL_NONE: 74048acf710SJeremy L Thompson if (!is_active_input) { 74148acf710SJeremy L Thompson CeedCallBackend(CeedVectorSetArray(impl->q_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][num_points_offset * size])); 74248acf710SJeremy L Thompson } 74348acf710SJeremy L Thompson break; 74448acf710SJeremy L Thompson // Note - these basis eval modes require FEM fields 74548acf710SJeremy L Thompson case CEED_EVAL_INTERP: 74648acf710SJeremy L Thompson case CEED_EVAL_GRAD: 74748acf710SJeremy L Thompson case CEED_EVAL_DIV: 74848acf710SJeremy L Thompson case CEED_EVAL_CURL: 74948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 75048acf710SJeremy L Thompson if (!is_active_input) { 75148acf710SJeremy L Thompson CeedCallBackend(CeedBasisGetNumComponents(basis, &num_comp)); 75248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size)); 75381670346SSebastian Grimberg CeedCallBackend(CeedVectorSetArray(impl->e_vecs_in[i], CEED_MEM_HOST, CEED_USE_POINTER, &e_data[i][(CeedSize)e * elem_size * num_comp])); 75448acf710SJeremy L Thompson } 75548acf710SJeremy L Thompson CeedCallBackend( 75648acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, num_points, CEED_NOTRANSPOSE, eval_mode, point_coords_elem, impl->e_vecs_in[i], impl->q_vecs_in[i])); 75748acf710SJeremy L Thompson break; 75848acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: 75948acf710SJeremy L Thompson break; // No action 76048acf710SJeremy L Thompson } 76148acf710SJeremy L Thompson } 76248acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 76348acf710SJeremy L Thompson } 76448acf710SJeremy L Thompson 76548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 76648acf710SJeremy L Thompson // Output Basis Action 76748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 76848acf710SJeremy L Thompson static inline int CeedOperatorOutputBasisAtPoints_Ref(CeedInt e, CeedInt num_points_offset, CeedInt num_points, CeedQFunctionField *qf_output_fields, 76948acf710SJeremy L Thompson CeedOperatorField *op_output_fields, CeedInt num_input_fields, CeedInt num_output_fields, 77048acf710SJeremy L Thompson CeedOperator op, CeedVector out_vec, CeedVector point_coords_elem, CeedOperator_Ref *impl, 77148acf710SJeremy L Thompson CeedRequest *request) { 77248acf710SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 77348acf710SJeremy L Thompson CeedRestrictionType rstr_type; 77448acf710SJeremy L Thompson CeedEvalMode eval_mode; 77548acf710SJeremy L Thompson CeedVector vec; 77648acf710SJeremy L Thompson CeedElemRestriction elem_rstr; 77748acf710SJeremy L Thompson CeedBasis basis; 77848acf710SJeremy L Thompson 77948acf710SJeremy L Thompson // Get elem_size, eval_mode, size 78048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 78148acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 78248acf710SJeremy L Thompson // Basis action 78348acf710SJeremy L Thompson switch (eval_mode) { 78448acf710SJeremy L Thompson case CEED_EVAL_NONE: 78548acf710SJeremy L Thompson break; // No action 78648acf710SJeremy L Thompson case CEED_EVAL_INTERP: 78748acf710SJeremy L Thompson case CEED_EVAL_GRAD: 78848acf710SJeremy L Thompson case CEED_EVAL_DIV: 78948acf710SJeremy L Thompson case CEED_EVAL_CURL: 79048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 79148acf710SJeremy L Thompson CeedCallBackend( 79248acf710SJeremy L Thompson CeedBasisApplyAtPoints(basis, num_points, CEED_TRANSPOSE, eval_mode, point_coords_elem, impl->q_vecs_out[i], impl->e_vecs_out[i])); 79348acf710SJeremy L Thompson break; 79448acf710SJeremy L Thompson // LCOV_EXCL_START 79548acf710SJeremy L Thompson case CEED_EVAL_WEIGHT: { 7966e536b99SJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 79748acf710SJeremy L Thompson // LCOV_EXCL_STOP 79848acf710SJeremy L Thompson } 79948acf710SJeremy L Thompson } 80048acf710SJeremy L Thompson // Restrict output block 80148acf710SJeremy L Thompson // Get output vector 80248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 80348acf710SJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 80448acf710SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) vec = out_vec; 80548acf710SJeremy L Thompson // Restrict 80648acf710SJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 80748acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 80848acf710SJeremy L Thompson } else { 80948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], vec, request)); 81048acf710SJeremy L Thompson } 81148acf710SJeremy L Thompson } 81248acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 81348acf710SJeremy L Thompson } 81448acf710SJeremy L Thompson 81548acf710SJeremy L Thompson //------------------------------------------------------------------------------ 81648acf710SJeremy L Thompson // Operator Apply 81748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 81848acf710SJeremy L Thompson static int CeedOperatorApplyAddAtPoints_Ref(CeedOperator op, CeedVector in_vec, CeedVector out_vec, CeedRequest *request) { 81948acf710SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem; 82048acf710SJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 82148acf710SJeremy L Thompson CeedVector point_coords = NULL; 82248acf710SJeremy L Thompson CeedElemRestriction rstr_points = NULL; 82348acf710SJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 82448acf710SJeremy L Thompson CeedQFunction qf; 82548acf710SJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 82648acf710SJeremy L Thompson CeedOperator_Ref *impl; 82748acf710SJeremy L Thompson 82848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 82948acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 83048acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 83148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 83248acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 83348acf710SJeremy L Thompson 83448acf710SJeremy L Thompson // Setup 83548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 83648acf710SJeremy L Thompson 83748acf710SJeremy L Thompson // Point coordinates 83848acf710SJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 83948acf710SJeremy L Thompson 84048acf710SJeremy L Thompson // Input Evecs and Restriction 8416cde1da6SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 84248acf710SJeremy L Thompson 84348acf710SJeremy L Thompson // Loop through elements 84448acf710SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 84548acf710SJeremy L Thompson CeedInt num_points; 84648acf710SJeremy L Thompson 84748acf710SJeremy L Thompson // Setup points for element 84848acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 84948acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 85048acf710SJeremy L Thompson 85148acf710SJeremy L Thompson // Input basis apply 85248acf710SJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 85348acf710SJeremy L Thompson impl->point_coords_elem, false, e_data, impl, request)); 85448acf710SJeremy L Thompson 85548acf710SJeremy L Thompson // Q function 85648acf710SJeremy L Thompson if (!impl->is_identity_qf) { 85748acf710SJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 85848acf710SJeremy L Thompson } 85948acf710SJeremy L Thompson 86048acf710SJeremy L Thompson // Output basis apply and restriction 86148acf710SJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 86248acf710SJeremy L Thompson num_output_fields, op, out_vec, impl->point_coords_elem, impl, request)); 86348acf710SJeremy L Thompson 86448acf710SJeremy L Thompson num_points_offset += num_points; 86548acf710SJeremy L Thompson } 86648acf710SJeremy L Thompson 86748acf710SJeremy L Thompson // Restore input arrays 8686cde1da6SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 86948acf710SJeremy L Thompson 87048acf710SJeremy L Thompson // Cleanup point coordinates 87148acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 87248acf710SJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 87348acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 87448acf710SJeremy L Thompson } 87548acf710SJeremy L Thompson 87648acf710SJeremy L Thompson //------------------------------------------------------------------------------ 877e13f2367SZach Atkins // Core code for assembling linear QFunction 878e13f2367SZach Atkins //------------------------------------------------------------------------------ 879e13f2367SZach Atkins static inline int CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(CeedOperator op, bool build_objects, CeedVector *assembled, 880e13f2367SZach Atkins CeedElemRestriction *rstr, CeedRequest *request) { 881e13f2367SZach Atkins Ceed ceed; 882e13f2367SZach Atkins CeedSize q_size; 883e13f2367SZach Atkins CeedInt num_active_in, num_active_out, max_num_points, num_elem, num_input_fields, num_output_fields, num_points_offset = 0; 884e13f2367SZach Atkins CeedScalar *assembled_array, *e_data_full[2 * CEED_FIELD_MAX] = {NULL}; 885e13f2367SZach Atkins CeedVector *active_in, point_coords = NULL; 886e13f2367SZach Atkins CeedQFunctionField *qf_input_fields, *qf_output_fields; 887e13f2367SZach Atkins CeedQFunction qf; 888e13f2367SZach Atkins CeedOperatorField *op_input_fields, *op_output_fields; 889e13f2367SZach Atkins CeedOperator_Ref *impl; 890e13f2367SZach Atkins CeedElemRestriction rstr_points = NULL; 891e13f2367SZach Atkins 892e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 893e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetData(op, &impl)); 894e13f2367SZach Atkins active_in = impl->qf_active_in; 895e13f2367SZach Atkins num_active_in = impl->num_active_in, num_active_out = impl->num_active_out; 896e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 897e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 898e13f2367SZach Atkins CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 899e13f2367SZach Atkins CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 900e13f2367SZach Atkins 901e13f2367SZach Atkins // Setup 902e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 903e13f2367SZach Atkins 904e13f2367SZach Atkins // Check for restriction only operator 905e13f2367SZach Atkins CeedCheck(!impl->is_identity_rstr_op, ceed, CEED_ERROR_BACKEND, "Assembling restriction only operators is not supported"); 906e13f2367SZach Atkins 907e13f2367SZach Atkins // Point coordinates 908e13f2367SZach Atkins CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 909e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetMaxPointsInElement(rstr_points, &max_num_points)); 910e13f2367SZach Atkins 911e13f2367SZach Atkins // Input Evecs and Restriction 912e13f2367SZach Atkins CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data_full, impl, request)); 913e13f2367SZach Atkins 914e13f2367SZach Atkins // Count number of active input fields 915e13f2367SZach Atkins if (!num_active_in) { 916e13f2367SZach Atkins for (CeedInt i = 0; i < num_input_fields; i++) { 917e13f2367SZach Atkins CeedScalar *q_vec_array; 918e13f2367SZach Atkins CeedInt field_size; 919e13f2367SZach Atkins CeedVector vec; 920e13f2367SZach Atkins 921e13f2367SZach Atkins // Get input vector 922e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 923e13f2367SZach Atkins // Check if active input 924e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 925e13f2367SZach Atkins // Check that all active inputs are nodal fields 926e13f2367SZach Atkins { 927e13f2367SZach Atkins CeedElemRestriction elem_rstr; 928e13f2367SZach Atkins bool is_at_points = false; 929e13f2367SZach Atkins 930e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 931637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 932e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 933e13f2367SZach Atkins } 934e13f2367SZach Atkins // Get size of active input 935e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &field_size)); 936e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(impl->q_vecs_in[i], 0.0)); 937e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArray(impl->q_vecs_in[i], CEED_MEM_HOST, &q_vec_array)); 938e13f2367SZach Atkins CeedCallBackend(CeedRealloc(num_active_in + field_size, &active_in)); 939e13f2367SZach Atkins for (CeedInt field = 0; field < field_size; field++) { 940e13f2367SZach Atkins q_size = (CeedSize)max_num_points; 941e13f2367SZach Atkins CeedCallBackend(CeedVectorCreate(ceed, q_size, &active_in[num_active_in + field])); 942e13f2367SZach Atkins CeedCallBackend(CeedVectorSetArray(active_in[num_active_in + field], CEED_MEM_HOST, CEED_USE_POINTER, &q_vec_array[field * q_size])); 943e13f2367SZach Atkins } 944e13f2367SZach Atkins num_active_in += field_size; 945e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArray(impl->q_vecs_in[i], &q_vec_array)); 946e13f2367SZach Atkins } 947e13f2367SZach Atkins } 948e13f2367SZach Atkins impl->num_active_in = num_active_in; 949e13f2367SZach Atkins impl->qf_active_in = active_in; 950e13f2367SZach Atkins } 951e13f2367SZach Atkins 952e13f2367SZach Atkins // Count number of active output fields 953e13f2367SZach Atkins if (!num_active_out) { 954e13f2367SZach Atkins for (CeedInt i = 0; i < num_output_fields; i++) { 955e13f2367SZach Atkins CeedVector vec; 956e13f2367SZach Atkins CeedInt field_size; 957e13f2367SZach Atkins 958e13f2367SZach Atkins // Get output vector 959e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[i], &vec)); 960e13f2367SZach Atkins // Check if active output 961e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 962e13f2367SZach Atkins // Check that all active inputs are nodal fields 963e13f2367SZach Atkins { 964e13f2367SZach Atkins CeedElemRestriction elem_rstr; 965e13f2367SZach Atkins bool is_at_points = false; 966e13f2367SZach Atkins 967e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 968637baffdSJeremy L Thompson CeedCallBackend(CeedElemRestrictionIsAtPoints(elem_rstr, &is_at_points)); 969e13f2367SZach Atkins CeedCheck(!is_at_points, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction with active input at points"); 970e13f2367SZach Atkins } 971e13f2367SZach Atkins // Get size of active output 972e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[i], &field_size)); 973e13f2367SZach Atkins num_active_out += field_size; 974e13f2367SZach Atkins } 975e13f2367SZach Atkins } 976e13f2367SZach Atkins impl->num_active_out = num_active_out; 977e13f2367SZach Atkins } 978e13f2367SZach Atkins 979e13f2367SZach Atkins // Check sizes 980e13f2367SZach Atkins CeedCheck(num_active_in > 0 && num_active_out > 0, ceed, CEED_ERROR_BACKEND, "Cannot assemble QFunction without active inputs and outputs"); 981e13f2367SZach Atkins 982e13f2367SZach Atkins // Build objects if needed 983e13f2367SZach Atkins if (build_objects) { 984e13f2367SZach Atkins CeedInt num_points_total; 985e13f2367SZach Atkins const CeedInt *offsets; 986e13f2367SZach Atkins 987e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPoints(rstr_points, &num_points_total)); 988e13f2367SZach Atkins 989e13f2367SZach Atkins // Create output restriction (at points) 990e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetOffsets(rstr_points, CEED_MEM_HOST, &offsets)); 991e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionCreateAtPoints(ceed, num_elem, num_points_total, num_active_in * num_active_out, 992e13f2367SZach Atkins num_active_in * num_active_out * num_points_total, CEED_MEM_HOST, CEED_COPY_VALUES, offsets, 993e13f2367SZach Atkins rstr)); 994e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionRestoreOffsets(rstr_points, &offsets)); 995e13f2367SZach Atkins 996e13f2367SZach Atkins // Create assembled vector 997e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionCreateVector(*rstr, assembled, NULL)); 998e13f2367SZach Atkins } 999e13f2367SZach Atkins // Clear output vector 1000e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(*assembled, 0.0)); 1001e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArray(*assembled, CEED_MEM_HOST, &assembled_array)); 1002e13f2367SZach Atkins 1003e13f2367SZach Atkins // Loop through elements 1004e13f2367SZach Atkins for (CeedInt e = 0; e < num_elem; e++) { 1005e13f2367SZach Atkins CeedInt num_points; 1006e13f2367SZach Atkins 1007e13f2367SZach Atkins // Setup points for element 1008e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1009e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1010e13f2367SZach Atkins 1011e13f2367SZach Atkins // Input basis apply 1012e13f2367SZach Atkins CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, NULL, 1013e13f2367SZach Atkins impl->point_coords_elem, true, e_data_full, impl, request)); 1014e13f2367SZach Atkins 1015e13f2367SZach Atkins // Assemble QFunction 1016e13f2367SZach Atkins for (CeedInt in = 0; in < num_active_in; in++) { 1017e13f2367SZach Atkins // Set Inputs 1018e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(active_in[in], 1.0)); 1019e13f2367SZach Atkins if (num_active_in > 1) { 1020e13f2367SZach Atkins CeedCallBackend(CeedVectorSetValue(active_in[(in + num_active_in - 1) % num_active_in], 0.0)); 1021e13f2367SZach Atkins } 1022e13f2367SZach Atkins if (!impl->is_identity_qf) { 1023e13f2367SZach Atkins // Set Outputs 1024e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1025e13f2367SZach Atkins CeedVector vec; 1026e13f2367SZach Atkins CeedInt field_size; 1027e13f2367SZach Atkins 1028e13f2367SZach Atkins // Get output vector 1029e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1030e13f2367SZach Atkins // Check if active output 1031e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE) { 1032e13f2367SZach Atkins CeedCallBackend(CeedVectorSetArray(impl->q_vecs_out[out], CEED_MEM_HOST, CEED_USE_POINTER, assembled_array)); 1033e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[out], &field_size)); 1034e13f2367SZach Atkins assembled_array += field_size * num_points; // Advance the pointer by the size of the output 1035e13f2367SZach Atkins } 1036e13f2367SZach Atkins } 1037e13f2367SZach Atkins // Apply QFunction 1038e13f2367SZach Atkins CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1039e13f2367SZach Atkins } else { 1040e13f2367SZach Atkins const CeedScalar *q_vec_array; 1041e13f2367SZach Atkins CeedInt field_size; 1042e13f2367SZach Atkins 1043e13f2367SZach Atkins // Copy Identity Outputs 1044e13f2367SZach Atkins CeedCallBackend(CeedQFunctionFieldGetSize(qf_output_fields[0], &field_size)); 1045e13f2367SZach Atkins CeedCallBackend(CeedVectorGetArrayRead(impl->q_vecs_out[0], CEED_MEM_HOST, &q_vec_array)); 1046e13f2367SZach Atkins for (CeedInt i = 0; i < field_size * num_points; i++) assembled_array[i] = q_vec_array[i]; 1047e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArrayRead(impl->q_vecs_out[0], &q_vec_array)); 1048e13f2367SZach Atkins assembled_array += field_size * num_points; 1049e13f2367SZach Atkins } 1050e13f2367SZach Atkins } 1051e13f2367SZach Atkins num_points_offset += num_points; 1052e13f2367SZach Atkins } 1053e13f2367SZach Atkins 1054e13f2367SZach Atkins // Un-set output Qvecs to prevent accidental overwrite of Assembled 1055e13f2367SZach Atkins if (!impl->is_identity_qf) { 1056e13f2367SZach Atkins for (CeedInt out = 0; out < num_output_fields; out++) { 1057e13f2367SZach Atkins CeedVector vec; 1058e13f2367SZach Atkins 1059e13f2367SZach Atkins // Get output vector 1060e13f2367SZach Atkins CeedCallBackend(CeedOperatorFieldGetVector(op_output_fields[out], &vec)); 1061e13f2367SZach Atkins // Check if active output 1062e13f2367SZach Atkins if (vec == CEED_VECTOR_ACTIVE && num_elem > 0) { 1063e13f2367SZach Atkins CeedCallBackend(CeedVectorTakeArray(impl->q_vecs_out[out], CEED_MEM_HOST, NULL)); 1064e13f2367SZach Atkins } 1065e13f2367SZach Atkins } 1066e13f2367SZach Atkins } 1067e13f2367SZach Atkins 1068e13f2367SZach Atkins // Restore input arrays 1069e13f2367SZach Atkins CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data_full, impl)); 1070e13f2367SZach Atkins 1071e13f2367SZach Atkins // Restore output 1072e13f2367SZach Atkins CeedCallBackend(CeedVectorRestoreArray(*assembled, &assembled_array)); 1073e13f2367SZach Atkins 1074e13f2367SZach Atkins // Cleanup 1075e13f2367SZach Atkins CeedCallBackend(CeedVectorDestroy(&point_coords)); 1076e13f2367SZach Atkins CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1077e13f2367SZach Atkins return CEED_ERROR_SUCCESS; 1078e13f2367SZach Atkins } 1079e13f2367SZach Atkins 1080e13f2367SZach Atkins //------------------------------------------------------------------------------ 1081e13f2367SZach Atkins // Assemble Linear QFunction 1082e13f2367SZach Atkins //------------------------------------------------------------------------------ 1083e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPoints_Ref(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1084e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, true, assembled, rstr, request); 1085e13f2367SZach Atkins } 1086e13f2367SZach Atkins 1087e13f2367SZach Atkins //------------------------------------------------------------------------------ 1088e13f2367SZach Atkins // Update Assembled Linear QFunction 1089e13f2367SZach Atkins //------------------------------------------------------------------------------ 1090e13f2367SZach Atkins static int CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref(CeedOperator op, CeedVector assembled, CeedElemRestriction rstr, 1091e13f2367SZach Atkins CeedRequest *request) { 1092e13f2367SZach Atkins return CeedOperatorLinearAssembleQFunctionAtPointsCore_Ref(op, false, &assembled, &rstr, request); 1093e13f2367SZach Atkins } 1094e13f2367SZach Atkins 1095e13f2367SZach Atkins //------------------------------------------------------------------------------ 1096fb133d4bSJeremy L Thompson // Assemble Operator Diagonal AtPoints 1097e13f2367SZach Atkins //------------------------------------------------------------------------------ 1098fb133d4bSJeremy L Thompson static int CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1099fb133d4bSJeremy L Thompson bool is_active_at_points = true; 1100*831877b7SJeremy L Thompson CeedInt num_points_offset = 0, num_input_fields, num_output_fields, num_elem, elem_size_active = 1, num_comp_active = 1; 1101fb133d4bSJeremy L Thompson CeedScalar *e_data[2 * CEED_FIELD_MAX] = {0}; 1102fb133d4bSJeremy L Thompson Ceed ceed; 1103fb133d4bSJeremy L Thompson CeedVector point_coords = NULL, in_vec, out_vec; 1104fb133d4bSJeremy L Thompson CeedElemRestriction rstr_points = NULL; 1105fb133d4bSJeremy L Thompson CeedQFunctionField *qf_input_fields, *qf_output_fields; 1106fb133d4bSJeremy L Thompson CeedQFunction qf; 1107fb133d4bSJeremy L Thompson CeedOperatorField *op_input_fields, *op_output_fields; 1108fb133d4bSJeremy L Thompson CeedOperator_Ref *impl; 1109fb133d4bSJeremy L Thompson 1110fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 1111fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetNumElements(op, &num_elem)); 1112fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetQFunction(op, &qf)); 1113fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetFields(op, &num_input_fields, &op_input_fields, &num_output_fields, &op_output_fields)); 1114fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionGetFields(qf, NULL, &qf_input_fields, NULL, &qf_output_fields)); 1115fb133d4bSJeremy L Thompson 1116fb133d4bSJeremy L Thompson // Setup 1117fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupAtPoints_Ref(op)); 1118fb133d4bSJeremy L Thompson 1119fb133d4bSJeremy L Thompson // Ceed 1120fb133d4bSJeremy L Thompson { 1121fb133d4bSJeremy L Thompson Ceed ceed_parent; 1122fb133d4bSJeremy L Thompson 1123fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 1124fb133d4bSJeremy L Thompson CeedCallBackend(CeedGetParent(ceed, &ceed_parent)); 1125fb133d4bSJeremy L Thompson if (ceed_parent) ceed = ceed_parent; 1126fb133d4bSJeremy L Thompson } 1127fb133d4bSJeremy L Thompson 1128fb133d4bSJeremy L Thompson // Point coordinates 1129fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorAtPointsGetPoints(op, &rstr_points, &point_coords)); 1130fb133d4bSJeremy L Thompson 1131fb133d4bSJeremy L Thompson // Input and output vectors 1132fb133d4bSJeremy L Thompson { 1133fb133d4bSJeremy L Thompson CeedSize input_size, output_size; 1134fb133d4bSJeremy L Thompson 1135fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1136fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, input_size, &in_vec)); 1137fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorCreate(ceed, output_size, &out_vec)); 1138fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(out_vec, 0.0)); 1139fb133d4bSJeremy L Thompson } 1140fb133d4bSJeremy L Thompson 1141fb133d4bSJeremy L Thompson // Input Evecs and Restriction 1142fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorSetupInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, NULL, true, e_data, impl, request)); 1143fb133d4bSJeremy L Thompson 1144fb133d4bSJeremy L Thompson // Check if active field is at points 1145fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1146fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1147fb133d4bSJeremy L Thompson CeedVector vec; 1148fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1149fb133d4bSJeremy L Thompson 1150fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1151fb133d4bSJeremy L Thompson // Skip non-active input 1152fb133d4bSJeremy L Thompson if (vec != CEED_VECTOR_ACTIVE) continue; 1153fb133d4bSJeremy L Thompson 1154fb133d4bSJeremy L Thompson // Get active restriction type 1155fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1156fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1157fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumComponents(elem_rstr, &num_comp_active)); 1158fb133d4bSJeremy L Thompson is_active_at_points = rstr_type == CEED_RESTRICTION_POINTS; 1159fb133d4bSJeremy L Thompson if (!is_active_at_points) CeedCallBackend(CeedElemRestrictionGetElementSize(elem_rstr, &elem_size_active)); 1160fb133d4bSJeremy L Thompson } 1161fb133d4bSJeremy L Thompson 1162fb133d4bSJeremy L Thompson // Loop through elements 1163fb133d4bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 1164fb133d4bSJeremy L Thompson CeedInt num_points, e_vec_size = 0; 1165fb133d4bSJeremy L Thompson 1166fb133d4bSJeremy L Thompson // Setup points for element 1167fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(rstr_points, e, CEED_NOTRANSPOSE, point_coords, impl->point_coords_elem, request)); 1168fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetNumPointsInElement(rstr_points, e, &num_points)); 1169fb133d4bSJeremy L Thompson 1170fb133d4bSJeremy L Thompson // Input basis apply for non-active bases 1171fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorInputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_input_fields, op_input_fields, num_input_fields, in_vec, 1172fb133d4bSJeremy L Thompson impl->point_coords_elem, true, e_data, impl, request)); 1173fb133d4bSJeremy L Thompson 1174fb133d4bSJeremy L Thompson // Loop over points on element 1175fb133d4bSJeremy L Thompson e_vec_size = (is_active_at_points ? num_points : elem_size_active) * num_comp_active; 1176fb133d4bSJeremy L Thompson for (CeedInt s = 0; s < e_vec_size; s++) { 1177fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1178fb133d4bSJeremy L Thompson bool is_active_input = false; 1179fb133d4bSJeremy L Thompson CeedInt size; 1180fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1181fb133d4bSJeremy L Thompson CeedEvalMode eval_mode; 1182fb133d4bSJeremy L Thompson CeedVector vec; 1183fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1184fb133d4bSJeremy L Thompson CeedBasis basis; 1185fb133d4bSJeremy L Thompson 1186fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1187fb133d4bSJeremy L Thompson // Skip non-active input 1188fb133d4bSJeremy L Thompson is_active_input = vec == CEED_VECTOR_ACTIVE; 1189fb133d4bSJeremy L Thompson if (!is_active_input) continue; 1190fb133d4bSJeremy L Thompson 1191fb133d4bSJeremy L Thompson // Get elem_size, eval_mode, size 1192fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_input_fields[i], &elem_rstr)); 1193fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1194fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_input_fields[i], &eval_mode)); 1195fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetSize(qf_input_fields[i], &size)); 1196fb133d4bSJeremy L Thompson // Update unit vector 1197fb133d4bSJeremy L Thompson { 1198fb133d4bSJeremy L Thompson CeedScalar *array; 1199fb133d4bSJeremy L Thompson 1200fb133d4bSJeremy L Thompson if (s == 0) CeedCallBackend(CeedVectorSetValue(impl->e_vecs_in[i], 0.0)); 1201fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_in[i], CEED_MEM_HOST, &array)); 1202fb133d4bSJeremy L Thompson array[s] = 1.0; 1203fb133d4bSJeremy L Thompson if (s > 0) array[s - 1] = 0.0; 1204fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_in[i], &array)); 1205fb133d4bSJeremy L Thompson } 1206fb133d4bSJeremy L Thompson // Basis action 1207fb133d4bSJeremy L Thompson switch (eval_mode) { 1208fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1209fb133d4bSJeremy L Thompson break; 1210fb133d4bSJeremy L Thompson // Note - these basis eval modes require FEM fields 1211fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1212fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1213fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1214fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 1215fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_input_fields[i], &basis)); 1216fb133d4bSJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, num_points, CEED_NOTRANSPOSE, eval_mode, impl->point_coords_elem, impl->e_vecs_in[i], 1217fb133d4bSJeremy L Thompson impl->q_vecs_in[i])); 1218fb133d4bSJeremy L Thompson break; 1219fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: 1220fb133d4bSJeremy L Thompson break; // No action 1221fb133d4bSJeremy L Thompson } 1222fb133d4bSJeremy L Thompson } 1223fb133d4bSJeremy L Thompson 1224fb133d4bSJeremy L Thompson // -- Q function 1225fb133d4bSJeremy L Thompson if (!impl->is_identity_qf) { 1226fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionApply(qf, num_points, impl->q_vecs_in, impl->q_vecs_out)); 1227fb133d4bSJeremy L Thompson } 1228fb133d4bSJeremy L Thompson 1229fb133d4bSJeremy L Thompson // -- Output basis apply and restriction 1230fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorOutputBasisAtPoints_Ref(e, num_points_offset, num_points, qf_output_fields, op_output_fields, num_input_fields, 1231fb133d4bSJeremy L Thompson num_output_fields, op, out_vec, impl->point_coords_elem, impl, request)); 1232fb133d4bSJeremy L Thompson 1233fb133d4bSJeremy L Thompson // -- Grab diagonal value 1234fb133d4bSJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1235fb133d4bSJeremy L Thompson bool is_active_input = false; 1236fb133d4bSJeremy L Thompson CeedRestrictionType rstr_type; 1237fb133d4bSJeremy L Thompson CeedEvalMode eval_mode; 1238fb133d4bSJeremy L Thompson CeedVector vec; 1239fb133d4bSJeremy L Thompson CeedElemRestriction elem_rstr; 1240fb133d4bSJeremy L Thompson CeedBasis basis; 1241fb133d4bSJeremy L Thompson 1242fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetVector(op_input_fields[i], &vec)); 1243fb133d4bSJeremy L Thompson // ---- Skip non-active input 1244fb133d4bSJeremy L Thompson is_active_input = vec == CEED_VECTOR_ACTIVE; 1245fb133d4bSJeremy L Thompson if (!is_active_input) continue; 1246fb133d4bSJeremy L Thompson 1247fb133d4bSJeremy L Thompson // ---- Get elem_size, eval_mode, size 1248fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetElemRestriction(op_output_fields[i], &elem_rstr)); 1249fb133d4bSJeremy L Thompson CeedCallBackend(CeedQFunctionFieldGetEvalMode(qf_output_fields[i], &eval_mode)); 1250fb133d4bSJeremy L Thompson // ---- Basis action 1251fb133d4bSJeremy L Thompson switch (eval_mode) { 1252fb133d4bSJeremy L Thompson case CEED_EVAL_NONE: 1253fb133d4bSJeremy L Thompson break; // No action 1254fb133d4bSJeremy L Thompson case CEED_EVAL_INTERP: 1255fb133d4bSJeremy L Thompson case CEED_EVAL_GRAD: 1256fb133d4bSJeremy L Thompson case CEED_EVAL_DIV: 1257fb133d4bSJeremy L Thompson case CEED_EVAL_CURL: 1258fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorFieldGetBasis(op_output_fields[i], &basis)); 1259fb133d4bSJeremy L Thompson CeedCallBackend(CeedBasisApplyAtPoints(basis, num_points, CEED_TRANSPOSE, eval_mode, impl->point_coords_elem, impl->q_vecs_out[i], 1260fb133d4bSJeremy L Thompson impl->e_vecs_out[i])); 1261fb133d4bSJeremy L Thompson break; 1262fb133d4bSJeremy L Thompson // LCOV_EXCL_START 1263fb133d4bSJeremy L Thompson case CEED_EVAL_WEIGHT: { 1264fb133d4bSJeremy L Thompson return CeedError(CeedOperatorReturnCeed(op), CEED_ERROR_BACKEND, "CEED_EVAL_WEIGHT cannot be an output evaluation mode"); 1265fb133d4bSJeremy L Thompson // LCOV_EXCL_STOP 1266fb133d4bSJeremy L Thompson } 1267fb133d4bSJeremy L Thompson } 1268fb133d4bSJeremy L Thompson // ---- Update output vector 1269fb133d4bSJeremy L Thompson { 1270fb133d4bSJeremy L Thompson CeedScalar *array, current_value = 0.0; 1271fb133d4bSJeremy L Thompson 1272fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[i], CEED_MEM_HOST, &array)); 1273fb133d4bSJeremy L Thompson current_value = array[s]; 1274fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[i], &array)); 1275fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorSetValue(impl->e_vecs_out[i], 0.0)); 1276fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorGetArray(impl->e_vecs_out[i], CEED_MEM_HOST, &array)); 1277fb133d4bSJeremy L Thompson array[s] = current_value; 1278fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorRestoreArray(impl->e_vecs_out[i], &array)); 1279fb133d4bSJeremy L Thompson } 1280fb133d4bSJeremy L Thompson // ---- Restrict output block 1281fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionGetType(elem_rstr, &rstr_type)); 1282fb133d4bSJeremy L Thompson if (rstr_type == CEED_RESTRICTION_POINTS) { 1283fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyAtPointsInElement(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], assembled, request)); 1284fb133d4bSJeremy L Thompson } else { 1285fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionApplyBlock(elem_rstr, e, CEED_TRANSPOSE, impl->e_vecs_out[i], assembled, request)); 1286fb133d4bSJeremy L Thompson } 1287fb133d4bSJeremy L Thompson } 1288fb133d4bSJeremy L Thompson } 1289fb133d4bSJeremy L Thompson num_points_offset += num_points; 1290fb133d4bSJeremy L Thompson } 1291fb133d4bSJeremy L Thompson 1292fb133d4bSJeremy L Thompson // Restore input arrays 1293fb133d4bSJeremy L Thompson CeedCallBackend(CeedOperatorRestoreInputs_Ref(num_input_fields, qf_input_fields, op_input_fields, true, e_data, impl)); 1294fb133d4bSJeremy L Thompson 1295fb133d4bSJeremy L Thompson // Cleanup 1296fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&in_vec)); 1297fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&out_vec)); 1298fb133d4bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&point_coords)); 1299fb133d4bSJeremy L Thompson CeedCallBackend(CeedElemRestrictionDestroy(&rstr_points)); 1300fb133d4bSJeremy L Thompson return CEED_ERROR_SUCCESS; 1301fb133d4bSJeremy L Thompson } 1302e13f2367SZach Atkins 1303e13f2367SZach Atkins //------------------------------------------------------------------------------ 1304f10650afSjeremylt // Operator Destroy 1305f10650afSjeremylt //------------------------------------------------------------------------------ 1306f10650afSjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) { 1307f10650afSjeremylt CeedOperator_Ref *impl; 1308f10650afSjeremylt 1309ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetData(op, &impl)); 13104fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs + impl->num_outputs; i++) { 13112b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_full[i])); 1312f10650afSjeremylt } 13132b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_full)); 13142b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->input_states)); 1315f10650afSjeremylt 13164fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_inputs; i++) { 13172b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_in[i])); 13182b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_in[i])); 1319f10650afSjeremylt } 13202b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_in)); 13212b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_in)); 1322f10650afSjeremylt 13234fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_outputs; i++) { 13242b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->e_vecs_out[i])); 13252b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->q_vecs_out[i])); 1326f10650afSjeremylt } 13272b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->e_vecs_out)); 13282b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->q_vecs_out)); 132948acf710SJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->point_coords_elem)); 1330f10650afSjeremylt 1331bb219a0fSJeremy L Thompson // QFunction assembly 13324fc1f125SJeremy L Thompson for (CeedInt i = 0; i < impl->num_active_in; i++) { 13332b730f8bSJeremy L Thompson CeedCallBackend(CeedVectorDestroy(&impl->qf_active_in[i])); 1334bb219a0fSJeremy L Thompson } 13352b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl->qf_active_in)); 1336bb219a0fSJeremy L Thompson 13372b730f8bSJeremy L Thompson CeedCallBackend(CeedFree(&impl)); 1338e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 1339f10650afSjeremylt } 1340f10650afSjeremylt 1341f10650afSjeremylt //------------------------------------------------------------------------------ 1342713f43c3Sjeremylt // Operator Create 1343f10650afSjeremylt //------------------------------------------------------------------------------ 134421617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) { 1345fe2413ffSjeremylt Ceed ceed; 13464ce2993fSjeremylt CeedOperator_Ref *impl; 134721617c04Sjeremylt 1348ad70ee2cSJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 13492b730f8bSJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 13502b730f8bSJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 13512b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunction_Ref)); 13522b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionUpdate_Ref)); 13532b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAdd_Ref)); 13542b730f8bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 1355e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 135621617c04Sjeremylt } 13572a86cc9dSSebastian Grimberg 13582a86cc9dSSebastian Grimberg //------------------------------------------------------------------------------ 135948acf710SJeremy L Thompson // Operator Create At Points 136048acf710SJeremy L Thompson //------------------------------------------------------------------------------ 136148acf710SJeremy L Thompson int CeedOperatorCreateAtPoints_Ref(CeedOperator op) { 136248acf710SJeremy L Thompson Ceed ceed; 136348acf710SJeremy L Thompson CeedOperator_Ref *impl; 136448acf710SJeremy L Thompson 136548acf710SJeremy L Thompson CeedCallBackend(CeedOperatorGetCeed(op, &ceed)); 136648acf710SJeremy L Thompson CeedCallBackend(CeedCalloc(1, &impl)); 136748acf710SJeremy L Thompson CeedCallBackend(CeedOperatorSetData(op, impl)); 1368e13f2367SZach Atkins CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunction", CeedOperatorLinearAssembleQFunctionAtPoints_Ref)); 1369e13f2367SZach Atkins CeedCallBackend( 1370e13f2367SZach Atkins CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleQFunctionUpdate", CeedOperatorLinearAssembleQFunctionAtPointsUpdate_Ref)); 1371fb133d4bSJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "LinearAssembleAddDiagonal", CeedOperatorLinearAssembleAddDiagonalAtPoints_Ref)); 137248acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "ApplyAdd", CeedOperatorApplyAddAtPoints_Ref)); 137348acf710SJeremy L Thompson CeedCallBackend(CeedSetBackendFunction(ceed, "Operator", op, "Destroy", CeedOperatorDestroy_Ref)); 137448acf710SJeremy L Thompson return CEED_ERROR_SUCCESS; 137548acf710SJeremy L Thompson } 137648acf710SJeremy L Thompson 137748acf710SJeremy L Thompson //------------------------------------------------------------------------------ 1378