13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 82b730f8bSJeremy L Thompson #include <ceed-impl.h> 949aac155SJeremy L Thompson #include <ceed.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 11c85e8640SSebastian Grimberg #include <assert.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 449e77b9c8SJeremy L Thompson char *source_path_with_name = ""; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 119437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 123437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127805fe78eSJeremy L Thompson if (op_fallback->num_qpts == 0) { 1282b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 129805fe78eSJeremy L Thompson } 1309e77b9c8SJeremy L Thompson // Cleanup 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1332b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 134805fe78eSJeremy L Thompson } 1352b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1362b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 137805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 138eaf62fffSJeremy L Thompson 139eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 140eaf62fffSJeremy L Thompson } 141eaf62fffSJeremy L Thompson 142eaf62fffSJeremy L Thompson /** 143ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 144d04bbc78SJeremy L Thompson 145d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 146d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 147d04bbc78SJeremy L Thompson 148d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 149d04bbc78SJeremy L Thompson 150d04bbc78SJeremy L Thompson @ref Developer 151d04bbc78SJeremy L Thompson **/ 152d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 153d04bbc78SJeremy L Thompson // Create if needed 154d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1552b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 156d04bbc78SJeremy L Thompson } 157d04bbc78SJeremy L Thompson if (op->op_fallback) { 158d04bbc78SJeremy L Thompson bool is_debug; 159d04bbc78SJeremy L Thompson 1602b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 161d04bbc78SJeremy L Thompson if (is_debug) { 162b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 163d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 164d04bbc78SJeremy L Thompson 165b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 166b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 167b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1682b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 169d04bbc78SJeremy L Thompson 170b275c451SJeremy L Thompson CeedDebug256(ceed, 1, "---------- CeedOperator Fallback ----------\n"); 171b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1722b730f8bSJeremy L Thompson op->op_fallback); 173d04bbc78SJeremy L Thompson } 174d04bbc78SJeremy L Thompson } 175d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 176d04bbc78SJeremy L Thompson 177d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 178d04bbc78SJeremy L Thompson } 179d04bbc78SJeremy L Thompson 180d04bbc78SJeremy L Thompson /** 181eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 182eaf62fffSJeremy L Thompson 183352a5e7cSSebastian Grimberg @param[in] basis CeedBasis from which to get the basis matrix 184eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 185eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 186eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 187eaf62fffSJeremy L Thompson 188eaf62fffSJeremy L Thompson @ref Developer 189eaf62fffSJeremy L Thompson **/ 190352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) { 191eaf62fffSJeremy L Thompson switch (eval_mode) { 192eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 193eaf62fffSJeremy L Thompson *basis_ptr = identity; 194eaf62fffSJeremy L Thompson break; 195eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 196352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetInterp(basis, basis_ptr)); 197eaf62fffSJeremy L Thompson break; 198eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 199352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetGrad(basis, basis_ptr)); 200352a5e7cSSebastian Grimberg break; 201352a5e7cSSebastian Grimberg case CEED_EVAL_DIV: 202352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDiv(basis, basis_ptr)); 203352a5e7cSSebastian Grimberg break; 204352a5e7cSSebastian Grimberg case CEED_EVAL_CURL: 205352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetCurl(basis, basis_ptr)); 206eaf62fffSJeremy L Thompson break; 207eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 208eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 209eaf62fffSJeremy L Thompson } 210ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 211352a5e7cSSebastian Grimberg 212352a5e7cSSebastian Grimberg return CEED_ERROR_SUCCESS; 213eaf62fffSJeremy L Thompson } 214eaf62fffSJeremy L Thompson 215eaf62fffSJeremy L Thompson /** 216eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 217eaf62fffSJeremy L Thompson 218eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 219ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 220eaf62fffSJeremy L Thompson 221eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 222eaf62fffSJeremy L Thompson 223eaf62fffSJeremy L Thompson @ref Developer 224eaf62fffSJeremy L Thompson **/ 2252b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 226eaf62fffSJeremy L Thompson Ceed ceed; 2272b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 228eaf62fffSJeremy L Thompson const CeedInt *offsets; 2292b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 230eaf62fffSJeremy L Thompson 231eaf62fffSJeremy L Thompson // Expand offsets 2327b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2337b63f5c6SJed Brown CeedSize l_size; 2342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2352b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2362b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2372b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2382b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 239eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2402b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2412b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 242eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 243eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 244eaf62fffSJeremy L Thompson } 245eaf62fffSJeremy L Thompson 246eaf62fffSJeremy L Thompson // Create new restriction 2472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2482b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 249eaf62fffSJeremy L Thompson 250eaf62fffSJeremy L Thompson // Cleanup 2512b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 252eaf62fffSJeremy L Thompson 253eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 254eaf62fffSJeremy L Thompson } 255eaf62fffSJeremy L Thompson 256eaf62fffSJeremy L Thompson /** 257eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 258eaf62fffSJeremy L Thompson 259eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 260ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 261eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 262eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 263eaf62fffSJeremy L Thompson 264eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 265eaf62fffSJeremy L Thompson 266eaf62fffSJeremy L Thompson @ref Developer 267eaf62fffSJeremy L Thompson **/ 2682b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 269eaf62fffSJeremy L Thompson Ceed ceed; 2702b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 271eaf62fffSJeremy L Thompson 272eaf62fffSJeremy L Thompson // Assemble QFunction 273eaf62fffSJeremy L Thompson CeedQFunction qf; 274437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 275eaf62fffSJeremy L Thompson CeedVector assembled_qf; 276437c7c90SJeremy L Thompson CeedElemRestriction assembled_elem_rstr; 277437c7c90SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 278eaf62fffSJeremy L Thompson CeedInt layout[3]; 279437c7c90SJeremy L Thompson 280437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 281437c7c90SJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 282437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 283437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout)); 284437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 285437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 286eaf62fffSJeremy L Thompson 287ed9e99e6SJeremy L Thompson // Get assembly data 288ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 289437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 290437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 291437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 292437c7c90SJeremy L Thompson CeedBasis *active_bases; 293437c7c90SJeremy L Thompson CeedElemRestriction *active_elem_rstrs; 294437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 295437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 296437c7c90SJeremy L Thompson &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components)); 297437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL)); 298437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs)); 299437c7c90SJeremy L Thompson 300437c7c90SJeremy L Thompson // Loop over all active bases 301437c7c90SJeremy L Thompson for (CeedInt b = 0; b < num_active_bases; b++) { 302eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 303437c7c90SJeremy L Thompson CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b]; 304437c7c90SJeremy L Thompson 305eaf62fffSJeremy L Thompson if (is_pointblock) { 306437c7c90SJeremy L Thompson CeedElemRestriction point_block_elem_rstr; 307437c7c90SJeremy L Thompson 308437c7c90SJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr)); 309437c7c90SJeremy L Thompson diag_elem_rstr = point_block_elem_rstr; 310eaf62fffSJeremy L Thompson } 311eaf62fffSJeremy L Thompson 312eaf62fffSJeremy L Thompson // Create diagonal vector 313eaf62fffSJeremy L Thompson CeedVector elem_diag; 314437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 315eaf62fffSJeremy L Thompson 316eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3179c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 318437c7c90SJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts, num_components; 319437c7c90SJeremy L Thompson 3202b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3212b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 322437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 323437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes)); 324437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components)); 325437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts)); 326ed9e99e6SJeremy L Thompson 327352a5e7cSSebastian Grimberg // Construct identity matrix for basis if required 328ed9e99e6SJeremy L Thompson bool has_eval_none = false; 329352a5e7cSSebastian Grimberg CeedScalar *identity = NULL; 330437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 331437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 332ed9e99e6SJeremy L Thompson } 333437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 334437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 335ed9e99e6SJeremy L Thompson } 336ed9e99e6SJeremy L Thompson if (has_eval_none) { 3372b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3382b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 339eaf62fffSJeremy L Thompson } 340352a5e7cSSebastian Grimberg 341eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 342eaf62fffSJeremy L Thompson // Each element 343eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 344eaf62fffSJeremy L Thompson // Each basis eval mode pair 345352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 346352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 347437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 348437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 349352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t); 350352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out)); 351352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 352352a5e7cSSebastian Grimberg if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 353352a5e7cSSebastian Grimberg else B_t = &B_t[(++d_out) * num_qpts * num_nodes]; 354352a5e7cSSebastian Grimberg } 355352a5e7cSSebastian Grimberg eval_mode_out_prev = eval_modes_out[b][e_out]; 356352a5e7cSSebastian Grimberg 357352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 358352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 359437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 360437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 361352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B); 362352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in)); 363352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 364352a5e7cSSebastian Grimberg if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 365352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 366352a5e7cSSebastian Grimberg } 367352a5e7cSSebastian Grimberg eval_mode_in_prev = eval_modes_in[b][e_in]; 368352a5e7cSSebastian Grimberg 369eaf62fffSJeremy L Thompson // Each component 370437c7c90SJeremy L Thompson for (CeedInt c_out = 0; c_out < num_components; c_out++) { 371437c7c90SJeremy L Thompson // Each qpt/node pair 3722b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 373eaf62fffSJeremy L Thompson if (is_pointblock) { 374eaf62fffSJeremy L Thompson // Point Block Diagonal 375437c7c90SJeremy L Thompson for (CeedInt c_in = 0; c_in < num_components; c_in++) { 376437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 377437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3782b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 379437c7c90SJeremy L Thompson elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] += 380437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 381eaf62fffSJeremy L Thompson } 3822b730f8bSJeremy L Thompson } 383eaf62fffSJeremy L Thompson } else { 384eaf62fffSJeremy L Thompson // Diagonal Only 385437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 386437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3872b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 388437c7c90SJeremy L Thompson elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 389eaf62fffSJeremy L Thompson } 390eaf62fffSJeremy L Thompson } 391eaf62fffSJeremy L Thompson } 392eaf62fffSJeremy L Thompson } 3932b730f8bSJeremy L Thompson } 3942b730f8bSJeremy L Thompson } 3952b730f8bSJeremy L Thompson } 3962b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 397eaf62fffSJeremy L Thompson 398eaf62fffSJeremy L Thompson // Assemble local operator diagonal 399*f30b1135SSebastian Grimberg CeedCall(CeedElemRestrictionApplyUnsigned(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 400eaf62fffSJeremy L Thompson 401eaf62fffSJeremy L Thompson // Cleanup 402437c7c90SJeremy L Thompson if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 4032b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 4042b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 405437c7c90SJeremy L Thompson } 406437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 407437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 408eaf62fffSJeremy L Thompson 409eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 410eaf62fffSJeremy L Thompson } 411eaf62fffSJeremy L Thompson 412eaf62fffSJeremy L Thompson /** 413eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 414eaf62fffSJeremy L Thompson 415eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 416ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 417eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 418eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 419eaf62fffSJeremy L Thompson 420eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 421eaf62fffSJeremy L Thompson 422eaf62fffSJeremy L Thompson @ref Developer 423eaf62fffSJeremy L Thompson **/ 4242b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 425eaf62fffSJeremy L Thompson CeedVector assembled) { 426eaf62fffSJeremy L Thompson CeedInt num_sub; 427eaf62fffSJeremy L Thompson CeedOperator *suboperators; 428c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 429c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 430eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4316aa95790SJeremy L Thompson if (is_pointblock) { 4322b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4336aa95790SJeremy L Thompson } else { 4342b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4356aa95790SJeremy L Thompson } 436eaf62fffSJeremy L Thompson } 437eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 438eaf62fffSJeremy L Thompson } 439eaf62fffSJeremy L Thompson 440eaf62fffSJeremy L Thompson /** 441eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 442eaf62fffSJeremy L Thompson 443eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 444eaf62fffSJeremy L Thompson 445*f30b1135SSebastian Grimberg Note: For operators using oriented element restrictions, entries in rows or cols may be negative indicating the assembled value at this nonzero should be negated 446*f30b1135SSebastian Grimberg 447eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 448eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 449eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 450eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 451eaf62fffSJeremy L Thompson 452eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 453eaf62fffSJeremy L Thompson 454eaf62fffSJeremy L Thompson @ref Developer 455eaf62fffSJeremy L Thompson **/ 4562b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 457f3d47e36SJeremy L Thompson Ceed ceed; 458f3d47e36SJeremy L Thompson bool is_composite; 459f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 460f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 461f3d47e36SJeremy L Thompson 4626574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 463eaf62fffSJeremy L Thompson 464c9366a6bSJeremy L Thompson CeedSize num_nodes; 4652b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 466eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4672b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 468e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4692b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4712b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 472eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4732b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 474eaf62fffSJeremy L Thompson 475eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 476eaf62fffSJeremy L Thompson 477eaf62fffSJeremy L Thompson // Determine elem_dof relation 478eaf62fffSJeremy L Thompson CeedVector index_vec; 4792b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 480eaf62fffSJeremy L Thompson CeedScalar *array; 4812b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 482ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4832b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 484eaf62fffSJeremy L Thompson CeedVector elem_dof; 4852b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4862b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4872b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 488eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4892b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4902b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 491eaf62fffSJeremy L Thompson 492eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 493eaf62fffSJeremy L Thompson CeedInt count = 0; 494ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 495ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 496ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 497ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 498ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 4992b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 5002b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 501eaf62fffSJeremy L Thompson 502eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 503eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 504eaf62fffSJeremy L Thompson 505eaf62fffSJeremy L Thompson rows[offset + count] = row; 506eaf62fffSJeremy L Thompson cols[offset + count] = col; 507eaf62fffSJeremy L Thompson count++; 508eaf62fffSJeremy L Thompson } 509eaf62fffSJeremy L Thompson } 510eaf62fffSJeremy L Thompson } 511eaf62fffSJeremy L Thompson } 512eaf62fffSJeremy L Thompson } 5136574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 5142b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5152b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 516eaf62fffSJeremy L Thompson 517eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 518eaf62fffSJeremy L Thompson } 519eaf62fffSJeremy L Thompson 520eaf62fffSJeremy L Thompson /** 521eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 522eaf62fffSJeremy L Thompson 523eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 524eaf62fffSJeremy L Thompson 525eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 526ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 527eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 528eaf62fffSJeremy L Thompson 529eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 530eaf62fffSJeremy L Thompson 531eaf62fffSJeremy L Thompson @ref Developer 532eaf62fffSJeremy L Thompson **/ 5332b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 534f3d47e36SJeremy L Thompson Ceed ceed; 535f3d47e36SJeremy L Thompson bool is_composite; 536f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 537f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 538f3d47e36SJeremy L Thompson 5396574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 540f3d47e36SJeremy L Thompson 541f3d47e36SJeremy L Thompson // Early exit for empty operator 542f3d47e36SJeremy L Thompson { 543f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 544f3d47e36SJeremy L Thompson 545f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 546f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 547f3d47e36SJeremy L Thompson } 548eaf62fffSJeremy L Thompson 549cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 550cefa2673SJeremy L Thompson // Backend version 5512b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 552cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 553cefa2673SJeremy L Thompson } else { 554cefa2673SJeremy L Thompson // Operator fallback 555cefa2673SJeremy L Thompson CeedOperator op_fallback; 556cefa2673SJeremy L Thompson 5572b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 558cefa2673SJeremy L Thompson if (op_fallback) { 5592b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 560cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 561cefa2673SJeremy L Thompson } 562cefa2673SJeremy L Thompson } 563cefa2673SJeremy L Thompson 564eaf62fffSJeremy L Thompson // Assemble QFunction 565eaf62fffSJeremy L Thompson CeedQFunction qf; 5662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 567eaf62fffSJeremy L Thompson CeedVector assembled_qf; 568eaf62fffSJeremy L Thompson CeedElemRestriction rstr_q; 5692b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5701f9221feSJeremy L Thompson CeedSize qf_length; 5712b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 572eaf62fffSJeremy L Thompson 5737e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 574eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 575eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5762b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 577eaf62fffSJeremy L Thompson 578ed9e99e6SJeremy L Thompson // Get assembly data 579ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5802b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 581437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 582437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 583437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out, 584437c7c90SJeremy L Thompson &eval_modes_out, NULL, NULL)); 585437c7c90SJeremy L Thompson CeedBasis *bases; 586437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL)); 587437c7c90SJeremy L Thompson CeedBasis basis_in = bases[0]; 588eaf62fffSJeremy L Thompson 5896574a04fSJeremy L Thompson CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases"); 5906574a04fSJeremy L Thompson CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 591eaf62fffSJeremy L Thompson 592ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 593eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5942b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5952b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5962b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 5972b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 5982b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 599eaf62fffSJeremy L Thompson 600eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 601eaf62fffSJeremy L Thompson 602eaf62fffSJeremy L Thompson // loop over elements and put in data structure 603eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6042b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 605eaf62fffSJeremy L Thompson 606eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6072b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6082b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 609eaf62fffSJeremy L Thompson 610eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 611437c7c90SJeremy L Thompson const CeedScalar **B_mats_in, **B_mats_out; 612437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out)); 613437c7c90SJeremy L Thompson const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0]; 614437c7c90SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]]; 615eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 61692ae7e47SJeremy L Thompson CeedInt count = 0; 617eaf62fffSJeremy L Thompson CeedScalar *vals; 61828ec399dSJeremy L Thompson CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals)); 619ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 620ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 621ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 622ed9e99e6SJeremy L Thompson // Compute B^T*D 623ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 624ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 625437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 626437c7c90SJeremy L Thompson const CeedInt btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in); 627067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 628437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 629437c7c90SJeremy L Thompson const CeedInt b_out_index = (num_eval_modes_out[0] * q + e_out) * elem_size + n; 630437c7c90SJeremy L Thompson const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out; 6312b730f8bSJeremy L Thompson const CeedInt qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 632067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 633eaf62fffSJeremy L Thompson } 634067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 635ed9e99e6SJeremy L Thompson } 636ed9e99e6SJeremy L Thompson } 637eaf62fffSJeremy L Thompson } 638eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 639437c7c90SJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0])); 640eaf62fffSJeremy L Thompson 641eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 642ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 643ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 644eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 645eaf62fffSJeremy L Thompson count++; 646eaf62fffSJeremy L Thompson } 647eaf62fffSJeremy L Thompson } 648eaf62fffSJeremy L Thompson } 649eaf62fffSJeremy L Thompson } 650eaf62fffSJeremy L Thompson } 6516574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries"); 6522b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 653eaf62fffSJeremy L Thompson 6542b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6552b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 656eaf62fffSJeremy L Thompson 657eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 658eaf62fffSJeremy L Thompson } 659eaf62fffSJeremy L Thompson 660eaf62fffSJeremy L Thompson /** 661eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 662eaf62fffSJeremy L Thompson 663eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 664eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 665eaf62fffSJeremy L Thompson 666eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 667eaf62fffSJeremy L Thompson 668eaf62fffSJeremy L Thompson @ref Utility 669eaf62fffSJeremy L Thompson **/ 6702b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) { 671b275c451SJeremy L Thompson bool is_composite; 672eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 673eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 674eaf62fffSJeremy L Thompson 675b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 6766574a04fSJeremy L Thompson CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 6772b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6782b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6792b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6802b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 681eaf62fffSJeremy L Thompson *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 682eaf62fffSJeremy L Thompson 683eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 684eaf62fffSJeremy L Thompson } 685eaf62fffSJeremy L Thompson 686eaf62fffSJeremy L Thompson /** 687ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 688eaf62fffSJeremy L Thompson 689eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 69085bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 691eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 692eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 69385bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 694eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 69585bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 69685bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 697eaf62fffSJeremy L Thompson 698eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 699eaf62fffSJeremy L Thompson 700eaf62fffSJeremy L Thompson @ref Developer 701eaf62fffSJeremy L Thompson **/ 7022b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7032b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 704eaf62fffSJeremy L Thompson Ceed ceed; 70585bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 7062b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 707eaf62fffSJeremy L Thompson 708eaf62fffSJeremy L Thompson // Check for composite operator 709eaf62fffSJeremy L Thompson bool is_composite; 7102b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 7116574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 712eaf62fffSJeremy L Thompson 713eaf62fffSJeremy L Thompson // Coarse Grid 7142b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 715eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 716eaf62fffSJeremy L Thompson // -- Clone input fields 71792ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 718eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 719437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 7202b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 721eaf62fffSJeremy L Thompson } else { 722437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 7232b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 724eaf62fffSJeremy L Thompson } 725eaf62fffSJeremy L Thompson } 726eaf62fffSJeremy L Thompson // -- Clone output fields 72792ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 728eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7292b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 730eaf62fffSJeremy L Thompson } else { 731437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 7322b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 733eaf62fffSJeremy L Thompson } 734eaf62fffSJeremy L Thompson } 735af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7362b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 737eaf62fffSJeremy L Thompson 738eaf62fffSJeremy L Thompson // Multiplicity vector 73985bb9dcfSJeremy L Thompson if (op_restrict || op_prolong) { 74085bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 74185bb9dcfSJeremy L Thompson 7426574a04fSJeremy L Thompson CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 7432b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7442b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 7452b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7462b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 7472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7482b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7492b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 75085bb9dcfSJeremy L Thompson } 751eaf62fffSJeremy L Thompson 752addd79feSZach Atkins // Clone name 753addd79feSZach Atkins bool has_name = op_fine->name; 754addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 755addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 756addd79feSZach Atkins 75783d6adf3SZach Atkins // Check that coarse to fine basis is provided if prolong/restrict operators are requested 7586574a04fSJeremy L Thompson CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE, 7596574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine basis"); 76083d6adf3SZach Atkins 76185bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 762eaf62fffSJeremy L Thompson CeedInt num_comp; 7632b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 764addd79feSZach Atkins 765addd79feSZach Atkins // Restriction 766addd79feSZach Atkins if (op_restrict) { 767eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 76885bb9dcfSJeremy L Thompson CeedQFunction qf_restrict; 76985bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 77085bb9dcfSJeremy L Thompson 77185bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 7722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 773eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 7742b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7762b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7782b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7802b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 782eaf62fffSJeremy L Thompson 7832b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7842b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 7852b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 7862b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 787eaf62fffSJeremy L Thompson 788addd79feSZach Atkins // Set name 789addd79feSZach Atkins char *restriction_name; 790addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 791addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 792addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 793addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 794addd79feSZach Atkins 795addd79feSZach Atkins // Check 796addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_restrict)); 797addd79feSZach Atkins 798addd79feSZach Atkins // Cleanup 799addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_restrict)); 800addd79feSZach Atkins } 801addd79feSZach Atkins 802eaf62fffSJeremy L Thompson // Prolongation 803addd79feSZach Atkins if (op_prolong) { 804eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 80585bb9dcfSJeremy L Thompson CeedQFunction qf_prolong; 80685bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 80785bb9dcfSJeremy L Thompson 80885bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 8092b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 810eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 8112b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 8122b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 8132b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 8142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8172b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8182b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 819eaf62fffSJeremy L Thompson 8202b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8212b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 8222b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8232b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 824eaf62fffSJeremy L Thompson 825addd79feSZach Atkins // Set name 826ea6b5821SJeremy L Thompson char *prolongation_name; 8272b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8282b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8292b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8302b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 831addd79feSZach Atkins 832addd79feSZach Atkins // Check 833addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 834addd79feSZach Atkins 835addd79feSZach Atkins // Cleanup 836addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 837ea6b5821SJeremy L Thompson } 838ea6b5821SJeremy L Thompson 83958e4b056SJeremy L Thompson // Check 84058e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 84158e4b056SJeremy L Thompson 842eaf62fffSJeremy L Thompson // Cleanup 8432b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 8442b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 845805fe78eSJeremy L Thompson 846eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 847eaf62fffSJeremy L Thompson } 848eaf62fffSJeremy L Thompson 849eaf62fffSJeremy L Thompson /** 850eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 851eaf62fffSJeremy L Thompson 852eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 853eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 854eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 855eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 856eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 857eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 858eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 859eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 860eaf62fffSJeremy L Thompson 861eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 862eaf62fffSJeremy L Thompson 863eaf62fffSJeremy L Thompson @ref Developer 864eaf62fffSJeremy L Thompson **/ 8652c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff 8662c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d, 8672c2ea1dbSJeremy L Thompson CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8682b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 869eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 870eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8712b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 872eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 873eaf62fffSJeremy L Thompson } 8742b730f8bSJeremy L Thompson } 875eaf62fffSJeremy L Thompson // -- Laplacian 8762b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 877eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 878eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8792b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 880eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 881eaf62fffSJeremy L Thompson } 8822b730f8bSJeremy L Thompson } 883eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8842b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 885eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 886eaf62fffSJeremy L Thompson } 8872c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn 888eaf62fffSJeremy L Thompson 889eaf62fffSJeremy L Thompson /// @} 890eaf62fffSJeremy L Thompson 891eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 892480fae85SJeremy L Thompson /// CeedOperator Backend API 893480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 894480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 895480fae85SJeremy L Thompson /// @{ 896480fae85SJeremy L Thompson 897480fae85SJeremy L Thompson /** 898480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 899480fae85SJeremy L Thompson 900480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 901ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 902480fae85SJeremy L Thompson 903480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 904480fae85SJeremy L Thompson 905480fae85SJeremy L Thompson @ref Backend 906480fae85SJeremy L Thompson **/ 907ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9082b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 909480fae85SJeremy L Thompson (*data)->ref_count = 1; 910480fae85SJeremy L Thompson (*data)->ceed = ceed; 9112b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 912480fae85SJeremy L Thompson 913480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 914480fae85SJeremy L Thompson } 915480fae85SJeremy L Thompson 916480fae85SJeremy L Thompson /** 917480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 918480fae85SJeremy L Thompson 919ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 920480fae85SJeremy L Thompson 921480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 922480fae85SJeremy L Thompson 923480fae85SJeremy L Thompson @ref Backend 924480fae85SJeremy L Thompson **/ 925480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 926480fae85SJeremy L Thompson data->ref_count++; 927480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 928480fae85SJeremy L Thompson } 929480fae85SJeremy L Thompson 930480fae85SJeremy L Thompson /** 931beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9328b919e6bSJeremy L Thompson 933ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 934ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9358b919e6bSJeremy L Thompson 9368b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9378b919e6bSJeremy L Thompson 9388b919e6bSJeremy L Thompson @ref Backend 9398b919e6bSJeremy L Thompson **/ 9402b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 941beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 942beecbf24SJeremy L Thompson data->needs_data_update = true; 943beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 944beecbf24SJeremy L Thompson } 945beecbf24SJeremy L Thompson 946beecbf24SJeremy L Thompson /** 947beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 948beecbf24SJeremy L Thompson 949ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 950ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 951beecbf24SJeremy L Thompson 952beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 953beecbf24SJeremy L Thompson 954beecbf24SJeremy L Thompson @ref Backend 955beecbf24SJeremy L Thompson **/ 9562b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 957beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9588b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9598b919e6bSJeremy L Thompson } 9608b919e6bSJeremy L Thompson 9618b919e6bSJeremy L Thompson /** 9628b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9638b919e6bSJeremy L Thompson 9648b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9658b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9668b919e6bSJeremy L Thompson 9678b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9688b919e6bSJeremy L Thompson 9698b919e6bSJeremy L Thompson @ref Backend 9708b919e6bSJeremy L Thompson **/ 9712b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 972beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9738b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9748b919e6bSJeremy L Thompson } 9758b919e6bSJeremy L Thompson 9768b919e6bSJeremy L Thompson /** 977ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 9784385fb7fSSebastian Grimberg 979ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 980512bb800SJeremy L Thompson 981512bb800SJeremy L Thompson Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a 982512bb800SJeremy L Thompson CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this 983512bb800SJeremy L Thompson CeedQFunctionAssemblyData. 984480fae85SJeremy L Thompson 985ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 986ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 987480fae85SJeremy L Thompson 988480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 989480fae85SJeremy L Thompson 990480fae85SJeremy L Thompson @ref Backend 991480fae85SJeremy L Thompson **/ 9922b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 9932b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 9942b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 995480fae85SJeremy L Thompson *data_copy = data; 996480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 997480fae85SJeremy L Thompson } 998480fae85SJeremy L Thompson 999480fae85SJeremy L Thompson /** 1000480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 1001480fae85SJeremy L Thompson 1002ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1003480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1004480fae85SJeremy L Thompson 1005480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1006480fae85SJeremy L Thompson 1007480fae85SJeremy L Thompson @ref Backend 1008480fae85SJeremy L Thompson **/ 10092b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1010480fae85SJeremy L Thompson *is_setup = data->is_setup; 1011480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1012480fae85SJeremy L Thompson } 1013480fae85SJeremy L Thompson 1014480fae85SJeremy L Thompson /** 1015480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1016480fae85SJeremy L Thompson 1017ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1018480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1019480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1020480fae85SJeremy L Thompson 1021480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1022480fae85SJeremy L Thompson 1023480fae85SJeremy L Thompson @ref Backend 1024480fae85SJeremy L Thompson **/ 10252b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10262b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10272b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1028480fae85SJeremy L Thompson 1029480fae85SJeremy L Thompson data->is_setup = true; 1030480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1031480fae85SJeremy L Thompson } 1032480fae85SJeremy L Thompson 10332b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 10346574a04fSJeremy L Thompson CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1035480fae85SJeremy L Thompson 10362b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10372b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1038480fae85SJeremy L Thompson 1039480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1040480fae85SJeremy L Thompson } 1041480fae85SJeremy L Thompson 1042480fae85SJeremy L Thompson /** 1043480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1044480fae85SJeremy L Thompson 1045ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1046480fae85SJeremy L Thompson 1047480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1048480fae85SJeremy L Thompson 1049480fae85SJeremy L Thompson @ref Backend 1050480fae85SJeremy L Thompson **/ 1051480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1052ad6481ceSJeremy L Thompson if (!*data || --(*data)->ref_count > 0) { 1053ad6481ceSJeremy L Thompson *data = NULL; 1054ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1055ad6481ceSJeremy L Thompson } 10562b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10572b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10582b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1059480fae85SJeremy L Thompson 10602b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1061480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1062480fae85SJeremy L Thompson } 1063480fae85SJeremy L Thompson 1064ed9e99e6SJeremy L Thompson /** 1065ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1066ed9e99e6SJeremy L Thompson 1067ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1068ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1069ed9e99e6SJeremy L Thompson 1070ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1071ed9e99e6SJeremy L Thompson 1072ed9e99e6SJeremy L Thompson @ref Backend 1073ed9e99e6SJeremy L Thompson **/ 10742b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1075ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1076ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1077ed9e99e6SJeremy L Thompson 10782b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1079ed9e99e6SJeremy L Thompson op->op_assembled = data; 1080ed9e99e6SJeremy L Thompson } 1081ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1082ed9e99e6SJeremy L Thompson 1083ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1084ed9e99e6SJeremy L Thompson } 1085ed9e99e6SJeremy L Thompson 1086ed9e99e6SJeremy L Thompson /** 1087ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1088ba746a46SJeremy L Thompson 1089ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1090ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1091ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1092ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1093ba746a46SJeremy L Thompson CeedEvalMode. 1094ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1095ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1096ed9e99e6SJeremy L Thompson 1097ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1098ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1099ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1100ed9e99e6SJeremy L Thompson 1101ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1102ed9e99e6SJeremy L Thompson 1103ed9e99e6SJeremy L Thompson @ref Backend 1104ed9e99e6SJeremy L Thompson **/ 11052b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1106437c7c90SJeremy L Thompson CeedInt num_active_bases = 0; 1107437c7c90SJeremy L Thompson 1108437c7c90SJeremy L Thompson // Allocate 11092b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1110ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11112b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1112ed9e99e6SJeremy L Thompson 1113ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1114ed9e99e6SJeremy L Thompson CeedQFunction qf; 1115ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1116ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1117ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11182b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11192b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1121ed9e99e6SJeremy L Thompson 1122ed9e99e6SJeremy L Thompson // Determine active input basis 1123437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0; 1124437c7c90SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 1125437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 1126ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1127ed9e99e6SJeremy L Thompson CeedVector vec; 11282b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1129ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1130437c7c90SJeremy L Thompson CeedBasis basis_in = NULL; 1131437c7c90SJeremy L Thompson CeedEvalMode eval_mode; 1132352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 11332b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11342b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1135352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1136352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 1137352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp)); 1138437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1139437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_in) index = i; 1140437c7c90SJeremy L Thompson } 1141437c7c90SJeremy L Thompson if (index == -1) { 1142437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 1143437c7c90SJeremy L Thompson index = num_active_bases; 1144437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1145437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1146437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases])); 1147437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1148437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1149437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1150437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases])); 1151437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1152437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1153437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1154437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1155437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1156437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1157437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1158437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1159437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1160437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1161437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1162437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1163437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1164437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1165437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1166437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1167437c7c90SJeremy L Thompson num_active_bases++; 1168437c7c90SJeremy L Thompson } 1169352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1170352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1171352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index])); 1172352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index])); 1173352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1174437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1175437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1176352a5e7cSSebastian Grimberg offset += num_comp; 1177ed9e99e6SJeremy L Thompson } 1178352a5e7cSSebastian Grimberg num_eval_modes_in[index] += q_comp; 1179ed9e99e6SJeremy L Thompson } 1180ed9e99e6SJeremy L Thompson } 1181ed9e99e6SJeremy L Thompson } 1182437c7c90SJeremy L Thompson (*data)->num_eval_modes_in = num_eval_modes_in; 1183437c7c90SJeremy L Thompson (*data)->eval_modes_in = eval_modes_in; 1184437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1185ed9e99e6SJeremy L Thompson 1186ed9e99e6SJeremy L Thompson // Determine active output basis 1187ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 11882b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11892b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1190437c7c90SJeremy L Thompson offset = 0; 1191ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1192ed9e99e6SJeremy L Thompson CeedVector vec; 11932b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1194ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1195437c7c90SJeremy L Thompson CeedBasis basis_out = NULL; 1196ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 1197352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 1198437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 11992b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1200352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_out, &dim)); 1201352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp)); 1202352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp)); 1203437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1204437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_out) index = i; 1205437c7c90SJeremy L Thompson } 1206437c7c90SJeremy L Thompson if (index == -1) { 1207437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 1208437c7c90SJeremy L Thompson 1209437c7c90SJeremy L Thompson index = num_active_bases; 1210437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1211437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1212437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases])); 1213437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1214437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1215437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1216437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases])); 1217437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1218437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1219437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1220437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1221437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1222437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1223437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1224437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1225437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1226437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1227437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1228437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1229437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1230437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1231437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1232437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1233437c7c90SJeremy L Thompson num_active_bases++; 1234437c7c90SJeremy L Thompson } 1235352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1236352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1237352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index])); 1238352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index])); 1239352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1240437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1241437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1242352a5e7cSSebastian Grimberg offset += num_comp; 1243ed9e99e6SJeremy L Thompson } 1244352a5e7cSSebastian Grimberg num_eval_modes_out[index] += q_comp; 1245ed9e99e6SJeremy L Thompson } 1246ed9e99e6SJeremy L Thompson } 1247ed9e99e6SJeremy L Thompson } 1248437c7c90SJeremy L Thompson (*data)->num_output_components = offset; 1249437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1250437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1251437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1252437c7c90SJeremy L Thompson (*data)->num_active_bases = num_active_bases; 1253ed9e99e6SJeremy L Thompson 1254ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1255ed9e99e6SJeremy L Thompson } 1256ed9e99e6SJeremy L Thompson 1257ed9e99e6SJeremy L Thompson /** 1258ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1259ba746a46SJeremy L Thompson 1260ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1261ed9e99e6SJeremy L Thompson 1262ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1263ba746a46SJeremy L Thompson @param[out] num_active_bases Total number of active bases 1264c5d0f995SJed Brown @param[out] num_eval_modes_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1265ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1266c5d0f995SJed Brown @param[out] eval_modes_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1267ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1268c5d0f995SJed Brown @param[out] num_eval_modes_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1269c5d0f995SJed Brown @param[out] eval_modes_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1270437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1271ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1272ba746a46SJeremy L Thompson including contributions of all active bases 1273ed9e99e6SJeremy L Thompson 1274ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1275ed9e99e6SJeremy L Thompson 1276c5d0f995SJed Brown 1277ed9e99e6SJeremy L Thompson @ref Backend 1278ed9e99e6SJeremy L Thompson **/ 1279437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in, 1280437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out, 1281437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) { 1282437c7c90SJeremy L Thompson if (num_active_bases) *num_active_bases = data->num_active_bases; 1283437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1284437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1285437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1286437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1287437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1288437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1289437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1290ed9e99e6SJeremy L Thompson 1291ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1292ed9e99e6SJeremy L Thompson } 1293ed9e99e6SJeremy L Thompson 1294ed9e99e6SJeremy L Thompson /** 1295ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1296ba746a46SJeremy L Thompson 1297ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1298ed9e99e6SJeremy L Thompson 1299ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1300437c7c90SJeremy L Thompson @param[out] num_active_bases Number of active bases, or NULL 1301437c7c90SJeremy L Thompson @param[out] active_bases Pointer to hold active CeedBasis, or NULL 1302437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1303437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1304ed9e99e6SJeremy L Thompson 1305ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1306ed9e99e6SJeremy L Thompson 1307ed9e99e6SJeremy L Thompson @ref Backend 1308ed9e99e6SJeremy L Thompson **/ 1309437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases, 1310437c7c90SJeremy L Thompson const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) { 1311ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1312437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1313437c7c90SJeremy L Thompson CeedInt num_qpts; 1314437c7c90SJeremy L Thompson 1315437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1316437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1317352a5e7cSSebastian Grimberg CeedInt num_nodes; 1318437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1319ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1320ed9e99e6SJeremy L Thompson 1321352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1322352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in)); 1323ed9e99e6SJeremy L Thompson 1324437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1325437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1326ed9e99e6SJeremy L Thompson } 1327ed9e99e6SJeremy L Thompson if (has_eval_none) { 1328352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1329352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1330352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1331ed9e99e6SJeremy L Thompson } 1332ed9e99e6SJeremy L Thompson } 1333ed9e99e6SJeremy L Thompson 1334ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1335352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1336352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 1337352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 1338437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1339437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1340437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1341352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B); 1342352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in)); 1343352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 1344352a5e7cSSebastian Grimberg if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 1345352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 1346352a5e7cSSebastian Grimberg } 1347352a5e7cSSebastian Grimberg eval_mode_in_prev = data->eval_modes_in[b][e_in]; 1348352a5e7cSSebastian Grimberg B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n]; 1349ed9e99e6SJeremy L Thompson } 1350ed9e99e6SJeremy L Thompson } 1351ed9e99e6SJeremy L Thompson } 1352437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1353437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1354437c7c90SJeremy L Thompson } 1355ed9e99e6SJeremy L Thompson } 1356ed9e99e6SJeremy L Thompson 1357437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1358437c7c90SJeremy L Thompson CeedInt num_qpts; 1359437c7c90SJeremy L Thompson 1360437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1361437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1362352a5e7cSSebastian Grimberg CeedInt num_nodes; 1363ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1364437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1365ed9e99e6SJeremy L Thompson 1366352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1367352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out)); 1368ed9e99e6SJeremy L Thompson 1369437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1370437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1371ed9e99e6SJeremy L Thompson } 1372ed9e99e6SJeremy L Thompson if (has_eval_none) { 1373352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1374352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1375352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1376ed9e99e6SJeremy L Thompson } 1377ed9e99e6SJeremy L Thompson } 1378ed9e99e6SJeremy L Thompson 1379ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1380352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1381352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 1382352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 1383437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1384437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1385437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1386352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B); 1387352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out)); 1388352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 1389352a5e7cSSebastian Grimberg if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 1390352a5e7cSSebastian Grimberg else B = &B[(++d_out) * num_qpts * num_nodes]; 1391352a5e7cSSebastian Grimberg } 1392352a5e7cSSebastian Grimberg eval_mode_out_prev = data->eval_modes_out[b][e_out]; 1393352a5e7cSSebastian Grimberg B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n]; 1394ed9e99e6SJeremy L Thompson } 1395ed9e99e6SJeremy L Thompson } 1396ed9e99e6SJeremy L Thompson } 1397437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1398437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1399437c7c90SJeremy L Thompson } 1400ed9e99e6SJeremy L Thompson } 1401ed9e99e6SJeremy L Thompson 1402437c7c90SJeremy L Thompson // Pass out assembled data 1403437c7c90SJeremy L Thompson if (active_bases) *active_bases = data->active_bases; 1404437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1405437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1406437c7c90SJeremy L Thompson 1407437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1408437c7c90SJeremy L Thompson } 1409437c7c90SJeremy L Thompson 1410437c7c90SJeremy L Thompson /** 1411ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1412ba746a46SJeremy L Thompson 1413ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1414437c7c90SJeremy L Thompson 1415437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1416437c7c90SJeremy L Thompson @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL 1417437c7c90SJeremy L Thompson @param[out] active_elem_rstrs Pointer to hold active CeedElemRestrictions, or NULL 1418437c7c90SJeremy L Thompson 1419437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1420437c7c90SJeremy L Thompson 1421437c7c90SJeremy L Thompson @ref Backend 1422437c7c90SJeremy L Thompson **/ 1423437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs, 1424437c7c90SJeremy L Thompson CeedElemRestriction **active_elem_rstrs) { 1425437c7c90SJeremy L Thompson if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases; 1426437c7c90SJeremy L Thompson if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs; 1427ed9e99e6SJeremy L Thompson 1428ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1429ed9e99e6SJeremy L Thompson } 1430ed9e99e6SJeremy L Thompson 1431ed9e99e6SJeremy L Thompson /** 1432ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1433ed9e99e6SJeremy L Thompson 1434ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1435ed9e99e6SJeremy L Thompson 1436ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1437ed9e99e6SJeremy L Thompson 1438ed9e99e6SJeremy L Thompson @ref Backend 1439ed9e99e6SJeremy L Thompson **/ 1440ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1441ad6481ceSJeremy L Thompson if (!*data) { 1442ad6481ceSJeremy L Thompson *data = NULL; 1443ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1444ad6481ceSJeremy L Thompson } 14452b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1446437c7c90SJeremy L Thompson for (CeedInt b = 0; b < (*data)->num_active_bases; b++) { 1447437c7c90SJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->active_bases[b])); 1448437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b])); 1449437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1450437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1451437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1452437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1453437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1454437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1455437c7c90SJeremy L Thompson } 1456437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_bases)); 1457437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_elem_rstrs)); 1458437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1459437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1460437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1461437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1462437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1463437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1464437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1465437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1466ed9e99e6SJeremy L Thompson 14672b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1468ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1469ed9e99e6SJeremy L Thompson } 1470ed9e99e6SJeremy L Thompson 1471480fae85SJeremy L Thompson /// @} 1472480fae85SJeremy L Thompson 1473480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1474eaf62fffSJeremy L Thompson /// CeedOperator Public API 1475eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1476eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1477eaf62fffSJeremy L Thompson /// @{ 1478eaf62fffSJeremy L Thompson 1479eaf62fffSJeremy L Thompson /** 1480eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1481eaf62fffSJeremy L Thompson 1482ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1483859c15bbSJames Wright The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices 1484859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element. 1485859c15bbSJames Wright 14869fd66db6SSebastian Grimberg Inputs and outputs are in the order provided by the user when adding CeedOperator fields. 14879fd66db6SSebastian Grimberg For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction 14889fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v]. 1489eaf62fffSJeremy L Thompson 1490ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1491f04ea552SJeremy L Thompson 1492ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1493ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1494ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1495ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1496eaf62fffSJeremy L Thompson 1497eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1498eaf62fffSJeremy L Thompson 1499eaf62fffSJeremy L Thompson @ref User 1500eaf62fffSJeremy L Thompson **/ 15012b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15022b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1503eaf62fffSJeremy L Thompson 1504eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1505d04bbc78SJeremy L Thompson // Backend version 15062b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1507eaf62fffSJeremy L Thompson } else { 1508d04bbc78SJeremy L Thompson // Operator fallback 1509d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1510d04bbc78SJeremy L Thompson 15112b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15126574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 15136574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 151470a7ffb3SJeremy L Thompson } 1515eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1516eaf62fffSJeremy L Thompson } 151770a7ffb3SJeremy L Thompson 151870a7ffb3SJeremy L Thompson /** 1519ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 15204385fb7fSSebastian Grimberg 1521ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1522ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1523ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 152470a7ffb3SJeremy L Thompson 1525ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1526ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1527ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1528ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 152970a7ffb3SJeremy L Thompson 153070a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 153170a7ffb3SJeremy L Thompson 153270a7ffb3SJeremy L Thompson @ref User 153370a7ffb3SJeremy L Thompson **/ 15342b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15352b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 153670a7ffb3SJeremy L Thompson 153770a7ffb3SJeremy L Thompson if (op->LinearAssembleQFunctionUpdate) { 1538d04bbc78SJeremy L Thompson // Backend version 1539480fae85SJeremy L Thompson bool qf_assembled_is_setup; 15402efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 15412efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1542480fae85SJeremy L Thompson 15432b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1544480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1545d04bbc78SJeremy L Thompson bool update_needed; 1546d04bbc78SJeremy L Thompson 15472b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 15482b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 15498b919e6bSJeremy L Thompson if (update_needed) { 15502b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request)); 15518b919e6bSJeremy L Thompson } 155270a7ffb3SJeremy L Thompson } else { 15532b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request)); 15542b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 155570a7ffb3SJeremy L Thompson } 15562b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 15572efa2d85SJeremy L Thompson 1558d04bbc78SJeremy L Thompson // Copy reference from internally held copy 155970a7ffb3SJeremy L Thompson *assembled = NULL; 156070a7ffb3SJeremy L Thompson *rstr = NULL; 15612b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 15622b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 15632b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 15642b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 156570a7ffb3SJeremy L Thompson } else { 1566d04bbc78SJeremy L Thompson // Operator fallback 1567d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1568d04bbc78SJeremy L Thompson 15692b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15706574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 15716574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 157270a7ffb3SJeremy L Thompson } 157370a7ffb3SJeremy L Thompson 157470a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1575eaf62fffSJeremy L Thompson } 1576eaf62fffSJeremy L Thompson 1577eaf62fffSJeremy L Thompson /** 1578eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1579eaf62fffSJeremy L Thompson 1580eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1581eaf62fffSJeremy L Thompson 1582ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1583eaf62fffSJeremy L Thompson 1584ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1585f04ea552SJeremy L Thompson 1586ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1587eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1588ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1589eaf62fffSJeremy L Thompson 1590eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1591eaf62fffSJeremy L Thompson 1592eaf62fffSJeremy L Thompson @ref User 1593eaf62fffSJeremy L Thompson **/ 15942b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1595f3d47e36SJeremy L Thompson bool is_composite; 15962b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1597f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1598eaf62fffSJeremy L Thompson 1599c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16002b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16016574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1602c9366a6bSJeremy L Thompson 1603f3d47e36SJeremy L Thompson // Early exit for empty operator 1604f3d47e36SJeremy L Thompson if (!is_composite) { 1605f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1606f3d47e36SJeremy L Thompson 1607f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1608f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1609f3d47e36SJeremy L Thompson } 1610f3d47e36SJeremy L Thompson 1611eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1612d04bbc78SJeremy L Thompson // Backend version 16132b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1614eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1615eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1616d04bbc78SJeremy L Thompson // Backend version with zeroing first 16172b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16182b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1619eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1620eaf62fffSJeremy L Thompson } else { 1621d04bbc78SJeremy L Thompson // Operator fallback 1622d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1623d04bbc78SJeremy L Thompson 16242b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1625d04bbc78SJeremy L Thompson if (op_fallback) { 16262b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1627eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1628eaf62fffSJeremy L Thompson } 1629eaf62fffSJeremy L Thompson } 1630eaf62fffSJeremy L Thompson // Default interface implementation 16312b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16322b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1633d04bbc78SJeremy L Thompson 1634eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1635eaf62fffSJeremy L Thompson } 1636eaf62fffSJeremy L Thompson 1637eaf62fffSJeremy L Thompson /** 1638eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1639eaf62fffSJeremy L Thompson 1640eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1641eaf62fffSJeremy L Thompson 1642ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1643eaf62fffSJeremy L Thompson 1644ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1645f04ea552SJeremy L Thompson 1646ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1647eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1648ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1649eaf62fffSJeremy L Thompson 1650eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1651eaf62fffSJeremy L Thompson 1652eaf62fffSJeremy L Thompson @ref User 1653eaf62fffSJeremy L Thompson **/ 16542b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1655f3d47e36SJeremy L Thompson bool is_composite; 16562b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1657f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1658eaf62fffSJeremy L Thompson 1659c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16602b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16616574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1662c9366a6bSJeremy L Thompson 1663f3d47e36SJeremy L Thompson // Early exit for empty operator 1664f3d47e36SJeremy L Thompson if (!is_composite) { 1665f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1666f3d47e36SJeremy L Thompson 1667f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1668f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1669f3d47e36SJeremy L Thompson } 1670f3d47e36SJeremy L Thompson 1671eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1672d04bbc78SJeremy L Thompson // Backend version 16732b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1674eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1675eaf62fffSJeremy L Thompson } else { 1676d04bbc78SJeremy L Thompson // Operator fallback 1677d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1678d04bbc78SJeremy L Thompson 16792b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1680d04bbc78SJeremy L Thompson if (op_fallback) { 16812b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1682eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1683eaf62fffSJeremy L Thompson } 1684eaf62fffSJeremy L Thompson } 1685eaf62fffSJeremy L Thompson // Default interface implementation 1686eaf62fffSJeremy L Thompson if (is_composite) { 16872b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1688eaf62fffSJeremy L Thompson } else { 16892b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1690eaf62fffSJeremy L Thompson } 1691d04bbc78SJeremy L Thompson 1692d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1693eaf62fffSJeremy L Thompson } 1694eaf62fffSJeremy L Thompson 1695eaf62fffSJeremy L Thompson /** 1696eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1697eaf62fffSJeremy L Thompson 1698ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1699eaf62fffSJeremy L Thompson 1700ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1701eaf62fffSJeremy L Thompson 1702ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1703f04ea552SJeremy L Thompson 1704ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1705ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1706ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1707ea61e9acSJeremy L Thompson component in]. 1708ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1709eaf62fffSJeremy L Thompson 1710eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1711eaf62fffSJeremy L Thompson 1712eaf62fffSJeremy L Thompson @ref User 1713eaf62fffSJeremy L Thompson **/ 17142b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1715f3d47e36SJeremy L Thompson bool is_composite; 17162b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1717f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1718eaf62fffSJeremy L Thompson 1719c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17216574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1722c9366a6bSJeremy L Thompson 1723f3d47e36SJeremy L Thompson // Early exit for empty operator 1724f3d47e36SJeremy L Thompson if (!is_composite) { 1725f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1726f3d47e36SJeremy L Thompson 1727f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1728f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1729f3d47e36SJeremy L Thompson } 1730f3d47e36SJeremy L Thompson 1731eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1732d04bbc78SJeremy L Thompson // Backend version 17332b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1734eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1735eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1736d04bbc78SJeremy L Thompson // Backend version with zeroing first 17372b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17382b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1739eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1740eaf62fffSJeremy L Thompson } else { 1741d04bbc78SJeremy L Thompson // Operator fallback 1742d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1743d04bbc78SJeremy L Thompson 17442b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1745d04bbc78SJeremy L Thompson if (op_fallback) { 17462b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1747eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1748eaf62fffSJeremy L Thompson } 1749eaf62fffSJeremy L Thompson } 1750eaf62fffSJeremy L Thompson // Default interface implementation 17512b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17522b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1753d04bbc78SJeremy L Thompson 1754eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1755eaf62fffSJeremy L Thompson } 1756eaf62fffSJeremy L Thompson 1757eaf62fffSJeremy L Thompson /** 1758eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1759eaf62fffSJeremy L Thompson 1760ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1761eaf62fffSJeremy L Thompson 1762ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1763eaf62fffSJeremy L Thompson 1764ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1765f04ea552SJeremy L Thompson 1766ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1767ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1768ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1769ea61e9acSJeremy L Thompson component in]. 1770ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1771eaf62fffSJeremy L Thompson 1772eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1773eaf62fffSJeremy L Thompson 1774eaf62fffSJeremy L Thompson @ref User 1775eaf62fffSJeremy L Thompson **/ 17762b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1777f3d47e36SJeremy L Thompson bool is_composite; 17782b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1779f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1780eaf62fffSJeremy L Thompson 1781c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17822b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17836574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1784c9366a6bSJeremy L Thompson 1785f3d47e36SJeremy L Thompson // Early exit for empty operator 1786f3d47e36SJeremy L Thompson if (!is_composite) { 1787f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1788f3d47e36SJeremy L Thompson 1789f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1790f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1791f3d47e36SJeremy L Thompson } 1792f3d47e36SJeremy L Thompson 1793eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1794d04bbc78SJeremy L Thompson // Backend version 17952b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1796eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1797eaf62fffSJeremy L Thompson } else { 1798d04bbc78SJeremy L Thompson // Operator fallback 1799d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1800d04bbc78SJeremy L Thompson 18012b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1802d04bbc78SJeremy L Thompson if (op_fallback) { 18032b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1804eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1805eaf62fffSJeremy L Thompson } 1806eaf62fffSJeremy L Thompson } 1807ea61e9acSJeremy L Thompson // Default interface implementation 1808eaf62fffSJeremy L Thompson if (is_composite) { 18092b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1810eaf62fffSJeremy L Thompson } else { 18112b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1812eaf62fffSJeremy L Thompson } 1813d04bbc78SJeremy L Thompson 1814d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1815eaf62fffSJeremy L Thompson } 1816eaf62fffSJeremy L Thompson 1817eaf62fffSJeremy L Thompson /** 1818eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1819eaf62fffSJeremy L Thompson 1820ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1821eaf62fffSJeremy L Thompson 1822ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 18239fd66db6SSebastian Grimberg matrix in entry (i, j). 18249fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 18259fd66db6SSebastian Grimberg This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1826eaf62fffSJeremy L Thompson 1827eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1828eaf62fffSJeremy L Thompson 1829ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1830f04ea552SJeremy L Thompson 1831eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1832eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1833eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1834eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1835eaf62fffSJeremy L Thompson 1836eaf62fffSJeremy L Thompson @ref User 1837eaf62fffSJeremy L Thompson **/ 18382b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1839eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries; 1840eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1841eaf62fffSJeremy L Thompson bool is_composite; 18422b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1843f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1844eaf62fffSJeremy L Thompson 1845eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1846d04bbc78SJeremy L Thompson // Backend version 18472b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1848eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1849eaf62fffSJeremy L Thompson } else { 1850d04bbc78SJeremy L Thompson // Operator fallback 1851d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1852d04bbc78SJeremy L Thompson 18532b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1854d04bbc78SJeremy L Thompson if (op_fallback) { 18552b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1856eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1857eaf62fffSJeremy L Thompson } 1858eaf62fffSJeremy L Thompson } 1859eaf62fffSJeremy L Thompson 1860eaf62fffSJeremy L Thompson // Default interface implementation 1861eaf62fffSJeremy L Thompson 1862eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1863eaf62fffSJeremy L Thompson *num_entries = 0; 1864eaf62fffSJeremy L Thompson if (is_composite) { 1865c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1866c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 186792ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18682b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1869eaf62fffSJeremy L Thompson *num_entries += single_entries; 1870eaf62fffSJeremy L Thompson } 1871eaf62fffSJeremy L Thompson } else { 18722b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1873eaf62fffSJeremy L Thompson *num_entries += single_entries; 1874eaf62fffSJeremy L Thompson } 18752b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 18762b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1877eaf62fffSJeremy L Thompson 1878eaf62fffSJeremy L Thompson // assemble nonzero locations 1879eaf62fffSJeremy L Thompson CeedInt offset = 0; 1880eaf62fffSJeremy L Thompson if (is_composite) { 1881c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1882c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 188392ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18842b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 18852b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1886eaf62fffSJeremy L Thompson offset += single_entries; 1887eaf62fffSJeremy L Thompson } 1888eaf62fffSJeremy L Thompson } else { 18892b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1890eaf62fffSJeremy L Thompson } 1891eaf62fffSJeremy L Thompson 1892eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1893eaf62fffSJeremy L Thompson } 1894eaf62fffSJeremy L Thompson 1895eaf62fffSJeremy L Thompson /** 1896eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1897eaf62fffSJeremy L Thompson 1898ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1899eaf62fffSJeremy L Thompson 1900ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 19019fd66db6SSebastian Grimberg matrix in entry (i, j). 19029fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 19039fd66db6SSebastian Grimberg This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1904eaf62fffSJeremy L Thompson 1905eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1906eaf62fffSJeremy L Thompson 1907ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1908f04ea552SJeremy L Thompson 1909eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1910eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1911eaf62fffSJeremy L Thompson 1912eaf62fffSJeremy L Thompson @ref User 1913eaf62fffSJeremy L Thompson **/ 1914eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1915eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries = 0; 1916eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1917f3d47e36SJeremy L Thompson bool is_composite; 19182b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1919f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1920f3d47e36SJeremy L Thompson 1921f3d47e36SJeremy L Thompson // Early exit for empty operator 1922f3d47e36SJeremy L Thompson if (!is_composite) { 1923f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1924f3d47e36SJeremy L Thompson 1925f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1926f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1927f3d47e36SJeremy L Thompson } 1928eaf62fffSJeremy L Thompson 1929eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1930d04bbc78SJeremy L Thompson // Backend version 19312b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1932eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1933eaf62fffSJeremy L Thompson } else { 1934d04bbc78SJeremy L Thompson // Operator fallback 1935d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1936d04bbc78SJeremy L Thompson 19372b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1938d04bbc78SJeremy L Thompson if (op_fallback) { 19392b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1940eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1941eaf62fffSJeremy L Thompson } 1942eaf62fffSJeremy L Thompson } 1943eaf62fffSJeremy L Thompson 1944eaf62fffSJeremy L Thompson // Default interface implementation 1945eaf62fffSJeremy L Thompson CeedInt offset = 0; 194628ec399dSJeremy L Thompson CeedCall(CeedVectorSetValue(values, 0.0)); 1947eaf62fffSJeremy L Thompson if (is_composite) { 1948c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1949c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1950cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 19512b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 19522b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1953eaf62fffSJeremy L Thompson offset += single_entries; 1954eaf62fffSJeremy L Thompson } 1955eaf62fffSJeremy L Thompson } else { 19562b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1957eaf62fffSJeremy L Thompson } 1958eaf62fffSJeremy L Thompson 1959eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1960eaf62fffSJeremy L Thompson } 1961eaf62fffSJeremy L Thompson 1962eaf62fffSJeremy L Thompson /** 196375f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 196475f0d5a4SJeremy L Thompson 196575f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 196675f0d5a4SJeremy L Thompson 196775f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 196875f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 196975f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 197075f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 197175f0d5a4SJeremy L Thompson 197275f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 197375f0d5a4SJeremy L Thompson 197475f0d5a4SJeremy L Thompson @ref User 197575f0d5a4SJeremy L Thompson **/ 197675f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 197775f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 197875f0d5a4SJeremy L Thompson 197975f0d5a4SJeremy L Thompson Ceed ceed; 1980b275c451SJeremy L Thompson CeedInt num_suboperators; 198175f0d5a4SJeremy L Thompson CeedSize l_vec_len; 198275f0d5a4SJeremy L Thompson CeedScalar *mult_array; 198375f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 1984437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr; 1985b275c451SJeremy L Thompson CeedOperator *sub_operators; 198675f0d5a4SJeremy L Thompson 198775f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 198875f0d5a4SJeremy L Thompson 198975f0d5a4SJeremy L Thompson // Zero mult vector 199075f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 199175f0d5a4SJeremy L Thompson 199275f0d5a4SJeremy L Thompson // Get suboperators 1993b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1994b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1995b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 199675f0d5a4SJeremy L Thompson 199775f0d5a4SJeremy L Thompson // Work vector 199875f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 199975f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 200075f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 200175f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 200275f0d5a4SJeremy L Thompson 200375f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 2004b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 200575f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 200675f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 200775f0d5a4SJeremy L Thompson 200875f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 200975f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 201075f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 201175f0d5a4SJeremy L Thompson } 201275f0d5a4SJeremy L Thompson 201375f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2014437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 2015437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 201675f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 2017437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 2018437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 201975f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 202075f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 202175f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 202275f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 202375f0d5a4SJeremy L Thompson } 202475f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 202575f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 202675f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 202775f0d5a4SJeremy L Thompson } 202875f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2029811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 203075f0d5a4SJeremy L Thompson 203175f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 203275f0d5a4SJeremy L Thompson } 203375f0d5a4SJeremy L Thompson 203475f0d5a4SJeremy L Thompson /** 2035ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2036ea61e9acSJeremy L Thompson grid interpolation 2037eaf62fffSJeremy L Thompson 203858e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2039f04ea552SJeremy L Thompson 2040eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 204185bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2042eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2043eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2044eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 204585bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 204685bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2047eaf62fffSJeremy L Thompson 2048eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2049eaf62fffSJeremy L Thompson 2050eaf62fffSJeremy L Thompson @ref User 2051eaf62fffSJeremy L Thompson **/ 20522b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20532b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 20542b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2055eaf62fffSJeremy L Thompson 205683d6adf3SZach Atkins // Build prolongation matrix, if required 205783d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 205883d6adf3SZach Atkins if (op_prolong || op_restrict) { 205983d6adf3SZach Atkins CeedBasis basis_fine; 20602b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 20612b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 206283d6adf3SZach Atkins } 2063eaf62fffSJeremy L Thompson 2064f113e5dcSJeremy L Thompson // Core code 20652b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2066f113e5dcSJeremy L Thompson 2067eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2068eaf62fffSJeremy L Thompson } 2069eaf62fffSJeremy L Thompson 2070eaf62fffSJeremy L Thompson /** 2071ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2072eaf62fffSJeremy L Thompson 207358e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2074f04ea552SJeremy L Thompson 2075eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 207685bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2077eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2078eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 207985bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2080eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 208185bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 208285bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2083eaf62fffSJeremy L Thompson 2084eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2085eaf62fffSJeremy L Thompson 2086eaf62fffSJeremy L Thompson @ref User 2087eaf62fffSJeremy L Thompson **/ 20882b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20892b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 20902b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 20912b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2092eaf62fffSJeremy L Thompson Ceed ceed; 20932b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2094eaf62fffSJeremy L Thompson 2095eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2096eaf62fffSJeremy L Thompson CeedBasis basis_fine; 20972b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2098eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 20992b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21002b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21016574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2102eaf62fffSJeremy L Thompson 210383d6adf3SZach Atkins // Create coarse to fine basis, if required 210483d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 210583d6adf3SZach Atkins if (op_prolong || op_restrict) { 210683d6adf3SZach Atkins // Check if interpolation matrix is provided 21076574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21086574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2109eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 21102b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21112b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21122b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 21132b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 21142b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2115eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21162b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 21172b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 21182b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 21192b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21202b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21212b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21222b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 212383d6adf3SZach Atkins } 2124eaf62fffSJeremy L Thompson 2125eaf62fffSJeremy L Thompson // Core code 21262b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2127eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2128eaf62fffSJeremy L Thompson } 2129eaf62fffSJeremy L Thompson 2130eaf62fffSJeremy L Thompson /** 2131ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2132eaf62fffSJeremy L Thompson 213358e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2134f04ea552SJeremy L Thompson 2135eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 213685bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2137eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2138eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 213985bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2140eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 214185bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 214285bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2143eaf62fffSJeremy L Thompson 2144eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2145eaf62fffSJeremy L Thompson 2146eaf62fffSJeremy L Thompson @ref User 2147eaf62fffSJeremy L Thompson **/ 21482b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21492b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2150eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 21512b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2152eaf62fffSJeremy L Thompson Ceed ceed; 21532b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2154eaf62fffSJeremy L Thompson 2155eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2156eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21572b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2158eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21592b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21602b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21616574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2162eaf62fffSJeremy L Thompson 2163eaf62fffSJeremy L Thompson // Coarse to fine basis 216483d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 216583d6adf3SZach Atkins if (op_prolong || op_restrict) { 216683d6adf3SZach Atkins // Check if interpolation matrix is provided 21676574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21686574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2169eaf62fffSJeremy L Thompson CeedElemTopology topo; 21702b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2171eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 21722b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21732b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21742b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 21752b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2176eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21772b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 21782b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 21792b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 21802b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21812b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21822b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21832b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 218483d6adf3SZach Atkins } 2185eaf62fffSJeremy L Thompson 2186eaf62fffSJeremy L Thompson // Core code 21872b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2188eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2189eaf62fffSJeremy L Thompson } 2190eaf62fffSJeremy L Thompson 2191eaf62fffSJeremy L Thompson /** 2192ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2193eaf62fffSJeremy L Thompson 2194ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2195859c15bbSJames Wright This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$. 2196859c15bbSJames Wright The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T 21979fd66db6SSebastian Grimberg \hat S V\f$. 21989fd66db6SSebastian Grimberg The CeedOperator must be linear and non-composite. 21999fd66db6SSebastian Grimberg The associated CeedQFunction must therefore also be linear. 2200eaf62fffSJeremy L Thompson 2201ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2202f04ea552SJeremy L Thompson 2203ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2204ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2205ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2206eaf62fffSJeremy L Thompson 2207eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2208eaf62fffSJeremy L Thompson 2209480fae85SJeremy L Thompson @ref User 2210eaf62fffSJeremy L Thompson **/ 22112b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 22122b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2213eaf62fffSJeremy L Thompson 2214eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2215d04bbc78SJeremy L Thompson // Backend version 22162b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2217eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2218eaf62fffSJeremy L Thompson } else { 2219d04bbc78SJeremy L Thompson // Operator fallback 2220d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2221d04bbc78SJeremy L Thompson 22222b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2223d04bbc78SJeremy L Thompson if (op_fallback) { 22242b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2225eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2226eaf62fffSJeremy L Thompson } 2227eaf62fffSJeremy L Thompson } 2228eaf62fffSJeremy L Thompson 2229d04bbc78SJeremy L Thompson // Default interface implementation 2230eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 22312b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 22322b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2233eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2234eaf62fffSJeremy L Thompson CeedQFunction qf; 22352b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2236eaf62fffSJeremy L Thompson 2237eaf62fffSJeremy L Thompson // Determine active input basis 2238eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2239eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2240eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2241eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2242eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2243eaf62fffSJeremy L Thompson CeedInt num_input_fields; 22442b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 22452b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2246eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2247eaf62fffSJeremy L Thompson CeedVector vec; 22482b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2249eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2250eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 22512b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2252eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2253eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 22542b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 22552b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2256eaf62fffSJeremy L Thompson } 2257eaf62fffSJeremy L Thompson } 22586574a04fSJeremy L Thompson CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set"); 2259e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2260352a5e7cSSebastian Grimberg CeedInt P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1; 22612b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 2262352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(basis, &num_nodes)); 22632b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 22642b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 22652b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 22662b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 22672b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 22682b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2269eaf62fffSJeremy L Thompson 2270eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 22716574a04fSJeremy L Thompson bool is_tensor_basis; 22726574a04fSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis)); 22736574a04fSJeremy L Thompson CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2274eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 22752b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 22762b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 22772b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 22782b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 22792b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2280eaf62fffSJeremy L Thompson // -- Build matrices 2281eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 22822b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 22832b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 22842b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 22852b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2286eaf62fffSJeremy L Thompson 2287eaf62fffSJeremy L Thompson // -- Diagonalize 22882b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 22892b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 22902b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 22912b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 22922b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 22932b730f8bSJeremy L Thompson } 22942b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2295eaf62fffSJeremy L Thompson 2296eaf62fffSJeremy L Thompson // Assemble QFunction 2297eaf62fffSJeremy L Thompson CeedVector assembled; 2298eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qf; 22992b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2300eaf62fffSJeremy L Thompson CeedInt layout[3]; 23012b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 23022b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2303eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 23042b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2305eaf62fffSJeremy L Thompson 2306eaf62fffSJeremy L Thompson // Calculate element averages 2307eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2308eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2309eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2310eaf62fffSJeremy L Thompson CeedVector q_weight; 23112b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 23122b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 23132b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 23142b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 23152b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2316eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2317eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2318eaf62fffSJeremy L Thompson CeedInt count = 0; 23192b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 23202b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 23212b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 23222b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2323eaf62fffSJeremy L Thompson count++; 2324eaf62fffSJeremy L Thompson } 23252b730f8bSJeremy L Thompson } 23262b730f8bSJeremy L Thompson } 2327eaf62fffSJeremy L Thompson if (count) { 2328eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2329eaf62fffSJeremy L Thompson } else { 2330eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2331eaf62fffSJeremy L Thompson } 2332eaf62fffSJeremy L Thompson } 23332b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 23342b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 23352b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 23362b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2337eaf62fffSJeremy L Thompson 2338eaf62fffSJeremy L Thompson // Build FDM diagonal 2339eaf62fffSJeremy L Thompson CeedVector q_data; 2340eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 2341352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal)); 2342352a5e7cSSebastian Grimberg const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON; 23432b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2344352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 2345352a5e7cSSebastian Grimberg if (interp) fdm_diagonal[c * num_nodes + n] = 1.0; 23462b730f8bSJeremy L Thompson if (grad) { 2347eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2348eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2349352a5e7cSSebastian Grimberg fdm_diagonal[c * num_nodes + n] += lambda[i]; 2350eaf62fffSJeremy L Thompson } 2351eaf62fffSJeremy L Thompson } 2352352a5e7cSSebastian Grimberg if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound; 23532b730f8bSJeremy L Thompson } 23542b730f8bSJeremy L Thompson } 2355352a5e7cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data)); 23562b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 23572b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 23582b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 23592b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2360352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]); 23612b730f8bSJeremy L Thompson } 23622b730f8bSJeremy L Thompson } 23632b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 23642b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 23652b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2366eaf62fffSJeremy L Thompson 2367eaf62fffSJeremy L Thompson // Setup FDM operator 2368eaf62fffSJeremy L Thompson // -- Basis 2369eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2370eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 23712b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 23722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 23732b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 23742b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 23752b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 23762b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 23772b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 23782b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 23792b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2380eaf62fffSJeremy L Thompson 2381eaf62fffSJeremy L Thompson // -- Restriction 2382eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2383352a5e7cSSebastian Grimberg CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp}; 2384352a5e7cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i)); 2385eaf62fffSJeremy L Thompson // -- QFunction 2386eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 23872b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 23882b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 23892b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 23902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 23912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2392eaf62fffSJeremy L Thompson // -- QFunction context 2393eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 23942b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2395eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2396eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 23972b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 23982b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 23992b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 24002b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2401eaf62fffSJeremy L Thompson // -- Operator 24022b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 24032b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 24042b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 24052b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2406eaf62fffSJeremy L Thompson 2407eaf62fffSJeremy L Thompson // Cleanup 24082b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 24092b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 24102b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 24112b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2412eaf62fffSJeremy L Thompson 2413eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2414eaf62fffSJeremy L Thompson } 2415eaf62fffSJeremy L Thompson 2416eaf62fffSJeremy L Thompson /// @} 2417