13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 8ed9e99e6SJeremy L Thompson #include <assert.h> 92b730f8bSJeremy L Thompson #include <ceed-impl.h> 1049aac155SJeremy L Thompson #include <ceed.h> 112b730f8bSJeremy L Thompson #include <ceed/backend.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 449e77b9c8SJeremy L Thompson char *source_path_with_name = ""; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 119437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 123437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127805fe78eSJeremy L Thompson if (op_fallback->num_qpts == 0) { 1282b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 129805fe78eSJeremy L Thompson } 1309e77b9c8SJeremy L Thompson // Cleanup 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1332b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 134805fe78eSJeremy L Thompson } 1352b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1362b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 137805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 138eaf62fffSJeremy L Thompson 139eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 140eaf62fffSJeremy L Thompson } 141eaf62fffSJeremy L Thompson 142eaf62fffSJeremy L Thompson /** 143ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 144d04bbc78SJeremy L Thompson 145d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 146d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 147d04bbc78SJeremy L Thompson 148d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 149d04bbc78SJeremy L Thompson 150d04bbc78SJeremy L Thompson @ref Developer 151d04bbc78SJeremy L Thompson **/ 152d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 153d04bbc78SJeremy L Thompson // Create if needed 154d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1552b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 156d04bbc78SJeremy L Thompson } 157d04bbc78SJeremy L Thompson if (op->op_fallback) { 158d04bbc78SJeremy L Thompson bool is_debug; 159d04bbc78SJeremy L Thompson 1602b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 161d04bbc78SJeremy L Thompson if (is_debug) { 162b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 163d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 164d04bbc78SJeremy L Thompson 165b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 166b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 167b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1682b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 169d04bbc78SJeremy L Thompson 170b275c451SJeremy L Thompson CeedDebug256(ceed, 1, "---------- CeedOperator Fallback ----------\n"); 171b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1722b730f8bSJeremy L Thompson op->op_fallback); 173d04bbc78SJeremy L Thompson } 174d04bbc78SJeremy L Thompson } 175d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 176d04bbc78SJeremy L Thompson 177d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 178d04bbc78SJeremy L Thompson } 179d04bbc78SJeremy L Thompson 180d04bbc78SJeremy L Thompson /** 181eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 182eaf62fffSJeremy L Thompson 183352a5e7cSSebastian Grimberg @param[in] basis CeedBasis from which to get the basis matrix 184eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 185eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 186eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 187eaf62fffSJeremy L Thompson 188eaf62fffSJeremy L Thompson @ref Developer 189eaf62fffSJeremy L Thompson **/ 190352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) { 191eaf62fffSJeremy L Thompson switch (eval_mode) { 192eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 193eaf62fffSJeremy L Thompson *basis_ptr = identity; 194eaf62fffSJeremy L Thompson break; 195eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 196352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetInterp(basis, basis_ptr)); 197eaf62fffSJeremy L Thompson break; 198eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 199352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetGrad(basis, basis_ptr)); 200352a5e7cSSebastian Grimberg break; 201352a5e7cSSebastian Grimberg case CEED_EVAL_DIV: 202352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDiv(basis, basis_ptr)); 203352a5e7cSSebastian Grimberg break; 204352a5e7cSSebastian Grimberg case CEED_EVAL_CURL: 205352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetCurl(basis, basis_ptr)); 206eaf62fffSJeremy L Thompson break; 207eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 208eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 209eaf62fffSJeremy L Thompson } 210ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 211352a5e7cSSebastian Grimberg 212352a5e7cSSebastian Grimberg return CEED_ERROR_SUCCESS; 213eaf62fffSJeremy L Thompson } 214eaf62fffSJeremy L Thompson 215eaf62fffSJeremy L Thompson /** 216eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 217eaf62fffSJeremy L Thompson 218eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 219ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 220eaf62fffSJeremy L Thompson 221eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 222eaf62fffSJeremy L Thompson 223eaf62fffSJeremy L Thompson @ref Developer 224eaf62fffSJeremy L Thompson **/ 2252b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 226eaf62fffSJeremy L Thompson Ceed ceed; 2272b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 228eaf62fffSJeremy L Thompson const CeedInt *offsets; 2292b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 230eaf62fffSJeremy L Thompson 231eaf62fffSJeremy L Thompson // Expand offsets 2327b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2337b63f5c6SJed Brown CeedSize l_size; 2342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2352b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2362b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2372b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2382b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 239eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2402b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2412b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 242eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 243eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 244eaf62fffSJeremy L Thompson } 245eaf62fffSJeremy L Thompson 246eaf62fffSJeremy L Thompson // Create new restriction 2472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2482b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 249eaf62fffSJeremy L Thompson 250eaf62fffSJeremy L Thompson // Cleanup 2512b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 252eaf62fffSJeremy L Thompson 253eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 254eaf62fffSJeremy L Thompson } 255eaf62fffSJeremy L Thompson 256eaf62fffSJeremy L Thompson /** 257eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 258eaf62fffSJeremy L Thompson 259eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 260ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 261eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 262eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 263eaf62fffSJeremy L Thompson 264eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 265eaf62fffSJeremy L Thompson 266eaf62fffSJeremy L Thompson @ref Developer 267eaf62fffSJeremy L Thompson **/ 2682b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 269eaf62fffSJeremy L Thompson Ceed ceed; 2702b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 271eaf62fffSJeremy L Thompson 272eaf62fffSJeremy L Thompson // Assemble QFunction 273eaf62fffSJeremy L Thompson CeedQFunction qf; 274437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 275eaf62fffSJeremy L Thompson CeedVector assembled_qf; 276437c7c90SJeremy L Thompson CeedElemRestriction assembled_elem_rstr; 277437c7c90SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 278eaf62fffSJeremy L Thompson CeedInt layout[3]; 279437c7c90SJeremy L Thompson 280437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 281437c7c90SJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 282437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 283437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout)); 284437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 285437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 286eaf62fffSJeremy L Thompson 287ed9e99e6SJeremy L Thompson // Get assembly data 288ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 289437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 290437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 291437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 292437c7c90SJeremy L Thompson CeedBasis *active_bases; 293437c7c90SJeremy L Thompson CeedElemRestriction *active_elem_rstrs; 294437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 295437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 296437c7c90SJeremy L Thompson &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components)); 297437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL)); 298437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs)); 299437c7c90SJeremy L Thompson 300437c7c90SJeremy L Thompson // Loop over all active bases 301437c7c90SJeremy L Thompson for (CeedInt b = 0; b < num_active_bases; b++) { 302eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 303437c7c90SJeremy L Thompson CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b]; 304437c7c90SJeremy L Thompson 305eaf62fffSJeremy L Thompson if (is_pointblock) { 306437c7c90SJeremy L Thompson CeedElemRestriction point_block_elem_rstr; 307437c7c90SJeremy L Thompson 308437c7c90SJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr)); 309437c7c90SJeremy L Thompson diag_elem_rstr = point_block_elem_rstr; 310eaf62fffSJeremy L Thompson } 311eaf62fffSJeremy L Thompson 312eaf62fffSJeremy L Thompson // Create diagonal vector 313eaf62fffSJeremy L Thompson CeedVector elem_diag; 314437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 315eaf62fffSJeremy L Thompson 316eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3179c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 318437c7c90SJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts, num_components; 319437c7c90SJeremy L Thompson 3202b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3212b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 322437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 323437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes)); 324437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components)); 325437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts)); 326ed9e99e6SJeremy L Thompson 327352a5e7cSSebastian Grimberg // Construct identity matrix for basis if required 328ed9e99e6SJeremy L Thompson bool has_eval_none = false; 329352a5e7cSSebastian Grimberg CeedScalar *identity = NULL; 330437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 331437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 332ed9e99e6SJeremy L Thompson } 333437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 334437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 335ed9e99e6SJeremy L Thompson } 336ed9e99e6SJeremy L Thompson if (has_eval_none) { 3372b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3382b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 339eaf62fffSJeremy L Thompson } 340352a5e7cSSebastian Grimberg 341eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 342eaf62fffSJeremy L Thompson // Each element 343eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 344eaf62fffSJeremy L Thompson // Each basis eval mode pair 345352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 346352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 347437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 348437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 349352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t); 350352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out)); 351352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 352352a5e7cSSebastian Grimberg if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 353352a5e7cSSebastian Grimberg else B_t = &B_t[(++d_out) * num_qpts * num_nodes]; 354352a5e7cSSebastian Grimberg } 355352a5e7cSSebastian Grimberg eval_mode_out_prev = eval_modes_out[b][e_out]; 356352a5e7cSSebastian Grimberg 357352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 358352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 359437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 360437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 361352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B); 362352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in)); 363352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 364352a5e7cSSebastian Grimberg if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 365352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 366352a5e7cSSebastian Grimberg } 367352a5e7cSSebastian Grimberg eval_mode_in_prev = eval_modes_in[b][e_in]; 368352a5e7cSSebastian Grimberg 369eaf62fffSJeremy L Thompson // Each component 370437c7c90SJeremy L Thompson for (CeedInt c_out = 0; c_out < num_components; c_out++) { 371437c7c90SJeremy L Thompson // Each qpt/node pair 3722b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 373eaf62fffSJeremy L Thompson if (is_pointblock) { 374eaf62fffSJeremy L Thompson // Point Block Diagonal 375437c7c90SJeremy L Thompson for (CeedInt c_in = 0; c_in < num_components; c_in++) { 376437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 377437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3782b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 379437c7c90SJeremy L Thompson elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] += 380437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 381eaf62fffSJeremy L Thompson } 3822b730f8bSJeremy L Thompson } 383eaf62fffSJeremy L Thompson } else { 384eaf62fffSJeremy L Thompson // Diagonal Only 385437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 386437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3872b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 388437c7c90SJeremy L Thompson elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 389eaf62fffSJeremy L Thompson } 390eaf62fffSJeremy L Thompson } 391eaf62fffSJeremy L Thompson } 392eaf62fffSJeremy L Thompson } 3932b730f8bSJeremy L Thompson } 3942b730f8bSJeremy L Thompson } 3952b730f8bSJeremy L Thompson } 3962b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 397eaf62fffSJeremy L Thompson 398eaf62fffSJeremy L Thompson // Assemble local operator diagonal 399437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 400eaf62fffSJeremy L Thompson 401eaf62fffSJeremy L Thompson // Cleanup 402437c7c90SJeremy L Thompson if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 4032b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 4042b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 405437c7c90SJeremy L Thompson } 406437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 407437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 408eaf62fffSJeremy L Thompson 409eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 410eaf62fffSJeremy L Thompson } 411eaf62fffSJeremy L Thompson 412eaf62fffSJeremy L Thompson /** 413eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 414eaf62fffSJeremy L Thompson 415eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 416ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 417eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 418eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 419eaf62fffSJeremy L Thompson 420eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 421eaf62fffSJeremy L Thompson 422eaf62fffSJeremy L Thompson @ref Developer 423eaf62fffSJeremy L Thompson **/ 4242b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 425eaf62fffSJeremy L Thompson CeedVector assembled) { 426eaf62fffSJeremy L Thompson CeedInt num_sub; 427eaf62fffSJeremy L Thompson CeedOperator *suboperators; 428c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 429c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 430eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4316aa95790SJeremy L Thompson if (is_pointblock) { 4322b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4336aa95790SJeremy L Thompson } else { 4342b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4356aa95790SJeremy L Thompson } 436eaf62fffSJeremy L Thompson } 437eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 438eaf62fffSJeremy L Thompson } 439eaf62fffSJeremy L Thompson 440eaf62fffSJeremy L Thompson /** 441eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 442eaf62fffSJeremy L Thompson 443eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 444eaf62fffSJeremy L Thompson 445eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 446eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 447eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 448eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 449eaf62fffSJeremy L Thompson 450eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 451eaf62fffSJeremy L Thompson 452eaf62fffSJeremy L Thompson @ref Developer 453eaf62fffSJeremy L Thompson **/ 4542b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 455f3d47e36SJeremy L Thompson Ceed ceed; 456f3d47e36SJeremy L Thompson bool is_composite; 457f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 458f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 459f3d47e36SJeremy L Thompson 460*6574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 461eaf62fffSJeremy L Thompson 462c9366a6bSJeremy L Thompson CeedSize num_nodes; 4632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 464eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4652b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 466e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4672b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4682b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4692b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 470eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4712b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 472eaf62fffSJeremy L Thompson 473eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 474eaf62fffSJeremy L Thompson 475eaf62fffSJeremy L Thompson // Determine elem_dof relation 476eaf62fffSJeremy L Thompson CeedVector index_vec; 4772b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 478eaf62fffSJeremy L Thompson CeedScalar *array; 4792b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 480ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4812b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 482eaf62fffSJeremy L Thompson CeedVector elem_dof; 4832b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4842b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4852b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 486eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4872b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4882b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 489eaf62fffSJeremy L Thompson 490eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 491eaf62fffSJeremy L Thompson CeedInt count = 0; 492ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 493ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 494ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 495ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 496ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 4972b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 4982b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 499eaf62fffSJeremy L Thompson 500eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 501eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 502eaf62fffSJeremy L Thompson 503eaf62fffSJeremy L Thompson rows[offset + count] = row; 504eaf62fffSJeremy L Thompson cols[offset + count] = col; 505eaf62fffSJeremy L Thompson count++; 506eaf62fffSJeremy L Thompson } 507eaf62fffSJeremy L Thompson } 508eaf62fffSJeremy L Thompson } 509eaf62fffSJeremy L Thompson } 510eaf62fffSJeremy L Thompson } 511*6574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 5122b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5132b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 514eaf62fffSJeremy L Thompson 515eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 516eaf62fffSJeremy L Thompson } 517eaf62fffSJeremy L Thompson 518eaf62fffSJeremy L Thompson /** 519eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 520eaf62fffSJeremy L Thompson 521eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 522eaf62fffSJeremy L Thompson 523eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 524ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 525eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 526eaf62fffSJeremy L Thompson 527eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 528eaf62fffSJeremy L Thompson 529eaf62fffSJeremy L Thompson @ref Developer 530eaf62fffSJeremy L Thompson **/ 5312b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 532f3d47e36SJeremy L Thompson Ceed ceed; 533f3d47e36SJeremy L Thompson bool is_composite; 534f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 535f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 536f3d47e36SJeremy L Thompson 537*6574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 538f3d47e36SJeremy L Thompson 539f3d47e36SJeremy L Thompson // Early exit for empty operator 540f3d47e36SJeremy L Thompson { 541f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 542f3d47e36SJeremy L Thompson 543f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 544f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 545f3d47e36SJeremy L Thompson } 546eaf62fffSJeremy L Thompson 547cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 548cefa2673SJeremy L Thompson // Backend version 5492b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 550cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 551cefa2673SJeremy L Thompson } else { 552cefa2673SJeremy L Thompson // Operator fallback 553cefa2673SJeremy L Thompson CeedOperator op_fallback; 554cefa2673SJeremy L Thompson 5552b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 556cefa2673SJeremy L Thompson if (op_fallback) { 5572b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 558cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 559cefa2673SJeremy L Thompson } 560cefa2673SJeremy L Thompson } 561cefa2673SJeremy L Thompson 562eaf62fffSJeremy L Thompson // Assemble QFunction 563eaf62fffSJeremy L Thompson CeedQFunction qf; 5642b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 565eaf62fffSJeremy L Thompson CeedVector assembled_qf; 566eaf62fffSJeremy L Thompson CeedElemRestriction rstr_q; 5672b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5681f9221feSJeremy L Thompson CeedSize qf_length; 5692b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 570eaf62fffSJeremy L Thompson 5717e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 572eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 573eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5742b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 575eaf62fffSJeremy L Thompson 576ed9e99e6SJeremy L Thompson // Get assembly data 577ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5782b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 579437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 580437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 581437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out, 582437c7c90SJeremy L Thompson &eval_modes_out, NULL, NULL)); 583437c7c90SJeremy L Thompson CeedBasis *bases; 584437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL)); 585437c7c90SJeremy L Thompson CeedBasis basis_in = bases[0]; 586eaf62fffSJeremy L Thompson 587*6574a04fSJeremy L Thompson CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases"); 588*6574a04fSJeremy L Thompson CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 589eaf62fffSJeremy L Thompson 590ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 591eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5932b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5942b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 5952b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 5962b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 597eaf62fffSJeremy L Thompson 598eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 599eaf62fffSJeremy L Thompson 600eaf62fffSJeremy L Thompson // loop over elements and put in data structure 601eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6022b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 603eaf62fffSJeremy L Thompson 604eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6052b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6062b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 607eaf62fffSJeremy L Thompson 608eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 609437c7c90SJeremy L Thompson const CeedScalar **B_mats_in, **B_mats_out; 610437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out)); 611437c7c90SJeremy L Thompson const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0]; 612437c7c90SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]]; 613eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 61492ae7e47SJeremy L Thompson CeedInt count = 0; 615eaf62fffSJeremy L Thompson CeedScalar *vals; 61628ec399dSJeremy L Thompson CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals)); 617ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 618ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 619ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 620ed9e99e6SJeremy L Thompson // Compute B^T*D 621ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 622ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 623437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 624437c7c90SJeremy L Thompson const CeedInt btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in); 625067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 626437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 627437c7c90SJeremy L Thompson const CeedInt b_out_index = (num_eval_modes_out[0] * q + e_out) * elem_size + n; 628437c7c90SJeremy L Thompson const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out; 6292b730f8bSJeremy L Thompson const CeedInt qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 630067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 631eaf62fffSJeremy L Thompson } 632067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 633ed9e99e6SJeremy L Thompson } 634ed9e99e6SJeremy L Thompson } 635eaf62fffSJeremy L Thompson } 636eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 637437c7c90SJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0])); 638eaf62fffSJeremy L Thompson 639eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 640ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 641ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 642eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 643eaf62fffSJeremy L Thompson count++; 644eaf62fffSJeremy L Thompson } 645eaf62fffSJeremy L Thompson } 646eaf62fffSJeremy L Thompson } 647eaf62fffSJeremy L Thompson } 648eaf62fffSJeremy L Thompson } 649*6574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries"); 6502b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 651eaf62fffSJeremy L Thompson 6522b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6532b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 654eaf62fffSJeremy L Thompson 655eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 656eaf62fffSJeremy L Thompson } 657eaf62fffSJeremy L Thompson 658eaf62fffSJeremy L Thompson /** 659eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 660eaf62fffSJeremy L Thompson 661eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 662eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 663eaf62fffSJeremy L Thompson 664eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 665eaf62fffSJeremy L Thompson 666eaf62fffSJeremy L Thompson @ref Utility 667eaf62fffSJeremy L Thompson **/ 6682b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) { 669b275c451SJeremy L Thompson bool is_composite; 670eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 671eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 672eaf62fffSJeremy L Thompson 673b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 674*6574a04fSJeremy L Thompson CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 6752b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6762b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6772b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6782b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 679eaf62fffSJeremy L Thompson *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 680eaf62fffSJeremy L Thompson 681eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 682eaf62fffSJeremy L Thompson } 683eaf62fffSJeremy L Thompson 684eaf62fffSJeremy L Thompson /** 685ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 686eaf62fffSJeremy L Thompson 687eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 68885bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 689eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 690eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 69185bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 692eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 69385bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 69485bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 695eaf62fffSJeremy L Thompson 696eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 697eaf62fffSJeremy L Thompson 698eaf62fffSJeremy L Thompson @ref Developer 699eaf62fffSJeremy L Thompson **/ 7002b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7012b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 702eaf62fffSJeremy L Thompson Ceed ceed; 70385bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 7042b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 705eaf62fffSJeremy L Thompson 706eaf62fffSJeremy L Thompson // Check for composite operator 707eaf62fffSJeremy L Thompson bool is_composite; 7082b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 709*6574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 710eaf62fffSJeremy L Thompson 711eaf62fffSJeremy L Thompson // Coarse Grid 7122b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 713eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 714eaf62fffSJeremy L Thompson // -- Clone input fields 71592ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 716eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 717437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 7182b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 719eaf62fffSJeremy L Thompson } else { 720437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 7212b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 722eaf62fffSJeremy L Thompson } 723eaf62fffSJeremy L Thompson } 724eaf62fffSJeremy L Thompson // -- Clone output fields 72592ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 726eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7272b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 728eaf62fffSJeremy L Thompson } else { 729437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 7302b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 731eaf62fffSJeremy L Thompson } 732eaf62fffSJeremy L Thompson } 733af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7342b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 735eaf62fffSJeremy L Thompson 736eaf62fffSJeremy L Thompson // Multiplicity vector 73785bb9dcfSJeremy L Thompson if (op_restrict || op_prolong) { 73885bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 73985bb9dcfSJeremy L Thompson 740*6574a04fSJeremy L Thompson CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 7412b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7422b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 7432b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7442b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 7452b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7462b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7472b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 74885bb9dcfSJeremy L Thompson } 749eaf62fffSJeremy L Thompson 750addd79feSZach Atkins // Clone name 751addd79feSZach Atkins bool has_name = op_fine->name; 752addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 753addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 754addd79feSZach Atkins 75583d6adf3SZach Atkins // Check that coarse to fine basis is provided if prolong/restrict operators are requested 756*6574a04fSJeremy L Thompson CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE, 757*6574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine basis"); 75883d6adf3SZach Atkins 75985bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 760eaf62fffSJeremy L Thompson CeedInt num_comp; 7612b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 762addd79feSZach Atkins 763addd79feSZach Atkins // Restriction 764addd79feSZach Atkins if (op_restrict) { 765eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 76685bb9dcfSJeremy L Thompson CeedQFunction qf_restrict; 76785bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 76885bb9dcfSJeremy L Thompson 76985bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 7702b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 771eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 7722b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7732b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7742b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7762b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7782b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 780eaf62fffSJeremy L Thompson 7812b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7822b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 7832b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 7842b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 785eaf62fffSJeremy L Thompson 786addd79feSZach Atkins // Set name 787addd79feSZach Atkins char *restriction_name; 788addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 789addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 790addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 791addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 792addd79feSZach Atkins 793addd79feSZach Atkins // Check 794addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_restrict)); 795addd79feSZach Atkins 796addd79feSZach Atkins // Cleanup 797addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_restrict)); 798addd79feSZach Atkins } 799addd79feSZach Atkins 800eaf62fffSJeremy L Thompson // Prolongation 801addd79feSZach Atkins if (op_prolong) { 802eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 80385bb9dcfSJeremy L Thompson CeedQFunction qf_prolong; 80485bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 80585bb9dcfSJeremy L Thompson 80685bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 8072b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 808eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 8092b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 8102b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 8112b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 8122b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8132b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 817eaf62fffSJeremy L Thompson 8182b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8192b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 8202b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8212b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 822eaf62fffSJeremy L Thompson 823addd79feSZach Atkins // Set name 824ea6b5821SJeremy L Thompson char *prolongation_name; 8252b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8262b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8272b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8282b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 829addd79feSZach Atkins 830addd79feSZach Atkins // Check 831addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 832addd79feSZach Atkins 833addd79feSZach Atkins // Cleanup 834addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 835ea6b5821SJeremy L Thompson } 836ea6b5821SJeremy L Thompson 83758e4b056SJeremy L Thompson // Check 83858e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 83958e4b056SJeremy L Thompson 840eaf62fffSJeremy L Thompson // Cleanup 8412b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 8422b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 843805fe78eSJeremy L Thompson 844eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 845eaf62fffSJeremy L Thompson } 846eaf62fffSJeremy L Thompson 847eaf62fffSJeremy L Thompson /** 848eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 849eaf62fffSJeremy L Thompson 850eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 851eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 852eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 853eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 854eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 855eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 856eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 857eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 858eaf62fffSJeremy L Thompson 859eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 860eaf62fffSJeremy L Thompson 861eaf62fffSJeremy L Thompson @ref Developer 862eaf62fffSJeremy L Thompson **/ 8632c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff 8642c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d, 8652c2ea1dbSJeremy L Thompson CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8662b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 867eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 868eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8692b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 870eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 871eaf62fffSJeremy L Thompson } 8722b730f8bSJeremy L Thompson } 873eaf62fffSJeremy L Thompson // -- Laplacian 8742b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 875eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 876eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8772b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 878eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 879eaf62fffSJeremy L Thompson } 8802b730f8bSJeremy L Thompson } 881eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8822b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 883eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 884eaf62fffSJeremy L Thompson } 8852c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn 886eaf62fffSJeremy L Thompson 887eaf62fffSJeremy L Thompson /// @} 888eaf62fffSJeremy L Thompson 889eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 890480fae85SJeremy L Thompson /// CeedOperator Backend API 891480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 892480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 893480fae85SJeremy L Thompson /// @{ 894480fae85SJeremy L Thompson 895480fae85SJeremy L Thompson /** 896480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 897480fae85SJeremy L Thompson 898480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 899ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 900480fae85SJeremy L Thompson 901480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 902480fae85SJeremy L Thompson 903480fae85SJeremy L Thompson @ref Backend 904480fae85SJeremy L Thompson **/ 905ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9062b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 907480fae85SJeremy L Thompson (*data)->ref_count = 1; 908480fae85SJeremy L Thompson (*data)->ceed = ceed; 9092b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 910480fae85SJeremy L Thompson 911480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 912480fae85SJeremy L Thompson } 913480fae85SJeremy L Thompson 914480fae85SJeremy L Thompson /** 915480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 916480fae85SJeremy L Thompson 917ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 918480fae85SJeremy L Thompson 919480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 920480fae85SJeremy L Thompson 921480fae85SJeremy L Thompson @ref Backend 922480fae85SJeremy L Thompson **/ 923480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 924480fae85SJeremy L Thompson data->ref_count++; 925480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 926480fae85SJeremy L Thompson } 927480fae85SJeremy L Thompson 928480fae85SJeremy L Thompson /** 929beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9308b919e6bSJeremy L Thompson 931ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 932ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9338b919e6bSJeremy L Thompson 9348b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9358b919e6bSJeremy L Thompson 9368b919e6bSJeremy L Thompson @ref Backend 9378b919e6bSJeremy L Thompson **/ 9382b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 939beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 940beecbf24SJeremy L Thompson data->needs_data_update = true; 941beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 942beecbf24SJeremy L Thompson } 943beecbf24SJeremy L Thompson 944beecbf24SJeremy L Thompson /** 945beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 946beecbf24SJeremy L Thompson 947ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 948ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 949beecbf24SJeremy L Thompson 950beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 951beecbf24SJeremy L Thompson 952beecbf24SJeremy L Thompson @ref Backend 953beecbf24SJeremy L Thompson **/ 9542b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 955beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9568b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9578b919e6bSJeremy L Thompson } 9588b919e6bSJeremy L Thompson 9598b919e6bSJeremy L Thompson /** 9608b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9618b919e6bSJeremy L Thompson 9628b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9638b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9648b919e6bSJeremy L Thompson 9658b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9668b919e6bSJeremy L Thompson 9678b919e6bSJeremy L Thompson @ref Backend 9688b919e6bSJeremy L Thompson **/ 9692b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 970beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9718b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9728b919e6bSJeremy L Thompson } 9738b919e6bSJeremy L Thompson 9748b919e6bSJeremy L Thompson /** 975ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 976ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 977512bb800SJeremy L Thompson 978512bb800SJeremy L Thompson Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a 979512bb800SJeremy L Thompson CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this 980512bb800SJeremy L Thompson CeedQFunctionAssemblyData. 981480fae85SJeremy L Thompson 982ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 983ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 984480fae85SJeremy L Thompson 985480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 986480fae85SJeremy L Thompson 987480fae85SJeremy L Thompson @ref Backend 988480fae85SJeremy L Thompson **/ 9892b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 9902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 9912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 992480fae85SJeremy L Thompson *data_copy = data; 993480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 994480fae85SJeremy L Thompson } 995480fae85SJeremy L Thompson 996480fae85SJeremy L Thompson /** 997480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 998480fae85SJeremy L Thompson 999ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1000480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1001480fae85SJeremy L Thompson 1002480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1003480fae85SJeremy L Thompson 1004480fae85SJeremy L Thompson @ref Backend 1005480fae85SJeremy L Thompson **/ 10062b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1007480fae85SJeremy L Thompson *is_setup = data->is_setup; 1008480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1009480fae85SJeremy L Thompson } 1010480fae85SJeremy L Thompson 1011480fae85SJeremy L Thompson /** 1012480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1013480fae85SJeremy L Thompson 1014ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1015480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1016480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1017480fae85SJeremy L Thompson 1018480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1019480fae85SJeremy L Thompson 1020480fae85SJeremy L Thompson @ref Backend 1021480fae85SJeremy L Thompson **/ 10222b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10232b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10242b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1025480fae85SJeremy L Thompson 1026480fae85SJeremy L Thompson data->is_setup = true; 1027480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1028480fae85SJeremy L Thompson } 1029480fae85SJeremy L Thompson 10302b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 1031*6574a04fSJeremy L Thompson CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1032480fae85SJeremy L Thompson 10332b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1035480fae85SJeremy L Thompson 1036480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1037480fae85SJeremy L Thompson } 1038480fae85SJeremy L Thompson 1039480fae85SJeremy L Thompson /** 1040480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1041480fae85SJeremy L Thompson 1042ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1043480fae85SJeremy L Thompson 1044480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1045480fae85SJeremy L Thompson 1046480fae85SJeremy L Thompson @ref Backend 1047480fae85SJeremy L Thompson **/ 1048480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1049ad6481ceSJeremy L Thompson if (!*data || --(*data)->ref_count > 0) { 1050ad6481ceSJeremy L Thompson *data = NULL; 1051ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1052ad6481ceSJeremy L Thompson } 10532b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10542b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10552b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1056480fae85SJeremy L Thompson 10572b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1058480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1059480fae85SJeremy L Thompson } 1060480fae85SJeremy L Thompson 1061ed9e99e6SJeremy L Thompson /** 1062ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1063ed9e99e6SJeremy L Thompson 1064ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1065ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1066ed9e99e6SJeremy L Thompson 1067ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1068ed9e99e6SJeremy L Thompson 1069ed9e99e6SJeremy L Thompson @ref Backend 1070ed9e99e6SJeremy L Thompson **/ 10712b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1072ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1073ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1074ed9e99e6SJeremy L Thompson 10752b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1076ed9e99e6SJeremy L Thompson op->op_assembled = data; 1077ed9e99e6SJeremy L Thompson } 1078ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1079ed9e99e6SJeremy L Thompson 1080ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1081ed9e99e6SJeremy L Thompson } 1082ed9e99e6SJeremy L Thompson 1083ed9e99e6SJeremy L Thompson /** 1084ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1085ba746a46SJeremy L Thompson 1086ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1087ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1088ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1089ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1090ba746a46SJeremy L Thompson CeedEvalMode. 1091ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1092ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1093ed9e99e6SJeremy L Thompson 1094ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1095ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1096ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1097ed9e99e6SJeremy L Thompson 1098ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1099ed9e99e6SJeremy L Thompson 1100ed9e99e6SJeremy L Thompson @ref Backend 1101ed9e99e6SJeremy L Thompson **/ 11022b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1103437c7c90SJeremy L Thompson CeedInt num_active_bases = 0; 1104437c7c90SJeremy L Thompson 1105437c7c90SJeremy L Thompson // Allocate 11062b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1107ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11082b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1109ed9e99e6SJeremy L Thompson 1110ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1111ed9e99e6SJeremy L Thompson CeedQFunction qf; 1112ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1113ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1114ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11152b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11172b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1118ed9e99e6SJeremy L Thompson 1119ed9e99e6SJeremy L Thompson // Determine active input basis 1120437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0; 1121437c7c90SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 1122437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 1123ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1124ed9e99e6SJeremy L Thompson CeedVector vec; 11252b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1126ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1127437c7c90SJeremy L Thompson CeedBasis basis_in = NULL; 1128437c7c90SJeremy L Thompson CeedEvalMode eval_mode; 1129352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 11302b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1132352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1133352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 1134352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp)); 1135437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1136437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_in) index = i; 1137437c7c90SJeremy L Thompson } 1138437c7c90SJeremy L Thompson if (index == -1) { 1139437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 1140437c7c90SJeremy L Thompson index = num_active_bases; 1141437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1142437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1143437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases])); 1144437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1145437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1146437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1147437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases])); 1148437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1149437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1150437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1151437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1152437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1153437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1154437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1155437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1156437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1157437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1158437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1159437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1160437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1161437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1162437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1163437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1164437c7c90SJeremy L Thompson num_active_bases++; 1165437c7c90SJeremy L Thompson } 1166352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1167352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1168352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index])); 1169352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index])); 1170352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1171437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1172437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1173352a5e7cSSebastian Grimberg offset += num_comp; 1174ed9e99e6SJeremy L Thompson } 1175352a5e7cSSebastian Grimberg num_eval_modes_in[index] += q_comp; 1176ed9e99e6SJeremy L Thompson } 1177ed9e99e6SJeremy L Thompson } 1178ed9e99e6SJeremy L Thompson } 1179437c7c90SJeremy L Thompson (*data)->num_eval_modes_in = num_eval_modes_in; 1180437c7c90SJeremy L Thompson (*data)->eval_modes_in = eval_modes_in; 1181437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1182ed9e99e6SJeremy L Thompson 1183ed9e99e6SJeremy L Thompson // Determine active output basis 1184ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 11852b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11862b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1187437c7c90SJeremy L Thompson offset = 0; 1188ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1189ed9e99e6SJeremy L Thompson CeedVector vec; 11902b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1191ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1192437c7c90SJeremy L Thompson CeedBasis basis_out = NULL; 1193ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 1194352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 1195437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 11962b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1197352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_out, &dim)); 1198352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp)); 1199352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp)); 1200437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1201437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_out) index = i; 1202437c7c90SJeremy L Thompson } 1203437c7c90SJeremy L Thompson if (index == -1) { 1204437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 1205437c7c90SJeremy L Thompson 1206437c7c90SJeremy L Thompson index = num_active_bases; 1207437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1208437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1209437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases])); 1210437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1211437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1212437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1213437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases])); 1214437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1215437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1216437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1217437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1218437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1219437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1220437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1221437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1222437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1223437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1224437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1225437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1226437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1227437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1228437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1229437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1230437c7c90SJeremy L Thompson num_active_bases++; 1231437c7c90SJeremy L Thompson } 1232352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1233352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1234352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index])); 1235352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index])); 1236352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1237437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1238437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1239352a5e7cSSebastian Grimberg offset += num_comp; 1240ed9e99e6SJeremy L Thompson } 1241352a5e7cSSebastian Grimberg num_eval_modes_out[index] += q_comp; 1242ed9e99e6SJeremy L Thompson } 1243ed9e99e6SJeremy L Thompson } 1244ed9e99e6SJeremy L Thompson } 1245437c7c90SJeremy L Thompson (*data)->num_output_components = offset; 1246437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1247437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1248437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1249437c7c90SJeremy L Thompson (*data)->num_active_bases = num_active_bases; 1250ed9e99e6SJeremy L Thompson 1251ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1252ed9e99e6SJeremy L Thompson } 1253ed9e99e6SJeremy L Thompson 1254ed9e99e6SJeremy L Thompson /** 1255ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1256ba746a46SJeremy L Thompson 1257ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1258ed9e99e6SJeremy L Thompson 1259ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1260ba746a46SJeremy L Thompson @param[out] num_active_bases Total number of active bases 1261c5d0f995SJed Brown @param[out] num_eval_modes_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1262ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1263c5d0f995SJed Brown @param[out] eval_modes_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1264ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1265c5d0f995SJed Brown @param[out] num_eval_modes_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1266c5d0f995SJed Brown @param[out] eval_modes_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1267437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1268ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1269ba746a46SJeremy L Thompson including contributions of all active bases 1270ed9e99e6SJeremy L Thompson 1271ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1272ed9e99e6SJeremy L Thompson 1273c5d0f995SJed Brown 1274ed9e99e6SJeremy L Thompson @ref Backend 1275ed9e99e6SJeremy L Thompson **/ 1276437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in, 1277437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out, 1278437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) { 1279437c7c90SJeremy L Thompson if (num_active_bases) *num_active_bases = data->num_active_bases; 1280437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1281437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1282437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1283437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1284437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1285437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1286437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1287ed9e99e6SJeremy L Thompson 1288ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1289ed9e99e6SJeremy L Thompson } 1290ed9e99e6SJeremy L Thompson 1291ed9e99e6SJeremy L Thompson /** 1292ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1293ba746a46SJeremy L Thompson 1294ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1295ed9e99e6SJeremy L Thompson 1296ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1297437c7c90SJeremy L Thompson @param[out] num_active_bases Number of active bases, or NULL 1298437c7c90SJeremy L Thompson @param[out] active_bases Pointer to hold active CeedBasis, or NULL 1299437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1300437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1301ed9e99e6SJeremy L Thompson 1302ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1303ed9e99e6SJeremy L Thompson 1304ed9e99e6SJeremy L Thompson @ref Backend 1305ed9e99e6SJeremy L Thompson **/ 1306437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases, 1307437c7c90SJeremy L Thompson const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) { 1308ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1309437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1310437c7c90SJeremy L Thompson CeedInt num_qpts; 1311437c7c90SJeremy L Thompson 1312437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1313437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1314352a5e7cSSebastian Grimberg CeedInt num_nodes; 1315437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1316ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1317ed9e99e6SJeremy L Thompson 1318352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1319352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in)); 1320ed9e99e6SJeremy L Thompson 1321437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1322437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1323ed9e99e6SJeremy L Thompson } 1324ed9e99e6SJeremy L Thompson if (has_eval_none) { 1325352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1326352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1327352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1328ed9e99e6SJeremy L Thompson } 1329ed9e99e6SJeremy L Thompson } 1330ed9e99e6SJeremy L Thompson 1331ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1332352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1333352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 1334352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 1335437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1336437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1337437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1338352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B); 1339352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in)); 1340352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 1341352a5e7cSSebastian Grimberg if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 1342352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 1343352a5e7cSSebastian Grimberg } 1344352a5e7cSSebastian Grimberg eval_mode_in_prev = data->eval_modes_in[b][e_in]; 1345352a5e7cSSebastian Grimberg B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n]; 1346ed9e99e6SJeremy L Thompson } 1347ed9e99e6SJeremy L Thompson } 1348ed9e99e6SJeremy L Thompson } 1349437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1350437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1351437c7c90SJeremy L Thompson } 1352ed9e99e6SJeremy L Thompson } 1353ed9e99e6SJeremy L Thompson 1354437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1355437c7c90SJeremy L Thompson CeedInt num_qpts; 1356437c7c90SJeremy L Thompson 1357437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1358437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1359352a5e7cSSebastian Grimberg CeedInt num_nodes; 1360ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1361437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1362ed9e99e6SJeremy L Thompson 1363352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1364352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out)); 1365ed9e99e6SJeremy L Thompson 1366437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1367437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1368ed9e99e6SJeremy L Thompson } 1369ed9e99e6SJeremy L Thompson if (has_eval_none) { 1370352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1371352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1372352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1373ed9e99e6SJeremy L Thompson } 1374ed9e99e6SJeremy L Thompson } 1375ed9e99e6SJeremy L Thompson 1376ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1377352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1378352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 1379352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 1380437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1381437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1382437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1383352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B); 1384352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out)); 1385352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 1386352a5e7cSSebastian Grimberg if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 1387352a5e7cSSebastian Grimberg else B = &B[(++d_out) * num_qpts * num_nodes]; 1388352a5e7cSSebastian Grimberg } 1389352a5e7cSSebastian Grimberg eval_mode_out_prev = data->eval_modes_out[b][e_out]; 1390352a5e7cSSebastian Grimberg B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n]; 1391ed9e99e6SJeremy L Thompson } 1392ed9e99e6SJeremy L Thompson } 1393ed9e99e6SJeremy L Thompson } 1394437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1395437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1396437c7c90SJeremy L Thompson } 1397ed9e99e6SJeremy L Thompson } 1398ed9e99e6SJeremy L Thompson 1399437c7c90SJeremy L Thompson // Pass out assembled data 1400437c7c90SJeremy L Thompson if (active_bases) *active_bases = data->active_bases; 1401437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1402437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1403437c7c90SJeremy L Thompson 1404437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1405437c7c90SJeremy L Thompson } 1406437c7c90SJeremy L Thompson 1407437c7c90SJeremy L Thompson /** 1408ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1409ba746a46SJeremy L Thompson 1410ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1411437c7c90SJeremy L Thompson 1412437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1413437c7c90SJeremy L Thompson @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL 1414437c7c90SJeremy L Thompson @param[out] active_elem_rstrs Pointer to hold active CeedElemRestrictions, or NULL 1415437c7c90SJeremy L Thompson 1416437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1417437c7c90SJeremy L Thompson 1418437c7c90SJeremy L Thompson @ref Backend 1419437c7c90SJeremy L Thompson **/ 1420437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs, 1421437c7c90SJeremy L Thompson CeedElemRestriction **active_elem_rstrs) { 1422437c7c90SJeremy L Thompson if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases; 1423437c7c90SJeremy L Thompson if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs; 1424ed9e99e6SJeremy L Thompson 1425ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1426ed9e99e6SJeremy L Thompson } 1427ed9e99e6SJeremy L Thompson 1428ed9e99e6SJeremy L Thompson /** 1429ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1430ed9e99e6SJeremy L Thompson 1431ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1432ed9e99e6SJeremy L Thompson 1433ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1434ed9e99e6SJeremy L Thompson 1435ed9e99e6SJeremy L Thompson @ref Backend 1436ed9e99e6SJeremy L Thompson **/ 1437ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1438ad6481ceSJeremy L Thompson if (!*data) { 1439ad6481ceSJeremy L Thompson *data = NULL; 1440ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1441ad6481ceSJeremy L Thompson } 14422b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1443437c7c90SJeremy L Thompson for (CeedInt b = 0; b < (*data)->num_active_bases; b++) { 1444437c7c90SJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->active_bases[b])); 1445437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b])); 1446437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1447437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1448437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1449437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1450437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1451437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1452437c7c90SJeremy L Thompson } 1453437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_bases)); 1454437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_elem_rstrs)); 1455437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1456437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1457437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1458437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1459437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1460437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1461437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1462437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1463ed9e99e6SJeremy L Thompson 14642b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1465ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1466ed9e99e6SJeremy L Thompson } 1467ed9e99e6SJeremy L Thompson 1468480fae85SJeremy L Thompson /// @} 1469480fae85SJeremy L Thompson 1470480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1471eaf62fffSJeremy L Thompson /// CeedOperator Public API 1472eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1473eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1474eaf62fffSJeremy L Thompson /// @{ 1475eaf62fffSJeremy L Thompson 1476eaf62fffSJeremy L Thompson /** 1477eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1478eaf62fffSJeremy L Thompson 1479ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1480859c15bbSJames Wright The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices 1481859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element. 1482859c15bbSJames Wright 1483859c15bbSJames Wright Inputs and outputs are in the order provided by the 1484ea61e9acSJeremy L Thompson user when adding CeedOperator fields. For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, 1485ea61e9acSJeremy L Thompson would result in an assembled QFunction that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] 1486ea61e9acSJeremy L Thompson and producing the output [dv_0, dv_1, v]. 1487eaf62fffSJeremy L Thompson 1488ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1489f04ea552SJeremy L Thompson 1490ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1491ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1492ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1493ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1494eaf62fffSJeremy L Thompson 1495eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1496eaf62fffSJeremy L Thompson 1497eaf62fffSJeremy L Thompson @ref User 1498eaf62fffSJeremy L Thompson **/ 14992b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15002b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1501eaf62fffSJeremy L Thompson 1502eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1503d04bbc78SJeremy L Thompson // Backend version 15042b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1505eaf62fffSJeremy L Thompson } else { 1506d04bbc78SJeremy L Thompson // Operator fallback 1507d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1508d04bbc78SJeremy L Thompson 15092b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1510*6574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 1511*6574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 151270a7ffb3SJeremy L Thompson } 1513eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1514eaf62fffSJeremy L Thompson } 151570a7ffb3SJeremy L Thompson 151670a7ffb3SJeremy L Thompson /** 1517ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 1518ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1519ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1520ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 152170a7ffb3SJeremy L Thompson 1522ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1523ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1524ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1525ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 152670a7ffb3SJeremy L Thompson 152770a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 152870a7ffb3SJeremy L Thompson 152970a7ffb3SJeremy L Thompson @ref User 153070a7ffb3SJeremy L Thompson **/ 15312b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15322b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 153370a7ffb3SJeremy L Thompson 153470a7ffb3SJeremy L Thompson if (op->LinearAssembleQFunctionUpdate) { 1535d04bbc78SJeremy L Thompson // Backend version 1536480fae85SJeremy L Thompson bool qf_assembled_is_setup; 15372efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 15382efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1539480fae85SJeremy L Thompson 15402b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1541480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1542d04bbc78SJeremy L Thompson bool update_needed; 1543d04bbc78SJeremy L Thompson 15442b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 15452b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 15468b919e6bSJeremy L Thompson if (update_needed) { 15472b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request)); 15488b919e6bSJeremy L Thompson } 154970a7ffb3SJeremy L Thompson } else { 15502b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request)); 15512b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 155270a7ffb3SJeremy L Thompson } 15532b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 15542efa2d85SJeremy L Thompson 1555d04bbc78SJeremy L Thompson // Copy reference from internally held copy 155670a7ffb3SJeremy L Thompson *assembled = NULL; 155770a7ffb3SJeremy L Thompson *rstr = NULL; 15582b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 15592b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 15602b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 15612b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 156270a7ffb3SJeremy L Thompson } else { 1563d04bbc78SJeremy L Thompson // Operator fallback 1564d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1565d04bbc78SJeremy L Thompson 15662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1567*6574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 1568*6574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 156970a7ffb3SJeremy L Thompson } 157070a7ffb3SJeremy L Thompson 157170a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1572eaf62fffSJeremy L Thompson } 1573eaf62fffSJeremy L Thompson 1574eaf62fffSJeremy L Thompson /** 1575eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1576eaf62fffSJeremy L Thompson 1577eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1578eaf62fffSJeremy L Thompson 1579ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1580eaf62fffSJeremy L Thompson 1581ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1582f04ea552SJeremy L Thompson 1583ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1584eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1585ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1586eaf62fffSJeremy L Thompson 1587eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1588eaf62fffSJeremy L Thompson 1589eaf62fffSJeremy L Thompson @ref User 1590eaf62fffSJeremy L Thompson **/ 15912b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1592f3d47e36SJeremy L Thompson bool is_composite; 15932b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1594f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1595eaf62fffSJeremy L Thompson 1596c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 15972b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1598*6574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1599c9366a6bSJeremy L Thompson 1600f3d47e36SJeremy L Thompson // Early exit for empty operator 1601f3d47e36SJeremy L Thompson if (!is_composite) { 1602f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1603f3d47e36SJeremy L Thompson 1604f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1605f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1606f3d47e36SJeremy L Thompson } 1607f3d47e36SJeremy L Thompson 1608eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1609d04bbc78SJeremy L Thompson // Backend version 16102b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1611eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1612eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1613d04bbc78SJeremy L Thompson // Backend version with zeroing first 16142b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16152b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1616eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1617eaf62fffSJeremy L Thompson } else { 1618d04bbc78SJeremy L Thompson // Operator fallback 1619d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1620d04bbc78SJeremy L Thompson 16212b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1622d04bbc78SJeremy L Thompson if (op_fallback) { 16232b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1624eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1625eaf62fffSJeremy L Thompson } 1626eaf62fffSJeremy L Thompson } 1627eaf62fffSJeremy L Thompson // Default interface implementation 16282b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16292b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1630d04bbc78SJeremy L Thompson 1631eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1632eaf62fffSJeremy L Thompson } 1633eaf62fffSJeremy L Thompson 1634eaf62fffSJeremy L Thompson /** 1635eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1636eaf62fffSJeremy L Thompson 1637eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1638eaf62fffSJeremy L Thompson 1639ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1640eaf62fffSJeremy L Thompson 1641ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1642f04ea552SJeremy L Thompson 1643ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1644eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1645ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1646eaf62fffSJeremy L Thompson 1647eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1648eaf62fffSJeremy L Thompson 1649eaf62fffSJeremy L Thompson @ref User 1650eaf62fffSJeremy L Thompson **/ 16512b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1652f3d47e36SJeremy L Thompson bool is_composite; 16532b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1654f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1655eaf62fffSJeremy L Thompson 1656c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16572b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1658*6574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1659c9366a6bSJeremy L Thompson 1660f3d47e36SJeremy L Thompson // Early exit for empty operator 1661f3d47e36SJeremy L Thompson if (!is_composite) { 1662f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1663f3d47e36SJeremy L Thompson 1664f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1665f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1666f3d47e36SJeremy L Thompson } 1667f3d47e36SJeremy L Thompson 1668eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1669d04bbc78SJeremy L Thompson // Backend version 16702b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1671eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1672eaf62fffSJeremy L Thompson } else { 1673d04bbc78SJeremy L Thompson // Operator fallback 1674d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1675d04bbc78SJeremy L Thompson 16762b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1677d04bbc78SJeremy L Thompson if (op_fallback) { 16782b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1679eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1680eaf62fffSJeremy L Thompson } 1681eaf62fffSJeremy L Thompson } 1682eaf62fffSJeremy L Thompson // Default interface implementation 1683eaf62fffSJeremy L Thompson if (is_composite) { 16842b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1685eaf62fffSJeremy L Thompson } else { 16862b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1687eaf62fffSJeremy L Thompson } 1688d04bbc78SJeremy L Thompson 1689d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1690eaf62fffSJeremy L Thompson } 1691eaf62fffSJeremy L Thompson 1692eaf62fffSJeremy L Thompson /** 1693eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1694eaf62fffSJeremy L Thompson 1695ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1696eaf62fffSJeremy L Thompson 1697ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1698eaf62fffSJeremy L Thompson 1699ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1700f04ea552SJeremy L Thompson 1701ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1702ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1703ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1704ea61e9acSJeremy L Thompson component in]. 1705ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1706eaf62fffSJeremy L Thompson 1707eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1708eaf62fffSJeremy L Thompson 1709eaf62fffSJeremy L Thompson @ref User 1710eaf62fffSJeremy L Thompson **/ 17112b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1712f3d47e36SJeremy L Thompson bool is_composite; 17132b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1714f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1715eaf62fffSJeremy L Thompson 1716c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17172b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1718*6574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1719c9366a6bSJeremy L Thompson 1720f3d47e36SJeremy L Thompson // Early exit for empty operator 1721f3d47e36SJeremy L Thompson if (!is_composite) { 1722f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1723f3d47e36SJeremy L Thompson 1724f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1725f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1726f3d47e36SJeremy L Thompson } 1727f3d47e36SJeremy L Thompson 1728eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1729d04bbc78SJeremy L Thompson // Backend version 17302b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1731eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1732eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1733d04bbc78SJeremy L Thompson // Backend version with zeroing first 17342b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17352b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1736eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1737eaf62fffSJeremy L Thompson } else { 1738d04bbc78SJeremy L Thompson // Operator fallback 1739d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1740d04bbc78SJeremy L Thompson 17412b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1742d04bbc78SJeremy L Thompson if (op_fallback) { 17432b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1744eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1745eaf62fffSJeremy L Thompson } 1746eaf62fffSJeremy L Thompson } 1747eaf62fffSJeremy L Thompson // Default interface implementation 17482b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17492b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1750d04bbc78SJeremy L Thompson 1751eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1752eaf62fffSJeremy L Thompson } 1753eaf62fffSJeremy L Thompson 1754eaf62fffSJeremy L Thompson /** 1755eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1756eaf62fffSJeremy L Thompson 1757ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1758eaf62fffSJeremy L Thompson 1759ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1760eaf62fffSJeremy L Thompson 1761ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1762f04ea552SJeremy L Thompson 1763ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1764ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1765ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1766ea61e9acSJeremy L Thompson component in]. 1767ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1768eaf62fffSJeremy L Thompson 1769eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1770eaf62fffSJeremy L Thompson 1771eaf62fffSJeremy L Thompson @ref User 1772eaf62fffSJeremy L Thompson **/ 17732b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1774f3d47e36SJeremy L Thompson bool is_composite; 17752b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1776f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1777eaf62fffSJeremy L Thompson 1778c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17792b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 1780*6574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1781c9366a6bSJeremy L Thompson 1782f3d47e36SJeremy L Thompson // Early exit for empty operator 1783f3d47e36SJeremy L Thompson if (!is_composite) { 1784f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1785f3d47e36SJeremy L Thompson 1786f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1787f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1788f3d47e36SJeremy L Thompson } 1789f3d47e36SJeremy L Thompson 1790eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1791d04bbc78SJeremy L Thompson // Backend version 17922b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1793eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1794eaf62fffSJeremy L Thompson } else { 1795d04bbc78SJeremy L Thompson // Operator fallback 1796d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1797d04bbc78SJeremy L Thompson 17982b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1799d04bbc78SJeremy L Thompson if (op_fallback) { 18002b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1801eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1802eaf62fffSJeremy L Thompson } 1803eaf62fffSJeremy L Thompson } 1804ea61e9acSJeremy L Thompson // Default interface implementation 1805eaf62fffSJeremy L Thompson if (is_composite) { 18062b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1807eaf62fffSJeremy L Thompson } else { 18082b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1809eaf62fffSJeremy L Thompson } 1810d04bbc78SJeremy L Thompson 1811d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1812eaf62fffSJeremy L Thompson } 1813eaf62fffSJeremy L Thompson 1814eaf62fffSJeremy L Thompson /** 1815eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1816eaf62fffSJeremy L Thompson 1817ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1818eaf62fffSJeremy L Thompson 1819ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1820ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the number of entries and their (i, j) 1821ea61e9acSJeremy L Thompson locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1822eaf62fffSJeremy L Thompson 1823eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1824eaf62fffSJeremy L Thompson 1825ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1826f04ea552SJeremy L Thompson 1827eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1828eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1829eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1830eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1831eaf62fffSJeremy L Thompson 1832eaf62fffSJeremy L Thompson @ref User 1833eaf62fffSJeremy L Thompson **/ 18342b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1835eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries; 1836eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1837eaf62fffSJeremy L Thompson bool is_composite; 18382b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1839f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1840eaf62fffSJeremy L Thompson 1841eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1842d04bbc78SJeremy L Thompson // Backend version 18432b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1844eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1845eaf62fffSJeremy L Thompson } else { 1846d04bbc78SJeremy L Thompson // Operator fallback 1847d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1848d04bbc78SJeremy L Thompson 18492b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1850d04bbc78SJeremy L Thompson if (op_fallback) { 18512b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1852eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1853eaf62fffSJeremy L Thompson } 1854eaf62fffSJeremy L Thompson } 1855eaf62fffSJeremy L Thompson 1856eaf62fffSJeremy L Thompson // Default interface implementation 1857eaf62fffSJeremy L Thompson 1858eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1859eaf62fffSJeremy L Thompson *num_entries = 0; 1860eaf62fffSJeremy L Thompson if (is_composite) { 1861c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1862c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 186392ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18642b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1865eaf62fffSJeremy L Thompson *num_entries += single_entries; 1866eaf62fffSJeremy L Thompson } 1867eaf62fffSJeremy L Thompson } else { 18682b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1869eaf62fffSJeremy L Thompson *num_entries += single_entries; 1870eaf62fffSJeremy L Thompson } 18712b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 18722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1873eaf62fffSJeremy L Thompson 1874eaf62fffSJeremy L Thompson // assemble nonzero locations 1875eaf62fffSJeremy L Thompson CeedInt offset = 0; 1876eaf62fffSJeremy L Thompson if (is_composite) { 1877c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1878c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 187992ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18802b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 18812b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1882eaf62fffSJeremy L Thompson offset += single_entries; 1883eaf62fffSJeremy L Thompson } 1884eaf62fffSJeremy L Thompson } else { 18852b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1886eaf62fffSJeremy L Thompson } 1887eaf62fffSJeremy L Thompson 1888eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1889eaf62fffSJeremy L Thompson } 1890eaf62fffSJeremy L Thompson 1891eaf62fffSJeremy L Thompson /** 1892eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1893eaf62fffSJeremy L Thompson 1894ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1895eaf62fffSJeremy L Thompson 1896ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1897ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the values of the nonzero entries to be added, 1898ea61e9acSJeremy L Thompson their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1899eaf62fffSJeremy L Thompson 1900eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1901eaf62fffSJeremy L Thompson 1902ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1903f04ea552SJeremy L Thompson 1904eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1905eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1906eaf62fffSJeremy L Thompson 1907eaf62fffSJeremy L Thompson @ref User 1908eaf62fffSJeremy L Thompson **/ 1909eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1910eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries = 0; 1911eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1912f3d47e36SJeremy L Thompson bool is_composite; 19132b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1914f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1915f3d47e36SJeremy L Thompson 1916f3d47e36SJeremy L Thompson // Early exit for empty operator 1917f3d47e36SJeremy L Thompson if (!is_composite) { 1918f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1919f3d47e36SJeremy L Thompson 1920f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1921f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1922f3d47e36SJeremy L Thompson } 1923eaf62fffSJeremy L Thompson 1924eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1925d04bbc78SJeremy L Thompson // Backend version 19262b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1927eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1928eaf62fffSJeremy L Thompson } else { 1929d04bbc78SJeremy L Thompson // Operator fallback 1930d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1931d04bbc78SJeremy L Thompson 19322b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1933d04bbc78SJeremy L Thompson if (op_fallback) { 19342b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1935eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1936eaf62fffSJeremy L Thompson } 1937eaf62fffSJeremy L Thompson } 1938eaf62fffSJeremy L Thompson 1939eaf62fffSJeremy L Thompson // Default interface implementation 1940eaf62fffSJeremy L Thompson CeedInt offset = 0; 194128ec399dSJeremy L Thompson CeedCall(CeedVectorSetValue(values, 0.0)); 1942eaf62fffSJeremy L Thompson if (is_composite) { 1943c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1944c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1945cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 19462b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 19472b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1948eaf62fffSJeremy L Thompson offset += single_entries; 1949eaf62fffSJeremy L Thompson } 1950eaf62fffSJeremy L Thompson } else { 19512b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1952eaf62fffSJeremy L Thompson } 1953eaf62fffSJeremy L Thompson 1954eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1955eaf62fffSJeremy L Thompson } 1956eaf62fffSJeremy L Thompson 1957eaf62fffSJeremy L Thompson /** 195875f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 195975f0d5a4SJeremy L Thompson 196075f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 196175f0d5a4SJeremy L Thompson 196275f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 196375f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 196475f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 196575f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 196675f0d5a4SJeremy L Thompson 196775f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 196875f0d5a4SJeremy L Thompson 196975f0d5a4SJeremy L Thompson @ref User 197075f0d5a4SJeremy L Thompson **/ 197175f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 197275f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 197375f0d5a4SJeremy L Thompson 197475f0d5a4SJeremy L Thompson Ceed ceed; 1975b275c451SJeremy L Thompson CeedInt num_suboperators; 197675f0d5a4SJeremy L Thompson CeedSize l_vec_len; 197775f0d5a4SJeremy L Thompson CeedScalar *mult_array; 197875f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 1979437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr; 1980b275c451SJeremy L Thompson CeedOperator *sub_operators; 198175f0d5a4SJeremy L Thompson 198275f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 198375f0d5a4SJeremy L Thompson 198475f0d5a4SJeremy L Thompson // Zero mult vector 198575f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 198675f0d5a4SJeremy L Thompson 198775f0d5a4SJeremy L Thompson // Get suboperators 1988b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1989b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1990b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 199175f0d5a4SJeremy L Thompson 199275f0d5a4SJeremy L Thompson // Work vector 199375f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 199475f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 199575f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 199675f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 199775f0d5a4SJeremy L Thompson 199875f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 1999b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 200075f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 200175f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 200275f0d5a4SJeremy L Thompson 200375f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 200475f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 200575f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 200675f0d5a4SJeremy L Thompson } 200775f0d5a4SJeremy L Thompson 200875f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2009437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 2010437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 201175f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 2012437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 2013437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 201475f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 201575f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 201675f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 201775f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 201875f0d5a4SJeremy L Thompson } 201975f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 202075f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 202175f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 202275f0d5a4SJeremy L Thompson } 202375f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2024811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 202575f0d5a4SJeremy L Thompson 202675f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 202775f0d5a4SJeremy L Thompson } 202875f0d5a4SJeremy L Thompson 202975f0d5a4SJeremy L Thompson /** 2030ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2031ea61e9acSJeremy L Thompson grid interpolation 2032eaf62fffSJeremy L Thompson 203358e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2034f04ea552SJeremy L Thompson 2035eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 203685bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2037eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2038eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2039eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 204085bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 204185bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2042eaf62fffSJeremy L Thompson 2043eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2044eaf62fffSJeremy L Thompson 2045eaf62fffSJeremy L Thompson @ref User 2046eaf62fffSJeremy L Thompson **/ 20472b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20482b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 20492b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2050eaf62fffSJeremy L Thompson 205183d6adf3SZach Atkins // Build prolongation matrix, if required 205283d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 205383d6adf3SZach Atkins if (op_prolong || op_restrict) { 205483d6adf3SZach Atkins CeedBasis basis_fine; 20552b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 20562b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 205783d6adf3SZach Atkins } 2058eaf62fffSJeremy L Thompson 2059f113e5dcSJeremy L Thompson // Core code 20602b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2061f113e5dcSJeremy L Thompson 2062eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2063eaf62fffSJeremy L Thompson } 2064eaf62fffSJeremy L Thompson 2065eaf62fffSJeremy L Thompson /** 2066ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2067eaf62fffSJeremy L Thompson 206858e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2069f04ea552SJeremy L Thompson 2070eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 207185bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2072eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2073eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 207485bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2075eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 207685bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 207785bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2078eaf62fffSJeremy L Thompson 2079eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2080eaf62fffSJeremy L Thompson 2081eaf62fffSJeremy L Thompson @ref User 2082eaf62fffSJeremy L Thompson **/ 20832b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20842b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 20852b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 20862b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2087eaf62fffSJeremy L Thompson Ceed ceed; 20882b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2089eaf62fffSJeremy L Thompson 2090eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2091eaf62fffSJeremy L Thompson CeedBasis basis_fine; 20922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2093eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 20942b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 20952b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 2096*6574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2097eaf62fffSJeremy L Thompson 209883d6adf3SZach Atkins // Create coarse to fine basis, if required 209983d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 210083d6adf3SZach Atkins if (op_prolong || op_restrict) { 210183d6adf3SZach Atkins // Check if interpolation matrix is provided 2102*6574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 2103*6574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2104eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 21052b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21062b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21072b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 21082b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 21092b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2110eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 21122b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 21132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 21142b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21152b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21162b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21172b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 211883d6adf3SZach Atkins } 2119eaf62fffSJeremy L Thompson 2120eaf62fffSJeremy L Thompson // Core code 21212b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2122eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2123eaf62fffSJeremy L Thompson } 2124eaf62fffSJeremy L Thompson 2125eaf62fffSJeremy L Thompson /** 2126ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2127eaf62fffSJeremy L Thompson 212858e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2129f04ea552SJeremy L Thompson 2130eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 213185bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2132eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2133eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 213485bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2135eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 213685bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 213785bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2138eaf62fffSJeremy L Thompson 2139eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2140eaf62fffSJeremy L Thompson 2141eaf62fffSJeremy L Thompson @ref User 2142eaf62fffSJeremy L Thompson **/ 21432b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21442b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2145eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 21462b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2147eaf62fffSJeremy L Thompson Ceed ceed; 21482b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2149eaf62fffSJeremy L Thompson 2150eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2151eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21522b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2153eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21542b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21552b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 2156*6574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2157eaf62fffSJeremy L Thompson 2158eaf62fffSJeremy L Thompson // Coarse to fine basis 215983d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 216083d6adf3SZach Atkins if (op_prolong || op_restrict) { 216183d6adf3SZach Atkins // Check if interpolation matrix is provided 2162*6574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 2163*6574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2164eaf62fffSJeremy L Thompson CeedElemTopology topo; 21652b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2166eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 21672b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21682b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21692b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 21702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2171eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 21732b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 21742b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 21752b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21762b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21772b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21782b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 217983d6adf3SZach Atkins } 2180eaf62fffSJeremy L Thompson 2181eaf62fffSJeremy L Thompson // Core code 21822b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2183eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2184eaf62fffSJeremy L Thompson } 2185eaf62fffSJeremy L Thompson 2186eaf62fffSJeremy L Thompson /** 2187ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2188eaf62fffSJeremy L Thompson 2189ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2190859c15bbSJames Wright This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$. 2191859c15bbSJames Wright The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T 2192859c15bbSJames Wright \hat S V\f$. The CeedOperator must be linear and non-composite. The associated CeedQFunction must therefore also be linear. 2193eaf62fffSJeremy L Thompson 2194ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2195f04ea552SJeremy L Thompson 2196ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2197ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2198ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2199eaf62fffSJeremy L Thompson 2200eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2201eaf62fffSJeremy L Thompson 2202480fae85SJeremy L Thompson @ref User 2203eaf62fffSJeremy L Thompson **/ 22042b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 22052b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2206eaf62fffSJeremy L Thompson 2207eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2208d04bbc78SJeremy L Thompson // Backend version 22092b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2210eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2211eaf62fffSJeremy L Thompson } else { 2212d04bbc78SJeremy L Thompson // Operator fallback 2213d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2214d04bbc78SJeremy L Thompson 22152b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2216d04bbc78SJeremy L Thompson if (op_fallback) { 22172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2218eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2219eaf62fffSJeremy L Thompson } 2220eaf62fffSJeremy L Thompson } 2221eaf62fffSJeremy L Thompson 2222d04bbc78SJeremy L Thompson // Default interface implementation 2223eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 22242b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 22252b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2226eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2227eaf62fffSJeremy L Thompson CeedQFunction qf; 22282b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2229eaf62fffSJeremy L Thompson 2230eaf62fffSJeremy L Thompson // Determine active input basis 2231eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2232eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2233eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2234eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2235eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2236eaf62fffSJeremy L Thompson CeedInt num_input_fields; 22372b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 22382b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2239eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2240eaf62fffSJeremy L Thompson CeedVector vec; 22412b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2242eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2243eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 22442b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2245eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2246eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 22472b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 22482b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2249eaf62fffSJeremy L Thompson } 2250eaf62fffSJeremy L Thompson } 2251*6574a04fSJeremy L Thompson CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set"); 2252e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2253352a5e7cSSebastian Grimberg CeedInt P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1; 22542b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 2255352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(basis, &num_nodes)); 22562b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 22572b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 22582b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 22592b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 22602b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 22612b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2262eaf62fffSJeremy L Thompson 2263eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 2264*6574a04fSJeremy L Thompson bool is_tensor_basis; 2265*6574a04fSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis)); 2266*6574a04fSJeremy L Thompson CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2267eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 22682b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 22692b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 22702b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 22712b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 22722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2273eaf62fffSJeremy L Thompson // -- Build matrices 2274eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 22752b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 22762b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 22772b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 22782b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2279eaf62fffSJeremy L Thompson 2280eaf62fffSJeremy L Thompson // -- Diagonalize 22812b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 22822b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 22832b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 22842b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 22852b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 22862b730f8bSJeremy L Thompson } 22872b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2288eaf62fffSJeremy L Thompson 2289eaf62fffSJeremy L Thompson // Assemble QFunction 2290eaf62fffSJeremy L Thompson CeedVector assembled; 2291eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qf; 22922b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2293eaf62fffSJeremy L Thompson CeedInt layout[3]; 22942b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 22952b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2296eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 22972b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2298eaf62fffSJeremy L Thompson 2299eaf62fffSJeremy L Thompson // Calculate element averages 2300eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2301eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2302eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2303eaf62fffSJeremy L Thompson CeedVector q_weight; 23042b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 23052b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 23062b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 23072b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 23082b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2309eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2310eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2311eaf62fffSJeremy L Thompson CeedInt count = 0; 23122b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 23132b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 23142b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 23152b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2316eaf62fffSJeremy L Thompson count++; 2317eaf62fffSJeremy L Thompson } 23182b730f8bSJeremy L Thompson } 23192b730f8bSJeremy L Thompson } 2320eaf62fffSJeremy L Thompson if (count) { 2321eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2322eaf62fffSJeremy L Thompson } else { 2323eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2324eaf62fffSJeremy L Thompson } 2325eaf62fffSJeremy L Thompson } 23262b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 23272b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 23282b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 23292b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2330eaf62fffSJeremy L Thompson 2331eaf62fffSJeremy L Thompson // Build FDM diagonal 2332eaf62fffSJeremy L Thompson CeedVector q_data; 2333eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 2334352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal)); 2335352a5e7cSSebastian Grimberg const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON; 23362b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2337352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 2338352a5e7cSSebastian Grimberg if (interp) fdm_diagonal[c * num_nodes + n] = 1.0; 23392b730f8bSJeremy L Thompson if (grad) { 2340eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2341eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2342352a5e7cSSebastian Grimberg fdm_diagonal[c * num_nodes + n] += lambda[i]; 2343eaf62fffSJeremy L Thompson } 2344eaf62fffSJeremy L Thompson } 2345352a5e7cSSebastian Grimberg if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound; 23462b730f8bSJeremy L Thompson } 23472b730f8bSJeremy L Thompson } 2348352a5e7cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data)); 23492b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 23502b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 23512b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 23522b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2353352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]); 23542b730f8bSJeremy L Thompson } 23552b730f8bSJeremy L Thompson } 23562b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 23572b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 23582b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2359eaf62fffSJeremy L Thompson 2360eaf62fffSJeremy L Thompson // Setup FDM operator 2361eaf62fffSJeremy L Thompson // -- Basis 2362eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2363eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 23642b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 23652b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 23662b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 23672b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 23682b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 23692b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 23702b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 23712b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 23722b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2373eaf62fffSJeremy L Thompson 2374eaf62fffSJeremy L Thompson // -- Restriction 2375eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2376352a5e7cSSebastian Grimberg CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp}; 2377352a5e7cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i)); 2378eaf62fffSJeremy L Thompson // -- QFunction 2379eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 23802b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 23812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 23822b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 23832b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 23842b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2385eaf62fffSJeremy L Thompson // -- QFunction context 2386eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 23872b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2388eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2389eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 23902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 23912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 23922b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 23932b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2394eaf62fffSJeremy L Thompson // -- Operator 23952b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 23962b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 23972b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 23982b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2399eaf62fffSJeremy L Thompson 2400eaf62fffSJeremy L Thompson // Cleanup 24012b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 24022b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 24032b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 24042b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2405eaf62fffSJeremy L Thompson 2406eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2407eaf62fffSJeremy L Thompson } 2408eaf62fffSJeremy L Thompson 2409eaf62fffSJeremy L Thompson /// @} 2410