13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 82b730f8bSJeremy L Thompson #include <ceed-impl.h> 949aac155SJeremy L Thompson #include <ceed.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 11c85e8640SSebastian Grimberg #include <assert.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 441862681bSJeremy Luke Thompson char *source_path_with_name = NULL; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 119437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 123437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127febe2972SJeremy L Thompson if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 1289e77b9c8SJeremy L Thompson // Cleanup 1292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 132805fe78eSJeremy L Thompson } 1332b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1342b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 135*b05f7e9fSJeremy L Thompson // Note: No ref-counting here so we don't get caught in a reference loop. 136*b05f7e9fSJeremy L Thompson // The op holds the only reference to op_fallback and is responsible for deleting itself and op_fallback. 137805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 138*b05f7e9fSJeremy L Thompson op_fallback->op_fallback_parent = op; 139eaf62fffSJeremy L Thompson 140eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 141eaf62fffSJeremy L Thompson } 142eaf62fffSJeremy L Thompson 143eaf62fffSJeremy L Thompson /** 144ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 145d04bbc78SJeremy L Thompson 146d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 147d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 148d04bbc78SJeremy L Thompson 149d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 150d04bbc78SJeremy L Thompson 151d04bbc78SJeremy L Thompson @ref Developer 152d04bbc78SJeremy L Thompson **/ 153d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 154d04bbc78SJeremy L Thompson // Create if needed 155d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1562b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 157d04bbc78SJeremy L Thompson } 158d04bbc78SJeremy L Thompson if (op->op_fallback) { 159d04bbc78SJeremy L Thompson bool is_debug; 160d04bbc78SJeremy L Thompson 1612b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 162d04bbc78SJeremy L Thompson if (is_debug) { 163b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 164d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 165d04bbc78SJeremy L Thompson 166b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 167b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 168b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1692b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 170d04bbc78SJeremy L Thompson 17123d4529eSJeremy L Thompson CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n"); 172b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1732b730f8bSJeremy L Thompson op->op_fallback); 174d04bbc78SJeremy L Thompson } 175d04bbc78SJeremy L Thompson } 176d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 177d04bbc78SJeremy L Thompson 178d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 179d04bbc78SJeremy L Thompson } 180d04bbc78SJeremy L Thompson 181d04bbc78SJeremy L Thompson /** 182eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 183eaf62fffSJeremy L Thompson 184352a5e7cSSebastian Grimberg @param[in] basis CeedBasis from which to get the basis matrix 185eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 186eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 187eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 188eaf62fffSJeremy L Thompson 189eaf62fffSJeremy L Thompson @ref Developer 190eaf62fffSJeremy L Thompson **/ 191352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) { 192eaf62fffSJeremy L Thompson switch (eval_mode) { 193eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 194eaf62fffSJeremy L Thompson *basis_ptr = identity; 195eaf62fffSJeremy L Thompson break; 196eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 197352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetInterp(basis, basis_ptr)); 198eaf62fffSJeremy L Thompson break; 199eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 200352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetGrad(basis, basis_ptr)); 201352a5e7cSSebastian Grimberg break; 202352a5e7cSSebastian Grimberg case CEED_EVAL_DIV: 203352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDiv(basis, basis_ptr)); 204352a5e7cSSebastian Grimberg break; 205352a5e7cSSebastian Grimberg case CEED_EVAL_CURL: 206352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetCurl(basis, basis_ptr)); 207eaf62fffSJeremy L Thompson break; 208eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 209eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 210eaf62fffSJeremy L Thompson } 211ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 212352a5e7cSSebastian Grimberg 213352a5e7cSSebastian Grimberg return CEED_ERROR_SUCCESS; 214eaf62fffSJeremy L Thompson } 215eaf62fffSJeremy L Thompson 216eaf62fffSJeremy L Thompson /** 217eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 218eaf62fffSJeremy L Thompson 219eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 220ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 221eaf62fffSJeremy L Thompson 222eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 223eaf62fffSJeremy L Thompson 224eaf62fffSJeremy L Thompson @ref Developer 225eaf62fffSJeremy L Thompson **/ 2262b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 227eaf62fffSJeremy L Thompson Ceed ceed; 2282b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 229eaf62fffSJeremy L Thompson const CeedInt *offsets; 2302b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 231eaf62fffSJeremy L Thompson 232eaf62fffSJeremy L Thompson // Expand offsets 2337b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2347b63f5c6SJed Brown CeedSize l_size; 2352b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2362b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2372b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2382b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2392b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 240eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2412b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2422b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 243eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 244eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 245eaf62fffSJeremy L Thompson } 246eaf62fffSJeremy L Thompson 247eaf62fffSJeremy L Thompson // Create new restriction 2482b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2492b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 250eaf62fffSJeremy L Thompson 251eaf62fffSJeremy L Thompson // Cleanup 2522b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 253eaf62fffSJeremy L Thompson 254eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 255eaf62fffSJeremy L Thompson } 256eaf62fffSJeremy L Thompson 257eaf62fffSJeremy L Thompson /** 258eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 259eaf62fffSJeremy L Thompson 260eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 261ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 262eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 263eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 264eaf62fffSJeremy L Thompson 265eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 266eaf62fffSJeremy L Thompson 267eaf62fffSJeremy L Thompson @ref Developer 268eaf62fffSJeremy L Thompson **/ 2692b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 270eaf62fffSJeremy L Thompson Ceed ceed; 2712b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 272eaf62fffSJeremy L Thompson 273eaf62fffSJeremy L Thompson // Assemble QFunction 274eaf62fffSJeremy L Thompson CeedQFunction qf; 275437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 276c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 277c5f45aeaSJeremy L Thompson CeedElemRestriction assembled_elem_rstr = NULL; 278437c7c90SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 279eaf62fffSJeremy L Thompson CeedInt layout[3]; 280437c7c90SJeremy L Thompson 281437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 282437c7c90SJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 283437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 284437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout)); 285437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 286437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 287eaf62fffSJeremy L Thompson 288ed9e99e6SJeremy L Thompson // Get assembly data 289ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 290437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 291437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 292437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 293437c7c90SJeremy L Thompson CeedBasis *active_bases; 294437c7c90SJeremy L Thompson CeedElemRestriction *active_elem_rstrs; 295437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 296437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 297437c7c90SJeremy L Thompson &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components)); 298437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL)); 299437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs)); 300437c7c90SJeremy L Thompson 301437c7c90SJeremy L Thompson // Loop over all active bases 302437c7c90SJeremy L Thompson for (CeedInt b = 0; b < num_active_bases; b++) { 303eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 304437c7c90SJeremy L Thompson CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b]; 305437c7c90SJeremy L Thompson 306eaf62fffSJeremy L Thompson if (is_pointblock) { 307437c7c90SJeremy L Thompson CeedElemRestriction point_block_elem_rstr; 308437c7c90SJeremy L Thompson 309437c7c90SJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr)); 310437c7c90SJeremy L Thompson diag_elem_rstr = point_block_elem_rstr; 311eaf62fffSJeremy L Thompson } 312eaf62fffSJeremy L Thompson 313eaf62fffSJeremy L Thompson // Create diagonal vector 314eaf62fffSJeremy L Thompson CeedVector elem_diag; 315437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 316eaf62fffSJeremy L Thompson 317eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3189c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 319437c7c90SJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts, num_components; 320437c7c90SJeremy L Thompson 3212b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3222b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 323437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 324437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes)); 325437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components)); 326437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts)); 327ed9e99e6SJeremy L Thompson 328352a5e7cSSebastian Grimberg // Construct identity matrix for basis if required 329ed9e99e6SJeremy L Thompson bool has_eval_none = false; 330352a5e7cSSebastian Grimberg CeedScalar *identity = NULL; 331437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 332437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 333ed9e99e6SJeremy L Thompson } 334437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 335437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 336ed9e99e6SJeremy L Thompson } 337ed9e99e6SJeremy L Thompson if (has_eval_none) { 3382b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3392b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 340eaf62fffSJeremy L Thompson } 341352a5e7cSSebastian Grimberg 342eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 343eaf62fffSJeremy L Thompson // Each element 344b94338b9SJed Brown for (CeedSize e = 0; e < num_elem; e++) { 345eaf62fffSJeremy L Thompson // Each basis eval mode pair 346352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 347352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 348437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 349437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 350352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t); 351352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out)); 352352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 353352a5e7cSSebastian Grimberg if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 354352a5e7cSSebastian Grimberg else B_t = &B_t[(++d_out) * num_qpts * num_nodes]; 355352a5e7cSSebastian Grimberg } 356352a5e7cSSebastian Grimberg eval_mode_out_prev = eval_modes_out[b][e_out]; 357352a5e7cSSebastian Grimberg 358352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 359352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 360437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 361437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 362352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B); 363352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in)); 364352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 365352a5e7cSSebastian Grimberg if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 366352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 367352a5e7cSSebastian Grimberg } 368352a5e7cSSebastian Grimberg eval_mode_in_prev = eval_modes_in[b][e_in]; 369352a5e7cSSebastian Grimberg 370eaf62fffSJeremy L Thompson // Each component 371437c7c90SJeremy L Thompson for (CeedInt c_out = 0; c_out < num_components; c_out++) { 372437c7c90SJeremy L Thompson // Each qpt/node pair 3732b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 374eaf62fffSJeremy L Thompson if (is_pointblock) { 375eaf62fffSJeremy L Thompson // Point Block Diagonal 376437c7c90SJeremy L Thompson for (CeedInt c_in = 0; c_in < num_components; c_in++) { 377b94338b9SJed Brown const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 378437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3792b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 380437c7c90SJeremy L Thompson elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] += 381437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 382eaf62fffSJeremy L Thompson } 3832b730f8bSJeremy L Thompson } 384eaf62fffSJeremy L Thompson } else { 385eaf62fffSJeremy L Thompson // Diagonal Only 386437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 387437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3882b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 389437c7c90SJeremy L Thompson elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 390eaf62fffSJeremy L Thompson } 391eaf62fffSJeremy L Thompson } 392eaf62fffSJeremy L Thompson } 393eaf62fffSJeremy L Thompson } 3942b730f8bSJeremy L Thompson } 3952b730f8bSJeremy L Thompson } 3962b730f8bSJeremy L Thompson } 3972b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 398eaf62fffSJeremy L Thompson 399eaf62fffSJeremy L Thompson // Assemble local operator diagonal 400f30b1135SSebastian Grimberg CeedCall(CeedElemRestrictionApplyUnsigned(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 401eaf62fffSJeremy L Thompson 402eaf62fffSJeremy L Thompson // Cleanup 403437c7c90SJeremy L Thompson if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 4042b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 4052b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 406437c7c90SJeremy L Thompson } 407437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 408437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 409eaf62fffSJeremy L Thompson 410eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 411eaf62fffSJeremy L Thompson } 412eaf62fffSJeremy L Thompson 413eaf62fffSJeremy L Thompson /** 414eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 415eaf62fffSJeremy L Thompson 416eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 417ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 418eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 419eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 420eaf62fffSJeremy L Thompson 421eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 422eaf62fffSJeremy L Thompson 423eaf62fffSJeremy L Thompson @ref Developer 424eaf62fffSJeremy L Thompson **/ 4252b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 426eaf62fffSJeremy L Thompson CeedVector assembled) { 427eaf62fffSJeremy L Thompson CeedInt num_sub; 428eaf62fffSJeremy L Thompson CeedOperator *suboperators; 429c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 430c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 431eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4326aa95790SJeremy L Thompson if (is_pointblock) { 4332b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4346aa95790SJeremy L Thompson } else { 4352b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4366aa95790SJeremy L Thompson } 437eaf62fffSJeremy L Thompson } 438eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 439eaf62fffSJeremy L Thompson } 440eaf62fffSJeremy L Thompson 441eaf62fffSJeremy L Thompson /** 442eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 443eaf62fffSJeremy L Thompson 444eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 445eaf62fffSJeremy L Thompson 4463bdd4e5aSSebastian Grimberg Note: For operators using oriented element restrictions, entries in rows or cols may be negative indicating the assembled value at this nonzero 4473bdd4e5aSSebastian Grimberg should be negated 448f30b1135SSebastian Grimberg 449eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 450eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 451eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 452eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 453eaf62fffSJeremy L Thompson 454eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 455eaf62fffSJeremy L Thompson 456eaf62fffSJeremy L Thompson @ref Developer 457eaf62fffSJeremy L Thompson **/ 4582b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 459f3d47e36SJeremy L Thompson Ceed ceed; 460f3d47e36SJeremy L Thompson bool is_composite; 461f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 462f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 463f3d47e36SJeremy L Thompson 4646574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 465eaf62fffSJeremy L Thompson 466c9366a6bSJeremy L Thompson CeedSize num_nodes; 4672b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 468eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4692b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 470e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4712b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4722b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4732b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 474eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4752b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 476eaf62fffSJeremy L Thompson 477eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 478eaf62fffSJeremy L Thompson 479eaf62fffSJeremy L Thompson // Determine elem_dof relation 480eaf62fffSJeremy L Thompson CeedVector index_vec; 4812b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 482eaf62fffSJeremy L Thompson CeedScalar *array; 4832b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 484ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4852b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 486eaf62fffSJeremy L Thompson CeedVector elem_dof; 4872b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4882b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4892b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 490eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4912b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4922b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 493eaf62fffSJeremy L Thompson 494eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 495b94338b9SJed Brown CeedSize count = 0; 496ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 497ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 498ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 499ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 500ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 5012b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 5022b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 503eaf62fffSJeremy L Thompson 504eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 505eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 506eaf62fffSJeremy L Thompson 507eaf62fffSJeremy L Thompson rows[offset + count] = row; 508eaf62fffSJeremy L Thompson cols[offset + count] = col; 509eaf62fffSJeremy L Thompson count++; 510eaf62fffSJeremy L Thompson } 511eaf62fffSJeremy L Thompson } 512eaf62fffSJeremy L Thompson } 513eaf62fffSJeremy L Thompson } 514eaf62fffSJeremy L Thompson } 5156574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 5162b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5172b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 518eaf62fffSJeremy L Thompson 519eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 520eaf62fffSJeremy L Thompson } 521eaf62fffSJeremy L Thompson 522eaf62fffSJeremy L Thompson /** 523eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 524eaf62fffSJeremy L Thompson 525eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 526eaf62fffSJeremy L Thompson 527eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 528ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 529eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 530eaf62fffSJeremy L Thompson 531eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 532eaf62fffSJeremy L Thompson 533eaf62fffSJeremy L Thompson @ref Developer 534eaf62fffSJeremy L Thompson **/ 5352b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 536f3d47e36SJeremy L Thompson Ceed ceed; 537f3d47e36SJeremy L Thompson bool is_composite; 538f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 539f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 540f3d47e36SJeremy L Thompson 5416574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 542f3d47e36SJeremy L Thompson 543f3d47e36SJeremy L Thompson // Early exit for empty operator 544f3d47e36SJeremy L Thompson { 545f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 546f3d47e36SJeremy L Thompson 547f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 548f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 549f3d47e36SJeremy L Thompson } 550eaf62fffSJeremy L Thompson 551cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 552cefa2673SJeremy L Thompson // Backend version 5532b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 554cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 555cefa2673SJeremy L Thompson } else { 556cefa2673SJeremy L Thompson // Operator fallback 557cefa2673SJeremy L Thompson CeedOperator op_fallback; 558cefa2673SJeremy L Thompson 5592b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 560cefa2673SJeremy L Thompson if (op_fallback) { 5612b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 562cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 563cefa2673SJeremy L Thompson } 564cefa2673SJeremy L Thompson } 565cefa2673SJeremy L Thompson 566eaf62fffSJeremy L Thompson // Assemble QFunction 567eaf62fffSJeremy L Thompson CeedQFunction qf; 5682b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 569c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 570c5f45aeaSJeremy L Thompson CeedElemRestriction rstr_q = NULL; 5712b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5721f9221feSJeremy L Thompson CeedSize qf_length; 5732b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 574eaf62fffSJeremy L Thompson 5757e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 576eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 577eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5782b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 579eaf62fffSJeremy L Thompson 580ed9e99e6SJeremy L Thompson // Get assembly data 581ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5822b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 583437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 584437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 585437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out, 586437c7c90SJeremy L Thompson &eval_modes_out, NULL, NULL)); 587437c7c90SJeremy L Thompson CeedBasis *bases; 588437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL)); 589437c7c90SJeremy L Thompson CeedBasis basis_in = bases[0]; 590eaf62fffSJeremy L Thompson 5916574a04fSJeremy L Thompson CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases"); 5926574a04fSJeremy L Thompson CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 593eaf62fffSJeremy L Thompson 594ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 595eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5962b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5972b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5982b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 5992b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 6002b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 601eaf62fffSJeremy L Thompson 602eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 603eaf62fffSJeremy L Thompson 604eaf62fffSJeremy L Thompson // loop over elements and put in data structure 605eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6062b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 607eaf62fffSJeremy L Thompson 608eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6092b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6102b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 611eaf62fffSJeremy L Thompson 612eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 613437c7c90SJeremy L Thompson const CeedScalar **B_mats_in, **B_mats_out; 614437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out)); 615437c7c90SJeremy L Thompson const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0]; 616437c7c90SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]]; 617eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 618b94338b9SJed Brown CeedSize count = 0; 619eaf62fffSJeremy L Thompson CeedScalar *vals; 62028ec399dSJeremy L Thompson CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals)); 621b94338b9SJed Brown for (CeedSize e = 0; e < num_elem; e++) { 622ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 623ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 624ed9e99e6SJeremy L Thompson // Compute B^T*D 625b94338b9SJed Brown for (CeedSize n = 0; n < elem_size; n++) { 626b94338b9SJed Brown for (CeedSize q = 0; q < num_qpts; q++) { 627437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 628b94338b9SJed Brown const CeedSize btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in); 629067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 630437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 631b94338b9SJed Brown const CeedSize b_out_index = (num_eval_modes_out[0] * q + e_out) * elem_size + n; 632b94338b9SJed Brown const CeedSize eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out; 633b94338b9SJed Brown const CeedSize qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 634067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 635eaf62fffSJeremy L Thompson } 636067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 637ed9e99e6SJeremy L Thompson } 638ed9e99e6SJeremy L Thompson } 639eaf62fffSJeremy L Thompson } 640eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 641437c7c90SJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0])); 642eaf62fffSJeremy L Thompson 643eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 644ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 645ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 646eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 647eaf62fffSJeremy L Thompson count++; 648eaf62fffSJeremy L Thompson } 649eaf62fffSJeremy L Thompson } 650eaf62fffSJeremy L Thompson } 651eaf62fffSJeremy L Thompson } 652eaf62fffSJeremy L Thompson } 6536574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries"); 6542b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 655eaf62fffSJeremy L Thompson 6562b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6572b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 658eaf62fffSJeremy L Thompson 659eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 660eaf62fffSJeremy L Thompson } 661eaf62fffSJeremy L Thompson 662eaf62fffSJeremy L Thompson /** 663eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 664eaf62fffSJeremy L Thompson 665eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 666eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 667eaf62fffSJeremy L Thompson 668eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 669eaf62fffSJeremy L Thompson 670eaf62fffSJeremy L Thompson @ref Utility 671eaf62fffSJeremy L Thompson **/ 672b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) { 673b275c451SJeremy L Thompson bool is_composite; 674eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 675eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 676eaf62fffSJeremy L Thompson 677b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 6786574a04fSJeremy L Thompson CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 6792b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6802b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6812b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6822b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 683b94338b9SJed Brown *num_entries = (CeedSize)elem_size * num_comp * elem_size * num_comp * num_elem; 684eaf62fffSJeremy L Thompson 685eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 686eaf62fffSJeremy L Thompson } 687eaf62fffSJeremy L Thompson 688eaf62fffSJeremy L Thompson /** 689ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 690eaf62fffSJeremy L Thompson 691eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 69285bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 693eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 694eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 69585bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 696eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 69785bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 69885bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 699eaf62fffSJeremy L Thompson 700eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 701eaf62fffSJeremy L Thompson 702eaf62fffSJeremy L Thompson @ref Developer 703eaf62fffSJeremy L Thompson **/ 7042b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7052b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 706eaf62fffSJeremy L Thompson Ceed ceed; 70785bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 708c17ec2beSJeremy L Thompson CeedElemRestriction rstr_p_mult_fine = NULL; 7092b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 710eaf62fffSJeremy L Thompson 711eaf62fffSJeremy L Thompson // Check for composite operator 712eaf62fffSJeremy L Thompson bool is_composite; 7132b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 7146574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 715eaf62fffSJeremy L Thompson 716eaf62fffSJeremy L Thompson // Coarse Grid 7172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 718eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 719eaf62fffSJeremy L Thompson // -- Clone input fields 72092ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 721eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 722437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 7232b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 724eaf62fffSJeremy L Thompson } else { 725437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 7262b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 727eaf62fffSJeremy L Thompson } 728eaf62fffSJeremy L Thompson } 729eaf62fffSJeremy L Thompson // -- Clone output fields 73092ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 731eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7322b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 733eaf62fffSJeremy L Thompson } else { 734437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 7352b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 736eaf62fffSJeremy L Thompson } 737eaf62fffSJeremy L Thompson } 738af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7392b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 740eaf62fffSJeremy L Thompson 741eaf62fffSJeremy L Thompson // Multiplicity vector 74285bb9dcfSJeremy L Thompson if (op_restrict || op_prolong) { 74385bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 74485bb9dcfSJeremy L Thompson 745c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine)); 7466574a04fSJeremy L Thompson CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 7472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7482b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 749c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7502b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 751c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7522b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7532b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 75485bb9dcfSJeremy L Thompson } 755eaf62fffSJeremy L Thompson 756addd79feSZach Atkins // Clone name 757addd79feSZach Atkins bool has_name = op_fine->name; 758addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 759addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 760addd79feSZach Atkins 76183d6adf3SZach Atkins // Check that coarse to fine basis is provided if prolong/restrict operators are requested 7626574a04fSJeremy L Thompson CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE, 7636574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine basis"); 76483d6adf3SZach Atkins 76585bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 766eaf62fffSJeremy L Thompson CeedInt num_comp; 7672b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 768addd79feSZach Atkins 769addd79feSZach Atkins // Restriction 770addd79feSZach Atkins if (op_restrict) { 771eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 77285bb9dcfSJeremy L Thompson CeedQFunction qf_restrict; 77385bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 77485bb9dcfSJeremy L Thompson 77585bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 7762b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 777eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 7782b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7802b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7822b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7832b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7842b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7852b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 786eaf62fffSJeremy L Thompson 7872b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7882b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 789c17ec2beSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec)); 7902b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 791eaf62fffSJeremy L Thompson 792addd79feSZach Atkins // Set name 793addd79feSZach Atkins char *restriction_name; 794addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 795addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 796addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 797addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 798addd79feSZach Atkins 799addd79feSZach Atkins // Check 800addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_restrict)); 801addd79feSZach Atkins 802addd79feSZach Atkins // Cleanup 803addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_restrict)); 804addd79feSZach Atkins } 805addd79feSZach Atkins 806eaf62fffSJeremy L Thompson // Prolongation 807addd79feSZach Atkins if (op_prolong) { 808eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 80985bb9dcfSJeremy L Thompson CeedQFunction qf_prolong; 81085bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 81185bb9dcfSJeremy L Thompson 81285bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 8132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 814eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 8152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 8162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 8172b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 8182b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8192b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8202b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8212b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8222b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 823eaf62fffSJeremy L Thompson 8242b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8252b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 826c17ec2beSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8272b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 828eaf62fffSJeremy L Thompson 829addd79feSZach Atkins // Set name 830ea6b5821SJeremy L Thompson char *prolongation_name; 8312b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8322b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8332b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8342b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 835addd79feSZach Atkins 836addd79feSZach Atkins // Check 837addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 838addd79feSZach Atkins 839addd79feSZach Atkins // Cleanup 840addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 841ea6b5821SJeremy L Thompson } 842ea6b5821SJeremy L Thompson 84358e4b056SJeremy L Thompson // Check 84458e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 84558e4b056SJeremy L Thompson 846eaf62fffSJeremy L Thompson // Cleanup 8472b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 848c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine)); 8492b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 850805fe78eSJeremy L Thompson 851eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 852eaf62fffSJeremy L Thompson } 853eaf62fffSJeremy L Thompson 854eaf62fffSJeremy L Thompson /** 855eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 856eaf62fffSJeremy L Thompson 857eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 858eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 859eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 860eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 861eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 862eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 863eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 864eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 865eaf62fffSJeremy L Thompson 866eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 867eaf62fffSJeremy L Thompson 868eaf62fffSJeremy L Thompson @ref Developer 869eaf62fffSJeremy L Thompson **/ 8702c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff 8712c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d, 8722c2ea1dbSJeremy L Thompson CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8732b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 874eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 875eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8762b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 877eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 878eaf62fffSJeremy L Thompson } 8792b730f8bSJeremy L Thompson } 880eaf62fffSJeremy L Thompson // -- Laplacian 8812b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 882eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 883eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8842b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 885eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 886eaf62fffSJeremy L Thompson } 8872b730f8bSJeremy L Thompson } 888eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8892b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 890eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 891eaf62fffSJeremy L Thompson } 8922c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn 893eaf62fffSJeremy L Thompson 894eaf62fffSJeremy L Thompson /// @} 895eaf62fffSJeremy L Thompson 896eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 897480fae85SJeremy L Thompson /// CeedOperator Backend API 898480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 899480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 900480fae85SJeremy L Thompson /// @{ 901480fae85SJeremy L Thompson 902480fae85SJeremy L Thompson /** 903480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 904480fae85SJeremy L Thompson 905480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 906ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 907480fae85SJeremy L Thompson 908480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 909480fae85SJeremy L Thompson 910480fae85SJeremy L Thompson @ref Backend 911480fae85SJeremy L Thompson **/ 912ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 914480fae85SJeremy L Thompson (*data)->ref_count = 1; 915480fae85SJeremy L Thompson (*data)->ceed = ceed; 9162b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 917480fae85SJeremy L Thompson 918480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 919480fae85SJeremy L Thompson } 920480fae85SJeremy L Thompson 921480fae85SJeremy L Thompson /** 922480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 923480fae85SJeremy L Thompson 924ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 925480fae85SJeremy L Thompson 926480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 927480fae85SJeremy L Thompson 928480fae85SJeremy L Thompson @ref Backend 929480fae85SJeremy L Thompson **/ 930480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 931480fae85SJeremy L Thompson data->ref_count++; 932480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 933480fae85SJeremy L Thompson } 934480fae85SJeremy L Thompson 935480fae85SJeremy L Thompson /** 936beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9378b919e6bSJeremy L Thompson 938ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 939ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9408b919e6bSJeremy L Thompson 9418b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9428b919e6bSJeremy L Thompson 9438b919e6bSJeremy L Thompson @ref Backend 9448b919e6bSJeremy L Thompson **/ 9452b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 946beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 947beecbf24SJeremy L Thompson data->needs_data_update = true; 948beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 949beecbf24SJeremy L Thompson } 950beecbf24SJeremy L Thompson 951beecbf24SJeremy L Thompson /** 952beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 953beecbf24SJeremy L Thompson 954ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 955ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 956beecbf24SJeremy L Thompson 957beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 958beecbf24SJeremy L Thompson 959beecbf24SJeremy L Thompson @ref Backend 960beecbf24SJeremy L Thompson **/ 9612b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 962beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9638b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9648b919e6bSJeremy L Thompson } 9658b919e6bSJeremy L Thompson 9668b919e6bSJeremy L Thompson /** 9678b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9688b919e6bSJeremy L Thompson 9698b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9708b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9718b919e6bSJeremy L Thompson 9728b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9738b919e6bSJeremy L Thompson 9748b919e6bSJeremy L Thompson @ref Backend 9758b919e6bSJeremy L Thompson **/ 9762b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 977beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9788b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9798b919e6bSJeremy L Thompson } 9808b919e6bSJeremy L Thompson 9818b919e6bSJeremy L Thompson /** 982ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 9834385fb7fSSebastian Grimberg 984ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 985512bb800SJeremy L Thompson 986512bb800SJeremy L Thompson Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a 987512bb800SJeremy L Thompson CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this 988512bb800SJeremy L Thompson CeedQFunctionAssemblyData. 989480fae85SJeremy L Thompson 990ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 991ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 992480fae85SJeremy L Thompson 993480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 994480fae85SJeremy L Thompson 995480fae85SJeremy L Thompson @ref Backend 996480fae85SJeremy L Thompson **/ 9972b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 9982b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 9992b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 1000480fae85SJeremy L Thompson *data_copy = data; 1001480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1002480fae85SJeremy L Thompson } 1003480fae85SJeremy L Thompson 1004480fae85SJeremy L Thompson /** 1005480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 1006480fae85SJeremy L Thompson 1007ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1008480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1009480fae85SJeremy L Thompson 1010480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1011480fae85SJeremy L Thompson 1012480fae85SJeremy L Thompson @ref Backend 1013480fae85SJeremy L Thompson **/ 10142b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1015480fae85SJeremy L Thompson *is_setup = data->is_setup; 1016480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1017480fae85SJeremy L Thompson } 1018480fae85SJeremy L Thompson 1019480fae85SJeremy L Thompson /** 1020480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1021480fae85SJeremy L Thompson 1022ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1023480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1024480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1025480fae85SJeremy L Thompson 1026480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1027480fae85SJeremy L Thompson 1028480fae85SJeremy L Thompson @ref Backend 1029480fae85SJeremy L Thompson **/ 10302b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10312b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10322b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1033480fae85SJeremy L Thompson 1034480fae85SJeremy L Thompson data->is_setup = true; 1035480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1036480fae85SJeremy L Thompson } 1037480fae85SJeremy L Thompson 10382b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 10396574a04fSJeremy L Thompson CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1040480fae85SJeremy L Thompson 10412b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10422b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1043480fae85SJeremy L Thompson 1044480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1045480fae85SJeremy L Thompson } 1046480fae85SJeremy L Thompson 1047480fae85SJeremy L Thompson /** 1048480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1049480fae85SJeremy L Thompson 1050ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1051480fae85SJeremy L Thompson 1052480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1053480fae85SJeremy L Thompson 1054480fae85SJeremy L Thompson @ref Backend 1055480fae85SJeremy L Thompson **/ 1056480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1057ad6481ceSJeremy L Thompson if (!*data || --(*data)->ref_count > 0) { 1058ad6481ceSJeremy L Thompson *data = NULL; 1059ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1060ad6481ceSJeremy L Thompson } 10612b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10622b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10632b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1064480fae85SJeremy L Thompson 10652b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1066480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1067480fae85SJeremy L Thompson } 1068480fae85SJeremy L Thompson 1069ed9e99e6SJeremy L Thompson /** 1070ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1071ed9e99e6SJeremy L Thompson 1072ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1073ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1074ed9e99e6SJeremy L Thompson 1075ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1076ed9e99e6SJeremy L Thompson 1077ed9e99e6SJeremy L Thompson @ref Backend 1078ed9e99e6SJeremy L Thompson **/ 10792b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1080ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1081ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1082ed9e99e6SJeremy L Thompson 10832b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1084ed9e99e6SJeremy L Thompson op->op_assembled = data; 1085ed9e99e6SJeremy L Thompson } 1086ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1087ed9e99e6SJeremy L Thompson 1088ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1089ed9e99e6SJeremy L Thompson } 1090ed9e99e6SJeremy L Thompson 1091ed9e99e6SJeremy L Thompson /** 1092ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1093ba746a46SJeremy L Thompson 1094ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1095ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1096ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1097ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1098ba746a46SJeremy L Thompson CeedEvalMode. 1099ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1100ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1101ed9e99e6SJeremy L Thompson 1102ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1103ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1104ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1105ed9e99e6SJeremy L Thompson 1106ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1107ed9e99e6SJeremy L Thompson 1108ed9e99e6SJeremy L Thompson @ref Backend 1109ed9e99e6SJeremy L Thompson **/ 11102b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1111437c7c90SJeremy L Thompson CeedInt num_active_bases = 0; 1112437c7c90SJeremy L Thompson 1113437c7c90SJeremy L Thompson // Allocate 11142b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1115ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11162b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1117ed9e99e6SJeremy L Thompson 1118ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1119ed9e99e6SJeremy L Thompson CeedQFunction qf; 1120ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1121ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1122ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11232b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11242b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11252b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1126ed9e99e6SJeremy L Thompson 1127ed9e99e6SJeremy L Thompson // Determine active input basis 1128437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0; 1129437c7c90SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 1130437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 1131ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1132ed9e99e6SJeremy L Thompson CeedVector vec; 11332b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1134ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1135437c7c90SJeremy L Thompson CeedBasis basis_in = NULL; 1136437c7c90SJeremy L Thompson CeedEvalMode eval_mode; 1137352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 11382b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11392b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1140352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1141352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 1142352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp)); 1143437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1144437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_in) index = i; 1145437c7c90SJeremy L Thompson } 1146437c7c90SJeremy L Thompson if (index == -1) { 1147437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 1148437c7c90SJeremy L Thompson index = num_active_bases; 1149437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1150437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1151437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases])); 1152437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1153437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1154437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1155437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases])); 1156437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1157437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1158437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1159437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1160437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1161437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1162437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1163437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1164437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1165437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1166437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1167437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1168437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1169437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1170437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1171437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1172437c7c90SJeremy L Thompson num_active_bases++; 1173437c7c90SJeremy L Thompson } 1174352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1175352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1176352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index])); 1177352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index])); 1178352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1179437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1180437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1181352a5e7cSSebastian Grimberg offset += num_comp; 1182ed9e99e6SJeremy L Thompson } 1183352a5e7cSSebastian Grimberg num_eval_modes_in[index] += q_comp; 1184ed9e99e6SJeremy L Thompson } 1185ed9e99e6SJeremy L Thompson } 1186ed9e99e6SJeremy L Thompson } 1187437c7c90SJeremy L Thompson (*data)->num_eval_modes_in = num_eval_modes_in; 1188437c7c90SJeremy L Thompson (*data)->eval_modes_in = eval_modes_in; 1189437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1190ed9e99e6SJeremy L Thompson 1191ed9e99e6SJeremy L Thompson // Determine active output basis 1192ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 11932b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11942b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1195437c7c90SJeremy L Thompson offset = 0; 1196ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1197ed9e99e6SJeremy L Thompson CeedVector vec; 11982b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1199ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1200437c7c90SJeremy L Thompson CeedBasis basis_out = NULL; 1201ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 1202352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 1203437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 12042b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1205352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_out, &dim)); 1206352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp)); 1207352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp)); 1208437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1209437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_out) index = i; 1210437c7c90SJeremy L Thompson } 1211437c7c90SJeremy L Thompson if (index == -1) { 1212437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 1213437c7c90SJeremy L Thompson 1214437c7c90SJeremy L Thompson index = num_active_bases; 1215437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1216437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1217437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases])); 1218437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1219437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1220437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1221437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases])); 1222437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1223437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1224437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1225437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1226437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1227437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1228437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1229437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1230437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1231437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1232437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1233437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1234437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1235437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1236437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1237437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1238437c7c90SJeremy L Thompson num_active_bases++; 1239437c7c90SJeremy L Thompson } 1240352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1241352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1242352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index])); 1243352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index])); 1244352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1245437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1246437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1247352a5e7cSSebastian Grimberg offset += num_comp; 1248ed9e99e6SJeremy L Thompson } 1249352a5e7cSSebastian Grimberg num_eval_modes_out[index] += q_comp; 1250ed9e99e6SJeremy L Thompson } 1251ed9e99e6SJeremy L Thompson } 1252ed9e99e6SJeremy L Thompson } 1253437c7c90SJeremy L Thompson (*data)->num_output_components = offset; 1254437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1255437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1256437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1257437c7c90SJeremy L Thompson (*data)->num_active_bases = num_active_bases; 1258ed9e99e6SJeremy L Thompson 1259ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1260ed9e99e6SJeremy L Thompson } 1261ed9e99e6SJeremy L Thompson 1262ed9e99e6SJeremy L Thompson /** 1263ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1264ba746a46SJeremy L Thompson 1265ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1266ed9e99e6SJeremy L Thompson 1267ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1268ba746a46SJeremy L Thompson @param[out] num_active_bases Total number of active bases 1269c5d0f995SJed Brown @param[out] num_eval_modes_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1270ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1271c5d0f995SJed Brown @param[out] eval_modes_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1272ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1273c5d0f995SJed Brown @param[out] num_eval_modes_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1274c5d0f995SJed Brown @param[out] eval_modes_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1275437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1276ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1277ba746a46SJeremy L Thompson including contributions of all active bases 1278ed9e99e6SJeremy L Thompson 1279ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1280ed9e99e6SJeremy L Thompson 1281c5d0f995SJed Brown 1282ed9e99e6SJeremy L Thompson @ref Backend 1283ed9e99e6SJeremy L Thompson **/ 1284437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in, 1285437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out, 1286437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) { 1287437c7c90SJeremy L Thompson if (num_active_bases) *num_active_bases = data->num_active_bases; 1288437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1289437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1290437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1291437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1292437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1293437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1294437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1295ed9e99e6SJeremy L Thompson 1296ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1297ed9e99e6SJeremy L Thompson } 1298ed9e99e6SJeremy L Thompson 1299ed9e99e6SJeremy L Thompson /** 1300ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1301ba746a46SJeremy L Thompson 1302ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1303ed9e99e6SJeremy L Thompson 1304ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1305437c7c90SJeremy L Thompson @param[out] num_active_bases Number of active bases, or NULL 1306437c7c90SJeremy L Thompson @param[out] active_bases Pointer to hold active CeedBasis, or NULL 1307437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1308437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1309ed9e99e6SJeremy L Thompson 1310ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1311ed9e99e6SJeremy L Thompson 1312ed9e99e6SJeremy L Thompson @ref Backend 1313ed9e99e6SJeremy L Thompson **/ 1314437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases, 1315437c7c90SJeremy L Thompson const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) { 1316ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1317437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1318437c7c90SJeremy L Thompson CeedInt num_qpts; 1319437c7c90SJeremy L Thompson 1320437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1321437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1322352a5e7cSSebastian Grimberg CeedInt num_nodes; 1323437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1324ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1325ed9e99e6SJeremy L Thompson 1326352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1327352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in)); 1328ed9e99e6SJeremy L Thompson 1329437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1330437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1331ed9e99e6SJeremy L Thompson } 1332ed9e99e6SJeremy L Thompson if (has_eval_none) { 1333352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1334352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1335352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1336ed9e99e6SJeremy L Thompson } 1337ed9e99e6SJeremy L Thompson } 1338ed9e99e6SJeremy L Thompson 1339ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1340352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1341352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 1342352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 1343437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1344437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1345437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1346352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B); 1347352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in)); 1348352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 1349352a5e7cSSebastian Grimberg if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 1350352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 1351352a5e7cSSebastian Grimberg } 1352352a5e7cSSebastian Grimberg eval_mode_in_prev = data->eval_modes_in[b][e_in]; 1353352a5e7cSSebastian Grimberg B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n]; 1354ed9e99e6SJeremy L Thompson } 1355ed9e99e6SJeremy L Thompson } 1356ed9e99e6SJeremy L Thompson } 1357437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1358437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1359437c7c90SJeremy L Thompson } 1360ed9e99e6SJeremy L Thompson } 1361ed9e99e6SJeremy L Thompson 1362437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1363437c7c90SJeremy L Thompson CeedInt num_qpts; 1364437c7c90SJeremy L Thompson 1365437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1366437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1367352a5e7cSSebastian Grimberg CeedInt num_nodes; 1368ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1369437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1370ed9e99e6SJeremy L Thompson 1371352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1372352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out)); 1373ed9e99e6SJeremy L Thompson 1374437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1375437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1376ed9e99e6SJeremy L Thompson } 1377ed9e99e6SJeremy L Thompson if (has_eval_none) { 1378352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1379352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1380352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1381ed9e99e6SJeremy L Thompson } 1382ed9e99e6SJeremy L Thompson } 1383ed9e99e6SJeremy L Thompson 1384ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1385352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1386352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 1387352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 1388437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1389437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1390437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1391352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B); 1392352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out)); 1393352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 1394352a5e7cSSebastian Grimberg if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 1395352a5e7cSSebastian Grimberg else B = &B[(++d_out) * num_qpts * num_nodes]; 1396352a5e7cSSebastian Grimberg } 1397352a5e7cSSebastian Grimberg eval_mode_out_prev = data->eval_modes_out[b][e_out]; 1398352a5e7cSSebastian Grimberg B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n]; 1399ed9e99e6SJeremy L Thompson } 1400ed9e99e6SJeremy L Thompson } 1401ed9e99e6SJeremy L Thompson } 1402437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1403437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1404437c7c90SJeremy L Thompson } 1405ed9e99e6SJeremy L Thompson } 1406ed9e99e6SJeremy L Thompson 1407437c7c90SJeremy L Thompson // Pass out assembled data 1408437c7c90SJeremy L Thompson if (active_bases) *active_bases = data->active_bases; 1409437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1410437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1411437c7c90SJeremy L Thompson 1412437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1413437c7c90SJeremy L Thompson } 1414437c7c90SJeremy L Thompson 1415437c7c90SJeremy L Thompson /** 1416ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1417ba746a46SJeremy L Thompson 1418ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1419437c7c90SJeremy L Thompson 1420437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1421437c7c90SJeremy L Thompson @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL 1422437c7c90SJeremy L Thompson @param[out] active_elem_rstrs Pointer to hold active CeedElemRestrictions, or NULL 1423437c7c90SJeremy L Thompson 1424437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1425437c7c90SJeremy L Thompson 1426437c7c90SJeremy L Thompson @ref Backend 1427437c7c90SJeremy L Thompson **/ 1428437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs, 1429437c7c90SJeremy L Thompson CeedElemRestriction **active_elem_rstrs) { 1430437c7c90SJeremy L Thompson if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases; 1431437c7c90SJeremy L Thompson if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs; 1432ed9e99e6SJeremy L Thompson 1433ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1434ed9e99e6SJeremy L Thompson } 1435ed9e99e6SJeremy L Thompson 1436ed9e99e6SJeremy L Thompson /** 1437ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1438ed9e99e6SJeremy L Thompson 1439ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1440ed9e99e6SJeremy L Thompson 1441ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1442ed9e99e6SJeremy L Thompson 1443ed9e99e6SJeremy L Thompson @ref Backend 1444ed9e99e6SJeremy L Thompson **/ 1445ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1446ad6481ceSJeremy L Thompson if (!*data) { 1447ad6481ceSJeremy L Thompson *data = NULL; 1448ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1449ad6481ceSJeremy L Thompson } 14502b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1451437c7c90SJeremy L Thompson for (CeedInt b = 0; b < (*data)->num_active_bases; b++) { 1452437c7c90SJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->active_bases[b])); 1453437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b])); 1454437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1455437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1456437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1457437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1458437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1459437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1460437c7c90SJeremy L Thompson } 1461437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_bases)); 1462437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_elem_rstrs)); 1463437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1464437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1465437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1466437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1467437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1468437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1469437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1470437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1471ed9e99e6SJeremy L Thompson 14722b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1473ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1474ed9e99e6SJeremy L Thompson } 1475ed9e99e6SJeremy L Thompson 1476480fae85SJeremy L Thompson /// @} 1477480fae85SJeremy L Thompson 1478480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1479eaf62fffSJeremy L Thompson /// CeedOperator Public API 1480eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1481eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1482eaf62fffSJeremy L Thompson /// @{ 1483eaf62fffSJeremy L Thompson 1484eaf62fffSJeremy L Thompson /** 1485eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1486eaf62fffSJeremy L Thompson 1487ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1488859c15bbSJames Wright The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices 1489859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element. 1490859c15bbSJames Wright 14919fd66db6SSebastian Grimberg Inputs and outputs are in the order provided by the user when adding CeedOperator fields. 14929fd66db6SSebastian Grimberg For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction 14939fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v]. 1494eaf62fffSJeremy L Thompson 1495ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1496f04ea552SJeremy L Thompson 1497ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1498ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1499ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1500ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1501eaf62fffSJeremy L Thompson 1502eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1503eaf62fffSJeremy L Thompson 1504eaf62fffSJeremy L Thompson @ref User 1505eaf62fffSJeremy L Thompson **/ 15062b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15072b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1508eaf62fffSJeremy L Thompson 1509eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1510d04bbc78SJeremy L Thompson // Backend version 15112b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1512eaf62fffSJeremy L Thompson } else { 1513d04bbc78SJeremy L Thompson // Operator fallback 1514d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1515d04bbc78SJeremy L Thompson 15162b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15176574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 15186574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 151970a7ffb3SJeremy L Thompson } 1520eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1521eaf62fffSJeremy L Thompson } 152270a7ffb3SJeremy L Thompson 152370a7ffb3SJeremy L Thompson /** 1524ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 15254385fb7fSSebastian Grimberg 1526ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1527ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1528ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 152970a7ffb3SJeremy L Thompson 1530c5f45aeaSJeremy L Thompson Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers. 1531c5f45aeaSJeremy L Thompson These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object. 1532c5f45aeaSJeremy L Thompson 1533ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1534ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1535ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1536ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 153770a7ffb3SJeremy L Thompson 153870a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 153970a7ffb3SJeremy L Thompson 154070a7ffb3SJeremy L Thompson @ref User 154170a7ffb3SJeremy L Thompson **/ 15422b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1543*b05f7e9fSJeremy L Thompson int (*LinearAssembleQFunctionUpdate)(CeedOperator, CeedVector, CeedElemRestriction, CeedRequest *) = NULL; 1544*b05f7e9fSJeremy L Thompson CeedOperator op_assemble = NULL; 1545*b05f7e9fSJeremy L Thompson 15462b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 154770a7ffb3SJeremy L Thompson 1548*b05f7e9fSJeremy L Thompson // Determine if fallback parent or operator has implementation 1549*b05f7e9fSJeremy L Thompson if (op->op_fallback_parent && op->op_fallback_parent->LinearAssembleQFunctionUpdate) { 1550*b05f7e9fSJeremy L Thompson // -- Backend version for op fallback parent is faster, if it exists 1551*b05f7e9fSJeremy L Thompson LinearAssembleQFunctionUpdate = op->op_fallback_parent->LinearAssembleQFunctionUpdate; 1552*b05f7e9fSJeremy L Thompson op_assemble = op->op_fallback_parent; 1553*b05f7e9fSJeremy L Thompson } else if (op->LinearAssembleQFunctionUpdate) { 1554*b05f7e9fSJeremy L Thompson // -- Backend version for op 1555*b05f7e9fSJeremy L Thompson LinearAssembleQFunctionUpdate = op->LinearAssembleQFunctionUpdate; 1556*b05f7e9fSJeremy L Thompson op_assemble = op; 1557*b05f7e9fSJeremy L Thompson } 1558*b05f7e9fSJeremy L Thompson 1559*b05f7e9fSJeremy L Thompson // Assemble QFunction 1560*b05f7e9fSJeremy L Thompson if (LinearAssembleQFunctionUpdate) { 1561*b05f7e9fSJeremy L Thompson // Backend or fallback parent version 1562480fae85SJeremy L Thompson bool qf_assembled_is_setup; 15632efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 15642efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1565480fae85SJeremy L Thompson 15662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1567480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1568d04bbc78SJeremy L Thompson bool update_needed; 1569d04bbc78SJeremy L Thompson 15702b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 15712b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 1572*b05f7e9fSJeremy L Thompson if (update_needed) CeedCall(LinearAssembleQFunctionUpdate(op_assemble, assembled_vec, assembled_rstr, request)); 157370a7ffb3SJeremy L Thompson } else { 1574*b05f7e9fSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunction(op_assemble, &assembled_vec, &assembled_rstr, request)); 15752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 157670a7ffb3SJeremy L Thompson } 15772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 15782efa2d85SJeremy L Thompson 1579d04bbc78SJeremy L Thompson // Copy reference from internally held copy 15802b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 15812b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 1582c5f45aeaSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 15832b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 158470a7ffb3SJeremy L Thompson } else { 1585d04bbc78SJeremy L Thompson // Operator fallback 1586d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1587d04bbc78SJeremy L Thompson 15882b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15896574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 15906574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 159170a7ffb3SJeremy L Thompson } 159270a7ffb3SJeremy L Thompson 159370a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1594eaf62fffSJeremy L Thompson } 1595eaf62fffSJeremy L Thompson 1596eaf62fffSJeremy L Thompson /** 1597eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1598eaf62fffSJeremy L Thompson 1599eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1600eaf62fffSJeremy L Thompson 1601ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1602eaf62fffSJeremy L Thompson 1603ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1604f04ea552SJeremy L Thompson 1605ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1606eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1607ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1608eaf62fffSJeremy L Thompson 1609eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1610eaf62fffSJeremy L Thompson 1611eaf62fffSJeremy L Thompson @ref User 1612eaf62fffSJeremy L Thompson **/ 16132b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1614f3d47e36SJeremy L Thompson bool is_composite; 16152b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1616f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1617eaf62fffSJeremy L Thompson 1618c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16192b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16206574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1621c9366a6bSJeremy L Thompson 1622f3d47e36SJeremy L Thompson // Early exit for empty operator 1623f3d47e36SJeremy L Thompson if (!is_composite) { 1624f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1625f3d47e36SJeremy L Thompson 1626f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1627f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1628f3d47e36SJeremy L Thompson } 1629f3d47e36SJeremy L Thompson 1630eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1631d04bbc78SJeremy L Thompson // Backend version 16322b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1633eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1634eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1635d04bbc78SJeremy L Thompson // Backend version with zeroing first 16362b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16372b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1638eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1639eaf62fffSJeremy L Thompson } else { 1640d04bbc78SJeremy L Thompson // Operator fallback 1641d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1642d04bbc78SJeremy L Thompson 16432b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1644d04bbc78SJeremy L Thompson if (op_fallback) { 16452b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1646eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1647eaf62fffSJeremy L Thompson } 1648eaf62fffSJeremy L Thompson } 1649eaf62fffSJeremy L Thompson // Default interface implementation 16502b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16512b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1652d04bbc78SJeremy L Thompson 1653eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1654eaf62fffSJeremy L Thompson } 1655eaf62fffSJeremy L Thompson 1656eaf62fffSJeremy L Thompson /** 1657eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1658eaf62fffSJeremy L Thompson 1659eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1660eaf62fffSJeremy L Thompson 1661ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1662eaf62fffSJeremy L Thompson 1663ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1664f04ea552SJeremy L Thompson 1665ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1666eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1667ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1668eaf62fffSJeremy L Thompson 1669eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1670eaf62fffSJeremy L Thompson 1671eaf62fffSJeremy L Thompson @ref User 1672eaf62fffSJeremy L Thompson **/ 16732b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1674f3d47e36SJeremy L Thompson bool is_composite; 16752b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1676f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1677eaf62fffSJeremy L Thompson 1678c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16792b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16806574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1681c9366a6bSJeremy L Thompson 1682f3d47e36SJeremy L Thompson // Early exit for empty operator 1683f3d47e36SJeremy L Thompson if (!is_composite) { 1684f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1685f3d47e36SJeremy L Thompson 1686f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1687f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1688f3d47e36SJeremy L Thompson } 1689f3d47e36SJeremy L Thompson 1690eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1691d04bbc78SJeremy L Thompson // Backend version 16922b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1693eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1694eaf62fffSJeremy L Thompson } else { 1695d04bbc78SJeremy L Thompson // Operator fallback 1696d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1697d04bbc78SJeremy L Thompson 16982b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1699d04bbc78SJeremy L Thompson if (op_fallback) { 17002b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1701eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1702eaf62fffSJeremy L Thompson } 1703eaf62fffSJeremy L Thompson } 1704eaf62fffSJeremy L Thompson // Default interface implementation 1705eaf62fffSJeremy L Thompson if (is_composite) { 17062b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1707eaf62fffSJeremy L Thompson } else { 17082b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1709eaf62fffSJeremy L Thompson } 1710d04bbc78SJeremy L Thompson 1711d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1712eaf62fffSJeremy L Thompson } 1713eaf62fffSJeremy L Thompson 1714eaf62fffSJeremy L Thompson /** 1715eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1716eaf62fffSJeremy L Thompson 1717ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1718eaf62fffSJeremy L Thompson 1719ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1720eaf62fffSJeremy L Thompson 1721ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1722f04ea552SJeremy L Thompson 1723ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1724ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1725ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1726ea61e9acSJeremy L Thompson component in]. 1727ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1728eaf62fffSJeremy L Thompson 1729eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1730eaf62fffSJeremy L Thompson 1731eaf62fffSJeremy L Thompson @ref User 1732eaf62fffSJeremy L Thompson **/ 17332b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1734f3d47e36SJeremy L Thompson bool is_composite; 17352b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1736f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1737eaf62fffSJeremy L Thompson 1738c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17392b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17406574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1741c9366a6bSJeremy L Thompson 1742f3d47e36SJeremy L Thompson // Early exit for empty operator 1743f3d47e36SJeremy L Thompson if (!is_composite) { 1744f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1745f3d47e36SJeremy L Thompson 1746f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1747f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1748f3d47e36SJeremy L Thompson } 1749f3d47e36SJeremy L Thompson 1750eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1751d04bbc78SJeremy L Thompson // Backend version 17522b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1753eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1754eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1755d04bbc78SJeremy L Thompson // Backend version with zeroing first 17562b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17572b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1758eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1759eaf62fffSJeremy L Thompson } else { 1760d04bbc78SJeremy L Thompson // Operator fallback 1761d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1762d04bbc78SJeremy L Thompson 17632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1764d04bbc78SJeremy L Thompson if (op_fallback) { 17652b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1766eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1767eaf62fffSJeremy L Thompson } 1768eaf62fffSJeremy L Thompson } 1769eaf62fffSJeremy L Thompson // Default interface implementation 17702b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17712b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1772d04bbc78SJeremy L Thompson 1773eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1774eaf62fffSJeremy L Thompson } 1775eaf62fffSJeremy L Thompson 1776eaf62fffSJeremy L Thompson /** 1777eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1778eaf62fffSJeremy L Thompson 1779ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1780eaf62fffSJeremy L Thompson 1781ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1782eaf62fffSJeremy L Thompson 1783ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1784f04ea552SJeremy L Thompson 1785ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1786ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1787ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1788ea61e9acSJeremy L Thompson component in]. 1789ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1790eaf62fffSJeremy L Thompson 1791eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1792eaf62fffSJeremy L Thompson 1793eaf62fffSJeremy L Thompson @ref User 1794eaf62fffSJeremy L Thompson **/ 17952b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1796f3d47e36SJeremy L Thompson bool is_composite; 17972b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1798f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1799eaf62fffSJeremy L Thompson 1800c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 18012b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 18026574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1803c9366a6bSJeremy L Thompson 1804f3d47e36SJeremy L Thompson // Early exit for empty operator 1805f3d47e36SJeremy L Thompson if (!is_composite) { 1806f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1807f3d47e36SJeremy L Thompson 1808f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1809f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1810f3d47e36SJeremy L Thompson } 1811f3d47e36SJeremy L Thompson 1812eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1813d04bbc78SJeremy L Thompson // Backend version 18142b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1815eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1816eaf62fffSJeremy L Thompson } else { 1817d04bbc78SJeremy L Thompson // Operator fallback 1818d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1819d04bbc78SJeremy L Thompson 18202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1821d04bbc78SJeremy L Thompson if (op_fallback) { 18222b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1823eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1824eaf62fffSJeremy L Thompson } 1825eaf62fffSJeremy L Thompson } 1826ea61e9acSJeremy L Thompson // Default interface implementation 1827eaf62fffSJeremy L Thompson if (is_composite) { 18282b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1829eaf62fffSJeremy L Thompson } else { 18302b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1831eaf62fffSJeremy L Thompson } 1832d04bbc78SJeremy L Thompson 1833d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1834eaf62fffSJeremy L Thompson } 1835eaf62fffSJeremy L Thompson 1836eaf62fffSJeremy L Thompson /** 1837eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1838eaf62fffSJeremy L Thompson 1839ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1840eaf62fffSJeremy L Thompson 1841ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 18429fd66db6SSebastian Grimberg matrix in entry (i, j). 18439fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 18449fd66db6SSebastian Grimberg This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1845eaf62fffSJeremy L Thompson 1846eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1847eaf62fffSJeremy L Thompson 1848ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1849f04ea552SJeremy L Thompson 1850eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1851eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1852eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1853eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1854eaf62fffSJeremy L Thompson 1855eaf62fffSJeremy L Thompson @ref User 1856eaf62fffSJeremy L Thompson **/ 18572b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1858b94338b9SJed Brown CeedInt num_suboperators; 1859b94338b9SJed Brown CeedSize single_entries; 1860eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1861eaf62fffSJeremy L Thompson bool is_composite; 18622b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1863f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1864eaf62fffSJeremy L Thompson 1865eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1866d04bbc78SJeremy L Thompson // Backend version 18672b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1868eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1869eaf62fffSJeremy L Thompson } else { 1870d04bbc78SJeremy L Thompson // Operator fallback 1871d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1872d04bbc78SJeremy L Thompson 18732b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1874d04bbc78SJeremy L Thompson if (op_fallback) { 18752b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1876eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1877eaf62fffSJeremy L Thompson } 1878eaf62fffSJeremy L Thompson } 1879eaf62fffSJeremy L Thompson 1880eaf62fffSJeremy L Thompson // Default interface implementation 1881eaf62fffSJeremy L Thompson 1882eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1883eaf62fffSJeremy L Thompson *num_entries = 0; 1884eaf62fffSJeremy L Thompson if (is_composite) { 1885c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1886c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 188792ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18882b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1889eaf62fffSJeremy L Thompson *num_entries += single_entries; 1890eaf62fffSJeremy L Thompson } 1891eaf62fffSJeremy L Thompson } else { 18922b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1893eaf62fffSJeremy L Thompson *num_entries += single_entries; 1894eaf62fffSJeremy L Thompson } 18952b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 18962b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1897eaf62fffSJeremy L Thompson 1898eaf62fffSJeremy L Thompson // assemble nonzero locations 1899eaf62fffSJeremy L Thompson CeedInt offset = 0; 1900eaf62fffSJeremy L Thompson if (is_composite) { 1901c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1902c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 190392ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 19042b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 19052b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1906eaf62fffSJeremy L Thompson offset += single_entries; 1907eaf62fffSJeremy L Thompson } 1908eaf62fffSJeremy L Thompson } else { 19092b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1910eaf62fffSJeremy L Thompson } 1911eaf62fffSJeremy L Thompson 1912eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1913eaf62fffSJeremy L Thompson } 1914eaf62fffSJeremy L Thompson 1915eaf62fffSJeremy L Thompson /** 1916eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1917eaf62fffSJeremy L Thompson 1918ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1919eaf62fffSJeremy L Thompson 1920ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 19219fd66db6SSebastian Grimberg matrix in entry (i, j). 19229fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 19239fd66db6SSebastian Grimberg This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1924eaf62fffSJeremy L Thompson 1925eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1926eaf62fffSJeremy L Thompson 1927ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1928f04ea552SJeremy L Thompson 1929eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1930eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1931eaf62fffSJeremy L Thompson 1932eaf62fffSJeremy L Thompson @ref User 1933eaf62fffSJeremy L Thompson **/ 1934eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1935b94338b9SJed Brown CeedInt num_suboperators; 1936b94338b9SJed Brown CeedSize single_entries = 0; 1937eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1938f3d47e36SJeremy L Thompson bool is_composite; 19392b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1940f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1941f3d47e36SJeremy L Thompson 1942f3d47e36SJeremy L Thompson // Early exit for empty operator 1943f3d47e36SJeremy L Thompson if (!is_composite) { 1944f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1945f3d47e36SJeremy L Thompson 1946f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1947f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1948f3d47e36SJeremy L Thompson } 1949eaf62fffSJeremy L Thompson 1950eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1951d04bbc78SJeremy L Thompson // Backend version 19522b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1953eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1954eaf62fffSJeremy L Thompson } else { 1955d04bbc78SJeremy L Thompson // Operator fallback 1956d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1957d04bbc78SJeremy L Thompson 19582b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1959d04bbc78SJeremy L Thompson if (op_fallback) { 19602b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1961eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1962eaf62fffSJeremy L Thompson } 1963eaf62fffSJeremy L Thompson } 1964eaf62fffSJeremy L Thompson 1965eaf62fffSJeremy L Thompson // Default interface implementation 1966eaf62fffSJeremy L Thompson CeedInt offset = 0; 196728ec399dSJeremy L Thompson CeedCall(CeedVectorSetValue(values, 0.0)); 1968eaf62fffSJeremy L Thompson if (is_composite) { 1969c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1970c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1971cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 19722b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 19732b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1974eaf62fffSJeremy L Thompson offset += single_entries; 1975eaf62fffSJeremy L Thompson } 1976eaf62fffSJeremy L Thompson } else { 19772b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1978eaf62fffSJeremy L Thompson } 1979eaf62fffSJeremy L Thompson 1980eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1981eaf62fffSJeremy L Thompson } 1982eaf62fffSJeremy L Thompson 1983eaf62fffSJeremy L Thompson /** 198475f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 198575f0d5a4SJeremy L Thompson 198675f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 198775f0d5a4SJeremy L Thompson 198875f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 198975f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 199075f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 199175f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 199275f0d5a4SJeremy L Thompson 199375f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 199475f0d5a4SJeremy L Thompson 199575f0d5a4SJeremy L Thompson @ref User 199675f0d5a4SJeremy L Thompson **/ 199775f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 199875f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 199975f0d5a4SJeremy L Thompson 200075f0d5a4SJeremy L Thompson Ceed ceed; 2001b275c451SJeremy L Thompson CeedInt num_suboperators; 200275f0d5a4SJeremy L Thompson CeedSize l_vec_len; 200375f0d5a4SJeremy L Thompson CeedScalar *mult_array; 200475f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 2005437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr; 2006b275c451SJeremy L Thompson CeedOperator *sub_operators; 200775f0d5a4SJeremy L Thompson 200875f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 200975f0d5a4SJeremy L Thompson 201075f0d5a4SJeremy L Thompson // Zero mult vector 201175f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 201275f0d5a4SJeremy L Thompson 201375f0d5a4SJeremy L Thompson // Get suboperators 2014b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2015b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 2016b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 201775f0d5a4SJeremy L Thompson 201875f0d5a4SJeremy L Thompson // Work vector 201975f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 202075f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 202175f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 202275f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 202375f0d5a4SJeremy L Thompson 202475f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 2025b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 202675f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 202775f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 202875f0d5a4SJeremy L Thompson 202975f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 203075f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 203175f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 203275f0d5a4SJeremy L Thompson } 203375f0d5a4SJeremy L Thompson 203475f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2035437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 2036437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 203775f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 2038437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 2039437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 204075f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 204175f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 204275f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 204375f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 204475f0d5a4SJeremy L Thompson } 204575f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 204675f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 204775f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 204875f0d5a4SJeremy L Thompson } 204975f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2050811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 205175f0d5a4SJeremy L Thompson 205275f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 205375f0d5a4SJeremy L Thompson } 205475f0d5a4SJeremy L Thompson 205575f0d5a4SJeremy L Thompson /** 2056ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2057ea61e9acSJeremy L Thompson grid interpolation 2058eaf62fffSJeremy L Thompson 205958e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2060f04ea552SJeremy L Thompson 2061eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 206285bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2063eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2064eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2065eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 206685bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 206785bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2068eaf62fffSJeremy L Thompson 2069eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2070eaf62fffSJeremy L Thompson 2071eaf62fffSJeremy L Thompson @ref User 2072eaf62fffSJeremy L Thompson **/ 20732b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20742b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 20752b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2076eaf62fffSJeremy L Thompson 207783d6adf3SZach Atkins // Build prolongation matrix, if required 207883d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 207983d6adf3SZach Atkins if (op_prolong || op_restrict) { 208083d6adf3SZach Atkins CeedBasis basis_fine; 20812b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 20822b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 208383d6adf3SZach Atkins } 2084eaf62fffSJeremy L Thompson 2085f113e5dcSJeremy L Thompson // Core code 20862b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2087f113e5dcSJeremy L Thompson 2088eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2089eaf62fffSJeremy L Thompson } 2090eaf62fffSJeremy L Thompson 2091eaf62fffSJeremy L Thompson /** 2092ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2093eaf62fffSJeremy L Thompson 209458e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2095f04ea552SJeremy L Thompson 2096eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 209785bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2098eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2099eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 210085bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2101eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 210285bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 210385bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2104eaf62fffSJeremy L Thompson 2105eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2106eaf62fffSJeremy L Thompson 2107eaf62fffSJeremy L Thompson @ref User 2108eaf62fffSJeremy L Thompson **/ 21092b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21102b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 21112b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 21122b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2113eaf62fffSJeremy L Thompson Ceed ceed; 21142b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2115eaf62fffSJeremy L Thompson 2116eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2117eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21182b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2119eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21202b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21212b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21226574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2123eaf62fffSJeremy L Thompson 212483d6adf3SZach Atkins // Create coarse to fine basis, if required 212583d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 212683d6adf3SZach Atkins if (op_prolong || op_restrict) { 212783d6adf3SZach Atkins // Check if interpolation matrix is provided 21286574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21296574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2130eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 21312b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21322b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21332b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 21342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 21352b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2136eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21372b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 21382b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 21392b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 21402b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21412b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21422b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21432b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 214483d6adf3SZach Atkins } 2145eaf62fffSJeremy L Thompson 2146eaf62fffSJeremy L Thompson // Core code 21472b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2148eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2149eaf62fffSJeremy L Thompson } 2150eaf62fffSJeremy L Thompson 2151eaf62fffSJeremy L Thompson /** 2152ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2153eaf62fffSJeremy L Thompson 215458e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2155f04ea552SJeremy L Thompson 2156eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 215785bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2158eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2159eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 216085bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2161eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 216285bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 216385bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2164eaf62fffSJeremy L Thompson 2165eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2166eaf62fffSJeremy L Thompson 2167eaf62fffSJeremy L Thompson @ref User 2168eaf62fffSJeremy L Thompson **/ 21692b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21702b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2171eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 21722b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2173eaf62fffSJeremy L Thompson Ceed ceed; 21742b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2175eaf62fffSJeremy L Thompson 2176eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2177eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21782b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2179eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21802b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21812b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21826574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2183eaf62fffSJeremy L Thompson 2184eaf62fffSJeremy L Thompson // Coarse to fine basis 218583d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 218683d6adf3SZach Atkins if (op_prolong || op_restrict) { 218783d6adf3SZach Atkins // Check if interpolation matrix is provided 21886574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21896574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2190eaf62fffSJeremy L Thompson CeedElemTopology topo; 21912b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2192eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 21932b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21942b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21952b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 21962b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2197eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21982b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 21992b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 22002b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 22012b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 22022b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 22032b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 22042b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 220583d6adf3SZach Atkins } 2206eaf62fffSJeremy L Thompson 2207eaf62fffSJeremy L Thompson // Core code 22082b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2209eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2210eaf62fffSJeremy L Thompson } 2211eaf62fffSJeremy L Thompson 2212eaf62fffSJeremy L Thompson /** 2213ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2214eaf62fffSJeremy L Thompson 2215ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2216859c15bbSJames Wright This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$. 2217859c15bbSJames Wright The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T 22189fd66db6SSebastian Grimberg \hat S V\f$. 22199fd66db6SSebastian Grimberg The CeedOperator must be linear and non-composite. 22209fd66db6SSebastian Grimberg The associated CeedQFunction must therefore also be linear. 2221eaf62fffSJeremy L Thompson 2222ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2223f04ea552SJeremy L Thompson 2224ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2225ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2226ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2227eaf62fffSJeremy L Thompson 2228eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2229eaf62fffSJeremy L Thompson 2230480fae85SJeremy L Thompson @ref User 2231eaf62fffSJeremy L Thompson **/ 22322b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 22332b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2234eaf62fffSJeremy L Thompson 2235eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2236d04bbc78SJeremy L Thompson // Backend version 22372b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2238eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2239eaf62fffSJeremy L Thompson } else { 2240d04bbc78SJeremy L Thompson // Operator fallback 2241d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2242d04bbc78SJeremy L Thompson 22432b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2244d04bbc78SJeremy L Thompson if (op_fallback) { 22452b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2246eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2247eaf62fffSJeremy L Thompson } 2248eaf62fffSJeremy L Thompson } 2249eaf62fffSJeremy L Thompson 2250d04bbc78SJeremy L Thompson // Default interface implementation 2251eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 22522b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 22532b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2254eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2255eaf62fffSJeremy L Thompson CeedQFunction qf; 22562b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2257eaf62fffSJeremy L Thompson 2258eaf62fffSJeremy L Thompson // Determine active input basis 2259eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2260eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2261eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2262eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2263eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2264eaf62fffSJeremy L Thompson CeedInt num_input_fields; 22652b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 22662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2267eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2268eaf62fffSJeremy L Thompson CeedVector vec; 22692b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2270eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2271eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 22722b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2273eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2274eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 22752b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 22762b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2277eaf62fffSJeremy L Thompson } 2278eaf62fffSJeremy L Thompson } 22796574a04fSJeremy L Thompson CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set"); 2280e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2281352a5e7cSSebastian Grimberg CeedInt P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1; 22822b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 2283352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(basis, &num_nodes)); 22842b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 22852b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 22862b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 22872b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 22882b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 22892b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2290eaf62fffSJeremy L Thompson 2291eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 22926574a04fSJeremy L Thompson bool is_tensor_basis; 22936574a04fSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis)); 22946574a04fSJeremy L Thompson CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2295eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 22962b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 22972b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 22982b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 22992b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 23002b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2301eaf62fffSJeremy L Thompson // -- Build matrices 2302eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 23032b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 23042b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 23052b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 23062b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2307eaf62fffSJeremy L Thompson 2308eaf62fffSJeremy L Thompson // -- Diagonalize 23092b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 23102b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 23112b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 23122b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 23132b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 23142b730f8bSJeremy L Thompson } 23152b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2316eaf62fffSJeremy L Thompson 2317eaf62fffSJeremy L Thompson // Assemble QFunction 2318c5f45aeaSJeremy L Thompson CeedVector assembled = NULL; 2319c5f45aeaSJeremy L Thompson CeedElemRestriction rstr_qf = NULL; 23202b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2321eaf62fffSJeremy L Thompson CeedInt layout[3]; 23222b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 23232b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2324eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 23252b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2326eaf62fffSJeremy L Thompson 2327eaf62fffSJeremy L Thompson // Calculate element averages 2328eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2329eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2330eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2331eaf62fffSJeremy L Thompson CeedVector q_weight; 23322b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 23332b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 23342b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 23352b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 23362b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2337eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2338eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2339eaf62fffSJeremy L Thompson CeedInt count = 0; 23402b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 23412b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 23422b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 23432b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2344eaf62fffSJeremy L Thompson count++; 2345eaf62fffSJeremy L Thompson } 23462b730f8bSJeremy L Thompson } 23472b730f8bSJeremy L Thompson } 2348eaf62fffSJeremy L Thompson if (count) { 2349eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2350eaf62fffSJeremy L Thompson } else { 2351eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2352eaf62fffSJeremy L Thompson } 2353eaf62fffSJeremy L Thompson } 23542b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 23552b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 23562b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 23572b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2358eaf62fffSJeremy L Thompson 2359eaf62fffSJeremy L Thompson // Build FDM diagonal 2360eaf62fffSJeremy L Thompson CeedVector q_data; 2361eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 2362352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal)); 2363352a5e7cSSebastian Grimberg const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON; 23642b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2365352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 2366352a5e7cSSebastian Grimberg if (interp) fdm_diagonal[c * num_nodes + n] = 1.0; 23672b730f8bSJeremy L Thompson if (grad) { 2368eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2369eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2370352a5e7cSSebastian Grimberg fdm_diagonal[c * num_nodes + n] += lambda[i]; 2371eaf62fffSJeremy L Thompson } 2372eaf62fffSJeremy L Thompson } 2373352a5e7cSSebastian Grimberg if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound; 23742b730f8bSJeremy L Thompson } 23752b730f8bSJeremy L Thompson } 2376352a5e7cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data)); 23772b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 23782b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 23792b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 23802b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2381352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]); 23822b730f8bSJeremy L Thompson } 23832b730f8bSJeremy L Thompson } 23842b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 23852b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 23862b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2387eaf62fffSJeremy L Thompson 2388eaf62fffSJeremy L Thompson // Setup FDM operator 2389eaf62fffSJeremy L Thompson // -- Basis 2390eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2391eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 23922b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 23932b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 23942b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 23952b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 23962b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 23972b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 23982b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 23992b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 24002b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2401eaf62fffSJeremy L Thompson 2402eaf62fffSJeremy L Thompson // -- Restriction 2403eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2404352a5e7cSSebastian Grimberg CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp}; 2405352a5e7cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i)); 2406eaf62fffSJeremy L Thompson // -- QFunction 2407eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 24082b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 24092b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 24102b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 24112b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 24122b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2413eaf62fffSJeremy L Thompson // -- QFunction context 2414eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 24152b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2416eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2417eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 24182b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 24192b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 24202b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 24212b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2422eaf62fffSJeremy L Thompson // -- Operator 24232b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 24242b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 24252b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 24262b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2427eaf62fffSJeremy L Thompson 2428eaf62fffSJeremy L Thompson // Cleanup 24292b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 24302b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 24312b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 24322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2433eaf62fffSJeremy L Thompson 2434eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2435eaf62fffSJeremy L Thompson } 2436eaf62fffSJeremy L Thompson 2437eaf62fffSJeremy L Thompson /// @} 2438