13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 82b730f8bSJeremy L Thompson #include <ceed-impl.h> 949aac155SJeremy L Thompson #include <ceed.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 11c85e8640SSebastian Grimberg #include <assert.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 441862681bSJeremy Luke Thompson char *source_path_with_name = NULL; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 119437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 123437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127*febe2972SJeremy L Thompson if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 1289e77b9c8SJeremy L Thompson // Cleanup 1292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 132805fe78eSJeremy L Thompson } 1332b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1342b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 135805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 136eaf62fffSJeremy L Thompson 137eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 138eaf62fffSJeremy L Thompson } 139eaf62fffSJeremy L Thompson 140eaf62fffSJeremy L Thompson /** 141ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 142d04bbc78SJeremy L Thompson 143d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 144d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 145d04bbc78SJeremy L Thompson 146d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 147d04bbc78SJeremy L Thompson 148d04bbc78SJeremy L Thompson @ref Developer 149d04bbc78SJeremy L Thompson **/ 150d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 151d04bbc78SJeremy L Thompson // Create if needed 152d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1532b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 154d04bbc78SJeremy L Thompson } 155d04bbc78SJeremy L Thompson if (op->op_fallback) { 156d04bbc78SJeremy L Thompson bool is_debug; 157d04bbc78SJeremy L Thompson 1582b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 159d04bbc78SJeremy L Thompson if (is_debug) { 160b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 161d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 162d04bbc78SJeremy L Thompson 163b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 164b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 165b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1662b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 167d04bbc78SJeremy L Thompson 16823d4529eSJeremy L Thompson CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n"); 169b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1702b730f8bSJeremy L Thompson op->op_fallback); 171d04bbc78SJeremy L Thompson } 172d04bbc78SJeremy L Thompson } 173d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 174d04bbc78SJeremy L Thompson 175d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 176d04bbc78SJeremy L Thompson } 177d04bbc78SJeremy L Thompson 178d04bbc78SJeremy L Thompson /** 179eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 180eaf62fffSJeremy L Thompson 181352a5e7cSSebastian Grimberg @param[in] basis CeedBasis from which to get the basis matrix 182eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 183eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 184eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 185eaf62fffSJeremy L Thompson 186eaf62fffSJeremy L Thompson @ref Developer 187eaf62fffSJeremy L Thompson **/ 188352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) { 189eaf62fffSJeremy L Thompson switch (eval_mode) { 190eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 191eaf62fffSJeremy L Thompson *basis_ptr = identity; 192eaf62fffSJeremy L Thompson break; 193eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 194352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetInterp(basis, basis_ptr)); 195eaf62fffSJeremy L Thompson break; 196eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 197352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetGrad(basis, basis_ptr)); 198352a5e7cSSebastian Grimberg break; 199352a5e7cSSebastian Grimberg case CEED_EVAL_DIV: 200352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDiv(basis, basis_ptr)); 201352a5e7cSSebastian Grimberg break; 202352a5e7cSSebastian Grimberg case CEED_EVAL_CURL: 203352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetCurl(basis, basis_ptr)); 204eaf62fffSJeremy L Thompson break; 205eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 206eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 207eaf62fffSJeremy L Thompson } 208ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 209352a5e7cSSebastian Grimberg 210352a5e7cSSebastian Grimberg return CEED_ERROR_SUCCESS; 211eaf62fffSJeremy L Thompson } 212eaf62fffSJeremy L Thompson 213eaf62fffSJeremy L Thompson /** 214eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 215eaf62fffSJeremy L Thompson 216eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 217ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 218eaf62fffSJeremy L Thompson 219eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 220eaf62fffSJeremy L Thompson 221eaf62fffSJeremy L Thompson @ref Developer 222eaf62fffSJeremy L Thompson **/ 2232b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 224eaf62fffSJeremy L Thompson Ceed ceed; 2252b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 226eaf62fffSJeremy L Thompson const CeedInt *offsets; 2272b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 228eaf62fffSJeremy L Thompson 229eaf62fffSJeremy L Thompson // Expand offsets 2307b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2317b63f5c6SJed Brown CeedSize l_size; 2322b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2332b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2352b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2362b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 237eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2382b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2392b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 240eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 241eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 242eaf62fffSJeremy L Thompson } 243eaf62fffSJeremy L Thompson 244eaf62fffSJeremy L Thompson // Create new restriction 2452b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2462b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 247eaf62fffSJeremy L Thompson 248eaf62fffSJeremy L Thompson // Cleanup 2492b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 250eaf62fffSJeremy L Thompson 251eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 252eaf62fffSJeremy L Thompson } 253eaf62fffSJeremy L Thompson 254eaf62fffSJeremy L Thompson /** 255eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 256eaf62fffSJeremy L Thompson 257eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 258ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 259eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 260eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 261eaf62fffSJeremy L Thompson 262eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 263eaf62fffSJeremy L Thompson 264eaf62fffSJeremy L Thompson @ref Developer 265eaf62fffSJeremy L Thompson **/ 2662b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 267eaf62fffSJeremy L Thompson Ceed ceed; 2682b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 269eaf62fffSJeremy L Thompson 270eaf62fffSJeremy L Thompson // Assemble QFunction 271eaf62fffSJeremy L Thompson CeedQFunction qf; 272437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 273c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 274c5f45aeaSJeremy L Thompson CeedElemRestriction assembled_elem_rstr = NULL; 275437c7c90SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 276eaf62fffSJeremy L Thompson CeedInt layout[3]; 277437c7c90SJeremy L Thompson 278437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 279437c7c90SJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 280437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 281437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout)); 282437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 283437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 284eaf62fffSJeremy L Thompson 285ed9e99e6SJeremy L Thompson // Get assembly data 286ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 287437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 288437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 289437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 290437c7c90SJeremy L Thompson CeedBasis *active_bases; 291437c7c90SJeremy L Thompson CeedElemRestriction *active_elem_rstrs; 292437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 293437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 294437c7c90SJeremy L Thompson &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components)); 295437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL)); 296437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs)); 297437c7c90SJeremy L Thompson 298437c7c90SJeremy L Thompson // Loop over all active bases 299437c7c90SJeremy L Thompson for (CeedInt b = 0; b < num_active_bases; b++) { 300eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 301437c7c90SJeremy L Thompson CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b]; 302437c7c90SJeremy L Thompson 303eaf62fffSJeremy L Thompson if (is_pointblock) { 304437c7c90SJeremy L Thompson CeedElemRestriction point_block_elem_rstr; 305437c7c90SJeremy L Thompson 306437c7c90SJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr)); 307437c7c90SJeremy L Thompson diag_elem_rstr = point_block_elem_rstr; 308eaf62fffSJeremy L Thompson } 309eaf62fffSJeremy L Thompson 310eaf62fffSJeremy L Thompson // Create diagonal vector 311eaf62fffSJeremy L Thompson CeedVector elem_diag; 312437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 313eaf62fffSJeremy L Thompson 314eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3159c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 316437c7c90SJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts, num_components; 317437c7c90SJeremy L Thompson 3182b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3192b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 320437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 321437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes)); 322437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components)); 323437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts)); 324ed9e99e6SJeremy L Thompson 325352a5e7cSSebastian Grimberg // Construct identity matrix for basis if required 326ed9e99e6SJeremy L Thompson bool has_eval_none = false; 327352a5e7cSSebastian Grimberg CeedScalar *identity = NULL; 328437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 329437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 330ed9e99e6SJeremy L Thompson } 331437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 332437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 333ed9e99e6SJeremy L Thompson } 334ed9e99e6SJeremy L Thompson if (has_eval_none) { 3352b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3362b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 337eaf62fffSJeremy L Thompson } 338352a5e7cSSebastian Grimberg 339eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 340eaf62fffSJeremy L Thompson // Each element 341b94338b9SJed Brown for (CeedSize e = 0; e < num_elem; e++) { 342eaf62fffSJeremy L Thompson // Each basis eval mode pair 343352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 344352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 345437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 346437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 347352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t); 348352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out)); 349352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 350352a5e7cSSebastian Grimberg if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 351352a5e7cSSebastian Grimberg else B_t = &B_t[(++d_out) * num_qpts * num_nodes]; 352352a5e7cSSebastian Grimberg } 353352a5e7cSSebastian Grimberg eval_mode_out_prev = eval_modes_out[b][e_out]; 354352a5e7cSSebastian Grimberg 355352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 356352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 357437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 358437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 359352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B); 360352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in)); 361352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 362352a5e7cSSebastian Grimberg if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 363352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 364352a5e7cSSebastian Grimberg } 365352a5e7cSSebastian Grimberg eval_mode_in_prev = eval_modes_in[b][e_in]; 366352a5e7cSSebastian Grimberg 367eaf62fffSJeremy L Thompson // Each component 368437c7c90SJeremy L Thompson for (CeedInt c_out = 0; c_out < num_components; c_out++) { 369437c7c90SJeremy L Thompson // Each qpt/node pair 3702b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 371eaf62fffSJeremy L Thompson if (is_pointblock) { 372eaf62fffSJeremy L Thompson // Point Block Diagonal 373437c7c90SJeremy L Thompson for (CeedInt c_in = 0; c_in < num_components; c_in++) { 374b94338b9SJed Brown const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 375437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3762b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 377437c7c90SJeremy L Thompson elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] += 378437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 379eaf62fffSJeremy L Thompson } 3802b730f8bSJeremy L Thompson } 381eaf62fffSJeremy L Thompson } else { 382eaf62fffSJeremy L Thompson // Diagonal Only 383437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 384437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3852b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 386437c7c90SJeremy L Thompson elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 387eaf62fffSJeremy L Thompson } 388eaf62fffSJeremy L Thompson } 389eaf62fffSJeremy L Thompson } 390eaf62fffSJeremy L Thompson } 3912b730f8bSJeremy L Thompson } 3922b730f8bSJeremy L Thompson } 3932b730f8bSJeremy L Thompson } 3942b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 395eaf62fffSJeremy L Thompson 396eaf62fffSJeremy L Thompson // Assemble local operator diagonal 397f30b1135SSebastian Grimberg CeedCall(CeedElemRestrictionApplyUnsigned(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 398eaf62fffSJeremy L Thompson 399eaf62fffSJeremy L Thompson // Cleanup 400437c7c90SJeremy L Thompson if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 4012b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 4022b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 403437c7c90SJeremy L Thompson } 404437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 405437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 406eaf62fffSJeremy L Thompson 407eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 408eaf62fffSJeremy L Thompson } 409eaf62fffSJeremy L Thompson 410eaf62fffSJeremy L Thompson /** 411eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 412eaf62fffSJeremy L Thompson 413eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 414ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 415eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 416eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 417eaf62fffSJeremy L Thompson 418eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 419eaf62fffSJeremy L Thompson 420eaf62fffSJeremy L Thompson @ref Developer 421eaf62fffSJeremy L Thompson **/ 4222b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 423eaf62fffSJeremy L Thompson CeedVector assembled) { 424eaf62fffSJeremy L Thompson CeedInt num_sub; 425eaf62fffSJeremy L Thompson CeedOperator *suboperators; 426c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 427c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 428eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4296aa95790SJeremy L Thompson if (is_pointblock) { 4302b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4316aa95790SJeremy L Thompson } else { 4322b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4336aa95790SJeremy L Thompson } 434eaf62fffSJeremy L Thompson } 435eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 436eaf62fffSJeremy L Thompson } 437eaf62fffSJeremy L Thompson 438eaf62fffSJeremy L Thompson /** 439eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 440eaf62fffSJeremy L Thompson 441eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 442eaf62fffSJeremy L Thompson 4433bdd4e5aSSebastian Grimberg Note: For operators using oriented element restrictions, entries in rows or cols may be negative indicating the assembled value at this nonzero 4443bdd4e5aSSebastian Grimberg should be negated 445f30b1135SSebastian Grimberg 446eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 447eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 448eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 449eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 450eaf62fffSJeremy L Thompson 451eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 452eaf62fffSJeremy L Thompson 453eaf62fffSJeremy L Thompson @ref Developer 454eaf62fffSJeremy L Thompson **/ 4552b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 456f3d47e36SJeremy L Thompson Ceed ceed; 457f3d47e36SJeremy L Thompson bool is_composite; 458f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 459f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 460f3d47e36SJeremy L Thompson 4616574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 462eaf62fffSJeremy L Thompson 463c9366a6bSJeremy L Thompson CeedSize num_nodes; 4642b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 465eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 467e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4682b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4692b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 471eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4722b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 473eaf62fffSJeremy L Thompson 474eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 475eaf62fffSJeremy L Thompson 476eaf62fffSJeremy L Thompson // Determine elem_dof relation 477eaf62fffSJeremy L Thompson CeedVector index_vec; 4782b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 479eaf62fffSJeremy L Thompson CeedScalar *array; 4802b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 481ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4822b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 483eaf62fffSJeremy L Thompson CeedVector elem_dof; 4842b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4852b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4862b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 487eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4882b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4892b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 490eaf62fffSJeremy L Thompson 491eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 492b94338b9SJed Brown CeedSize count = 0; 493ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 494ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 495ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 496ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 497ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 4982b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 4992b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 500eaf62fffSJeremy L Thompson 501eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 502eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 503eaf62fffSJeremy L Thompson 504eaf62fffSJeremy L Thompson rows[offset + count] = row; 505eaf62fffSJeremy L Thompson cols[offset + count] = col; 506eaf62fffSJeremy L Thompson count++; 507eaf62fffSJeremy L Thompson } 508eaf62fffSJeremy L Thompson } 509eaf62fffSJeremy L Thompson } 510eaf62fffSJeremy L Thompson } 511eaf62fffSJeremy L Thompson } 5126574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 5132b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5142b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 515eaf62fffSJeremy L Thompson 516eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 517eaf62fffSJeremy L Thompson } 518eaf62fffSJeremy L Thompson 519eaf62fffSJeremy L Thompson /** 520eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 521eaf62fffSJeremy L Thompson 522eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 523eaf62fffSJeremy L Thompson 524eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 525ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 526eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 527eaf62fffSJeremy L Thompson 528eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 529eaf62fffSJeremy L Thompson 530eaf62fffSJeremy L Thompson @ref Developer 531eaf62fffSJeremy L Thompson **/ 5322b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 533f3d47e36SJeremy L Thompson Ceed ceed; 534f3d47e36SJeremy L Thompson bool is_composite; 535f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 536f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 537f3d47e36SJeremy L Thompson 5386574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 539f3d47e36SJeremy L Thompson 540f3d47e36SJeremy L Thompson // Early exit for empty operator 541f3d47e36SJeremy L Thompson { 542f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 543f3d47e36SJeremy L Thompson 544f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 545f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 546f3d47e36SJeremy L Thompson } 547eaf62fffSJeremy L Thompson 548cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 549cefa2673SJeremy L Thompson // Backend version 5502b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 551cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 552cefa2673SJeremy L Thompson } else { 553cefa2673SJeremy L Thompson // Operator fallback 554cefa2673SJeremy L Thompson CeedOperator op_fallback; 555cefa2673SJeremy L Thompson 5562b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 557cefa2673SJeremy L Thompson if (op_fallback) { 5582b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 559cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 560cefa2673SJeremy L Thompson } 561cefa2673SJeremy L Thompson } 562cefa2673SJeremy L Thompson 563eaf62fffSJeremy L Thompson // Assemble QFunction 564eaf62fffSJeremy L Thompson CeedQFunction qf; 5652b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 566c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 567c5f45aeaSJeremy L Thompson CeedElemRestriction rstr_q = NULL; 5682b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5691f9221feSJeremy L Thompson CeedSize qf_length; 5702b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 571eaf62fffSJeremy L Thompson 5727e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 573eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 574eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5752b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 576eaf62fffSJeremy L Thompson 577ed9e99e6SJeremy L Thompson // Get assembly data 578ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5792b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 580437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 581437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 582437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out, 583437c7c90SJeremy L Thompson &eval_modes_out, NULL, NULL)); 584437c7c90SJeremy L Thompson CeedBasis *bases; 585437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL)); 586437c7c90SJeremy L Thompson CeedBasis basis_in = bases[0]; 587eaf62fffSJeremy L Thompson 5886574a04fSJeremy L Thompson CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases"); 5896574a04fSJeremy L Thompson CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 590eaf62fffSJeremy L Thompson 591ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 592eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5932b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5942b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5952b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 5962b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 5972b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 598eaf62fffSJeremy L Thompson 599eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 600eaf62fffSJeremy L Thompson 601eaf62fffSJeremy L Thompson // loop over elements and put in data structure 602eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6032b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 604eaf62fffSJeremy L Thompson 605eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6062b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6072b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 608eaf62fffSJeremy L Thompson 609eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 610437c7c90SJeremy L Thompson const CeedScalar **B_mats_in, **B_mats_out; 611437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out)); 612437c7c90SJeremy L Thompson const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0]; 613437c7c90SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]]; 614eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 615b94338b9SJed Brown CeedSize count = 0; 616eaf62fffSJeremy L Thompson CeedScalar *vals; 61728ec399dSJeremy L Thompson CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals)); 618b94338b9SJed Brown for (CeedSize e = 0; e < num_elem; e++) { 619ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 620ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 621ed9e99e6SJeremy L Thompson // Compute B^T*D 622b94338b9SJed Brown for (CeedSize n = 0; n < elem_size; n++) { 623b94338b9SJed Brown for (CeedSize q = 0; q < num_qpts; q++) { 624437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 625b94338b9SJed Brown const CeedSize btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in); 626067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 627437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 628b94338b9SJed Brown const CeedSize b_out_index = (num_eval_modes_out[0] * q + e_out) * elem_size + n; 629b94338b9SJed Brown const CeedSize eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out; 630b94338b9SJed Brown const CeedSize qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 631067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 632eaf62fffSJeremy L Thompson } 633067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 634ed9e99e6SJeremy L Thompson } 635ed9e99e6SJeremy L Thompson } 636eaf62fffSJeremy L Thompson } 637eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 638437c7c90SJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0])); 639eaf62fffSJeremy L Thompson 640eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 641ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 642ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 643eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 644eaf62fffSJeremy L Thompson count++; 645eaf62fffSJeremy L Thompson } 646eaf62fffSJeremy L Thompson } 647eaf62fffSJeremy L Thompson } 648eaf62fffSJeremy L Thompson } 649eaf62fffSJeremy L Thompson } 6506574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries"); 6512b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 652eaf62fffSJeremy L Thompson 6532b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6542b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 655eaf62fffSJeremy L Thompson 656eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 657eaf62fffSJeremy L Thompson } 658eaf62fffSJeremy L Thompson 659eaf62fffSJeremy L Thompson /** 660eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 661eaf62fffSJeremy L Thompson 662eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 663eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 664eaf62fffSJeremy L Thompson 665eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 666eaf62fffSJeremy L Thompson 667eaf62fffSJeremy L Thompson @ref Utility 668eaf62fffSJeremy L Thompson **/ 669b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) { 670b275c451SJeremy L Thompson bool is_composite; 671eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 672eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 673eaf62fffSJeremy L Thompson 674b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 6756574a04fSJeremy L Thompson CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 6762b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6772b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6782b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6792b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 680b94338b9SJed Brown *num_entries = (CeedSize)elem_size * num_comp * elem_size * num_comp * num_elem; 681eaf62fffSJeremy L Thompson 682eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 683eaf62fffSJeremy L Thompson } 684eaf62fffSJeremy L Thompson 685eaf62fffSJeremy L Thompson /** 686ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 687eaf62fffSJeremy L Thompson 688eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 68985bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 690eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 691eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 69285bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 693eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 69485bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 69585bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 696eaf62fffSJeremy L Thompson 697eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 698eaf62fffSJeremy L Thompson 699eaf62fffSJeremy L Thompson @ref Developer 700eaf62fffSJeremy L Thompson **/ 7012b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7022b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 703eaf62fffSJeremy L Thompson Ceed ceed; 70485bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 705c17ec2beSJeremy L Thompson CeedElemRestriction rstr_p_mult_fine = NULL; 7062b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 707eaf62fffSJeremy L Thompson 708eaf62fffSJeremy L Thompson // Check for composite operator 709eaf62fffSJeremy L Thompson bool is_composite; 7102b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 7116574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 712eaf62fffSJeremy L Thompson 713eaf62fffSJeremy L Thompson // Coarse Grid 7142b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 715eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 716eaf62fffSJeremy L Thompson // -- Clone input fields 71792ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 718eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 719437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 7202b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 721eaf62fffSJeremy L Thompson } else { 722437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 7232b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 724eaf62fffSJeremy L Thompson } 725eaf62fffSJeremy L Thompson } 726eaf62fffSJeremy L Thompson // -- Clone output fields 72792ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 728eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7292b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 730eaf62fffSJeremy L Thompson } else { 731437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 7322b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 733eaf62fffSJeremy L Thompson } 734eaf62fffSJeremy L Thompson } 735af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7362b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 737eaf62fffSJeremy L Thompson 738eaf62fffSJeremy L Thompson // Multiplicity vector 73985bb9dcfSJeremy L Thompson if (op_restrict || op_prolong) { 74085bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 74185bb9dcfSJeremy L Thompson 742c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine)); 7436574a04fSJeremy L Thompson CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 7442b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7452b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 746c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7472b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 748c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7492b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7502b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 75185bb9dcfSJeremy L Thompson } 752eaf62fffSJeremy L Thompson 753addd79feSZach Atkins // Clone name 754addd79feSZach Atkins bool has_name = op_fine->name; 755addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 756addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 757addd79feSZach Atkins 75883d6adf3SZach Atkins // Check that coarse to fine basis is provided if prolong/restrict operators are requested 7596574a04fSJeremy L Thompson CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE, 7606574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine basis"); 76183d6adf3SZach Atkins 76285bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 763eaf62fffSJeremy L Thompson CeedInt num_comp; 7642b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 765addd79feSZach Atkins 766addd79feSZach Atkins // Restriction 767addd79feSZach Atkins if (op_restrict) { 768eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 76985bb9dcfSJeremy L Thompson CeedQFunction qf_restrict; 77085bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 77185bb9dcfSJeremy L Thompson 77285bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 7732b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 774eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 7752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7762b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7782b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7802b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7822b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 783eaf62fffSJeremy L Thompson 7842b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7852b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 786c17ec2beSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec)); 7872b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 788eaf62fffSJeremy L Thompson 789addd79feSZach Atkins // Set name 790addd79feSZach Atkins char *restriction_name; 791addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 792addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 793addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 794addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 795addd79feSZach Atkins 796addd79feSZach Atkins // Check 797addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_restrict)); 798addd79feSZach Atkins 799addd79feSZach Atkins // Cleanup 800addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_restrict)); 801addd79feSZach Atkins } 802addd79feSZach Atkins 803eaf62fffSJeremy L Thompson // Prolongation 804addd79feSZach Atkins if (op_prolong) { 805eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 80685bb9dcfSJeremy L Thompson CeedQFunction qf_prolong; 80785bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 80885bb9dcfSJeremy L Thompson 80985bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 8102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 811eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 8122b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 8132b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 8142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 8152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8172b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8182b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8192b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 820eaf62fffSJeremy L Thompson 8212b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8222b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 823c17ec2beSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8242b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 825eaf62fffSJeremy L Thompson 826addd79feSZach Atkins // Set name 827ea6b5821SJeremy L Thompson char *prolongation_name; 8282b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8292b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8302b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8312b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 832addd79feSZach Atkins 833addd79feSZach Atkins // Check 834addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 835addd79feSZach Atkins 836addd79feSZach Atkins // Cleanup 837addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 838ea6b5821SJeremy L Thompson } 839ea6b5821SJeremy L Thompson 84058e4b056SJeremy L Thompson // Check 84158e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 84258e4b056SJeremy L Thompson 843eaf62fffSJeremy L Thompson // Cleanup 8442b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 845c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine)); 8462b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 847805fe78eSJeremy L Thompson 848eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 849eaf62fffSJeremy L Thompson } 850eaf62fffSJeremy L Thompson 851eaf62fffSJeremy L Thompson /** 852eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 853eaf62fffSJeremy L Thompson 854eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 855eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 856eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 857eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 858eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 859eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 860eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 861eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 862eaf62fffSJeremy L Thompson 863eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 864eaf62fffSJeremy L Thompson 865eaf62fffSJeremy L Thompson @ref Developer 866eaf62fffSJeremy L Thompson **/ 8672c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff 8682c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d, 8692c2ea1dbSJeremy L Thompson CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8702b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 871eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 872eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8732b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 874eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 875eaf62fffSJeremy L Thompson } 8762b730f8bSJeremy L Thompson } 877eaf62fffSJeremy L Thompson // -- Laplacian 8782b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 879eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 880eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8812b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 882eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 883eaf62fffSJeremy L Thompson } 8842b730f8bSJeremy L Thompson } 885eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8862b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 887eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 888eaf62fffSJeremy L Thompson } 8892c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn 890eaf62fffSJeremy L Thompson 891eaf62fffSJeremy L Thompson /// @} 892eaf62fffSJeremy L Thompson 893eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 894480fae85SJeremy L Thompson /// CeedOperator Backend API 895480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 896480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 897480fae85SJeremy L Thompson /// @{ 898480fae85SJeremy L Thompson 899480fae85SJeremy L Thompson /** 900480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 901480fae85SJeremy L Thompson 902480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 903ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 904480fae85SJeremy L Thompson 905480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 906480fae85SJeremy L Thompson 907480fae85SJeremy L Thompson @ref Backend 908480fae85SJeremy L Thompson **/ 909ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 911480fae85SJeremy L Thompson (*data)->ref_count = 1; 912480fae85SJeremy L Thompson (*data)->ceed = ceed; 9132b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 914480fae85SJeremy L Thompson 915480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 916480fae85SJeremy L Thompson } 917480fae85SJeremy L Thompson 918480fae85SJeremy L Thompson /** 919480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 920480fae85SJeremy L Thompson 921ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 922480fae85SJeremy L Thompson 923480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 924480fae85SJeremy L Thompson 925480fae85SJeremy L Thompson @ref Backend 926480fae85SJeremy L Thompson **/ 927480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 928480fae85SJeremy L Thompson data->ref_count++; 929480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 930480fae85SJeremy L Thompson } 931480fae85SJeremy L Thompson 932480fae85SJeremy L Thompson /** 933beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9348b919e6bSJeremy L Thompson 935ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 936ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9378b919e6bSJeremy L Thompson 9388b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9398b919e6bSJeremy L Thompson 9408b919e6bSJeremy L Thompson @ref Backend 9418b919e6bSJeremy L Thompson **/ 9422b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 943beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 944beecbf24SJeremy L Thompson data->needs_data_update = true; 945beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 946beecbf24SJeremy L Thompson } 947beecbf24SJeremy L Thompson 948beecbf24SJeremy L Thompson /** 949beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 950beecbf24SJeremy L Thompson 951ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 952ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 953beecbf24SJeremy L Thompson 954beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 955beecbf24SJeremy L Thompson 956beecbf24SJeremy L Thompson @ref Backend 957beecbf24SJeremy L Thompson **/ 9582b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 959beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9608b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9618b919e6bSJeremy L Thompson } 9628b919e6bSJeremy L Thompson 9638b919e6bSJeremy L Thompson /** 9648b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9658b919e6bSJeremy L Thompson 9668b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9678b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9688b919e6bSJeremy L Thompson 9698b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9708b919e6bSJeremy L Thompson 9718b919e6bSJeremy L Thompson @ref Backend 9728b919e6bSJeremy L Thompson **/ 9732b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 974beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9758b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9768b919e6bSJeremy L Thompson } 9778b919e6bSJeremy L Thompson 9788b919e6bSJeremy L Thompson /** 979ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 9804385fb7fSSebastian Grimberg 981ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 982512bb800SJeremy L Thompson 983512bb800SJeremy L Thompson Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a 984512bb800SJeremy L Thompson CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this 985512bb800SJeremy L Thompson CeedQFunctionAssemblyData. 986480fae85SJeremy L Thompson 987ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 988ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 989480fae85SJeremy L Thompson 990480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 991480fae85SJeremy L Thompson 992480fae85SJeremy L Thompson @ref Backend 993480fae85SJeremy L Thompson **/ 9942b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 9952b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 9962b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 997480fae85SJeremy L Thompson *data_copy = data; 998480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 999480fae85SJeremy L Thompson } 1000480fae85SJeremy L Thompson 1001480fae85SJeremy L Thompson /** 1002480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 1003480fae85SJeremy L Thompson 1004ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1005480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1006480fae85SJeremy L Thompson 1007480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1008480fae85SJeremy L Thompson 1009480fae85SJeremy L Thompson @ref Backend 1010480fae85SJeremy L Thompson **/ 10112b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1012480fae85SJeremy L Thompson *is_setup = data->is_setup; 1013480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1014480fae85SJeremy L Thompson } 1015480fae85SJeremy L Thompson 1016480fae85SJeremy L Thompson /** 1017480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1018480fae85SJeremy L Thompson 1019ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1020480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1021480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1022480fae85SJeremy L Thompson 1023480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1024480fae85SJeremy L Thompson 1025480fae85SJeremy L Thompson @ref Backend 1026480fae85SJeremy L Thompson **/ 10272b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10282b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10292b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1030480fae85SJeremy L Thompson 1031480fae85SJeremy L Thompson data->is_setup = true; 1032480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1033480fae85SJeremy L Thompson } 1034480fae85SJeremy L Thompson 10352b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 10366574a04fSJeremy L Thompson CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1037480fae85SJeremy L Thompson 10382b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10392b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1040480fae85SJeremy L Thompson 1041480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1042480fae85SJeremy L Thompson } 1043480fae85SJeremy L Thompson 1044480fae85SJeremy L Thompson /** 1045480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1046480fae85SJeremy L Thompson 1047ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1048480fae85SJeremy L Thompson 1049480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1050480fae85SJeremy L Thompson 1051480fae85SJeremy L Thompson @ref Backend 1052480fae85SJeremy L Thompson **/ 1053480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1054ad6481ceSJeremy L Thompson if (!*data || --(*data)->ref_count > 0) { 1055ad6481ceSJeremy L Thompson *data = NULL; 1056ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1057ad6481ceSJeremy L Thompson } 10582b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10592b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10602b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1061480fae85SJeremy L Thompson 10622b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1063480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1064480fae85SJeremy L Thompson } 1065480fae85SJeremy L Thompson 1066ed9e99e6SJeremy L Thompson /** 1067ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1068ed9e99e6SJeremy L Thompson 1069ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1070ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1071ed9e99e6SJeremy L Thompson 1072ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1073ed9e99e6SJeremy L Thompson 1074ed9e99e6SJeremy L Thompson @ref Backend 1075ed9e99e6SJeremy L Thompson **/ 10762b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1077ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1078ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1079ed9e99e6SJeremy L Thompson 10802b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1081ed9e99e6SJeremy L Thompson op->op_assembled = data; 1082ed9e99e6SJeremy L Thompson } 1083ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1084ed9e99e6SJeremy L Thompson 1085ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1086ed9e99e6SJeremy L Thompson } 1087ed9e99e6SJeremy L Thompson 1088ed9e99e6SJeremy L Thompson /** 1089ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1090ba746a46SJeremy L Thompson 1091ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1092ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1093ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1094ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1095ba746a46SJeremy L Thompson CeedEvalMode. 1096ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1097ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1098ed9e99e6SJeremy L Thompson 1099ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1100ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1101ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1102ed9e99e6SJeremy L Thompson 1103ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1104ed9e99e6SJeremy L Thompson 1105ed9e99e6SJeremy L Thompson @ref Backend 1106ed9e99e6SJeremy L Thompson **/ 11072b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1108437c7c90SJeremy L Thompson CeedInt num_active_bases = 0; 1109437c7c90SJeremy L Thompson 1110437c7c90SJeremy L Thompson // Allocate 11112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1112ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11132b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1114ed9e99e6SJeremy L Thompson 1115ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1116ed9e99e6SJeremy L Thompson CeedQFunction qf; 1117ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1118ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1119ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11212b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11222b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1123ed9e99e6SJeremy L Thompson 1124ed9e99e6SJeremy L Thompson // Determine active input basis 1125437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0; 1126437c7c90SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 1127437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 1128ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1129ed9e99e6SJeremy L Thompson CeedVector vec; 11302b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1131ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1132437c7c90SJeremy L Thompson CeedBasis basis_in = NULL; 1133437c7c90SJeremy L Thompson CeedEvalMode eval_mode; 1134352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 11352b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11362b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1137352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1138352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 1139352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp)); 1140437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1141437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_in) index = i; 1142437c7c90SJeremy L Thompson } 1143437c7c90SJeremy L Thompson if (index == -1) { 1144437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 1145437c7c90SJeremy L Thompson index = num_active_bases; 1146437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1147437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1148437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases])); 1149437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1150437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1151437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1152437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases])); 1153437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1154437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1155437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1156437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1157437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1158437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1159437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1160437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1161437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1162437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1163437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1164437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1165437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1166437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1167437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1168437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1169437c7c90SJeremy L Thompson num_active_bases++; 1170437c7c90SJeremy L Thompson } 1171352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1172352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1173352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index])); 1174352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index])); 1175352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1176437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1177437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1178352a5e7cSSebastian Grimberg offset += num_comp; 1179ed9e99e6SJeremy L Thompson } 1180352a5e7cSSebastian Grimberg num_eval_modes_in[index] += q_comp; 1181ed9e99e6SJeremy L Thompson } 1182ed9e99e6SJeremy L Thompson } 1183ed9e99e6SJeremy L Thompson } 1184437c7c90SJeremy L Thompson (*data)->num_eval_modes_in = num_eval_modes_in; 1185437c7c90SJeremy L Thompson (*data)->eval_modes_in = eval_modes_in; 1186437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1187ed9e99e6SJeremy L Thompson 1188ed9e99e6SJeremy L Thompson // Determine active output basis 1189ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 11902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11912b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1192437c7c90SJeremy L Thompson offset = 0; 1193ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1194ed9e99e6SJeremy L Thompson CeedVector vec; 11952b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1196ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1197437c7c90SJeremy L Thompson CeedBasis basis_out = NULL; 1198ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 1199352a5e7cSSebastian Grimberg CeedInt index = -1, dim, num_comp, q_comp; 1200437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 12012b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1202352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDimension(basis_out, &dim)); 1203352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp)); 1204352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp)); 1205437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1206437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_out) index = i; 1207437c7c90SJeremy L Thompson } 1208437c7c90SJeremy L Thompson if (index == -1) { 1209437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 1210437c7c90SJeremy L Thompson 1211437c7c90SJeremy L Thompson index = num_active_bases; 1212437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1213437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1214437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases])); 1215437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1216437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1217437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1218437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases])); 1219437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1220437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1221437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1222437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1223437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1224437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1225437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1226437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1227437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1228437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1229437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1230437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1231437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1232437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1233437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1234437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1235437c7c90SJeremy L Thompson num_active_bases++; 1236437c7c90SJeremy L Thompson } 1237352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1238352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1239352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index])); 1240352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index])); 1241352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1242437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1243437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1244352a5e7cSSebastian Grimberg offset += num_comp; 1245ed9e99e6SJeremy L Thompson } 1246352a5e7cSSebastian Grimberg num_eval_modes_out[index] += q_comp; 1247ed9e99e6SJeremy L Thompson } 1248ed9e99e6SJeremy L Thompson } 1249ed9e99e6SJeremy L Thompson } 1250437c7c90SJeremy L Thompson (*data)->num_output_components = offset; 1251437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1252437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1253437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1254437c7c90SJeremy L Thompson (*data)->num_active_bases = num_active_bases; 1255ed9e99e6SJeremy L Thompson 1256ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1257ed9e99e6SJeremy L Thompson } 1258ed9e99e6SJeremy L Thompson 1259ed9e99e6SJeremy L Thompson /** 1260ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1261ba746a46SJeremy L Thompson 1262ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1263ed9e99e6SJeremy L Thompson 1264ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1265ba746a46SJeremy L Thompson @param[out] num_active_bases Total number of active bases 1266c5d0f995SJed Brown @param[out] num_eval_modes_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1267ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1268c5d0f995SJed Brown @param[out] eval_modes_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1269ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1270c5d0f995SJed Brown @param[out] num_eval_modes_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1271c5d0f995SJed Brown @param[out] eval_modes_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1272437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1273ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1274ba746a46SJeremy L Thompson including contributions of all active bases 1275ed9e99e6SJeremy L Thompson 1276ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1277ed9e99e6SJeremy L Thompson 1278c5d0f995SJed Brown 1279ed9e99e6SJeremy L Thompson @ref Backend 1280ed9e99e6SJeremy L Thompson **/ 1281437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in, 1282437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out, 1283437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) { 1284437c7c90SJeremy L Thompson if (num_active_bases) *num_active_bases = data->num_active_bases; 1285437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1286437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1287437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1288437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1289437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1290437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1291437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1292ed9e99e6SJeremy L Thompson 1293ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1294ed9e99e6SJeremy L Thompson } 1295ed9e99e6SJeremy L Thompson 1296ed9e99e6SJeremy L Thompson /** 1297ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1298ba746a46SJeremy L Thompson 1299ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1300ed9e99e6SJeremy L Thompson 1301ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1302437c7c90SJeremy L Thompson @param[out] num_active_bases Number of active bases, or NULL 1303437c7c90SJeremy L Thompson @param[out] active_bases Pointer to hold active CeedBasis, or NULL 1304437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1305437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1306ed9e99e6SJeremy L Thompson 1307ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1308ed9e99e6SJeremy L Thompson 1309ed9e99e6SJeremy L Thompson @ref Backend 1310ed9e99e6SJeremy L Thompson **/ 1311437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases, 1312437c7c90SJeremy L Thompson const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) { 1313ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1314437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1315437c7c90SJeremy L Thompson CeedInt num_qpts; 1316437c7c90SJeremy L Thompson 1317437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1318437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1319352a5e7cSSebastian Grimberg CeedInt num_nodes; 1320437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1321ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1322ed9e99e6SJeremy L Thompson 1323352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1324352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in)); 1325ed9e99e6SJeremy L Thompson 1326437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1327437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1328ed9e99e6SJeremy L Thompson } 1329ed9e99e6SJeremy L Thompson if (has_eval_none) { 1330352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1331352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1332352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1333ed9e99e6SJeremy L Thompson } 1334ed9e99e6SJeremy L Thompson } 1335ed9e99e6SJeremy L Thompson 1336ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1337352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1338352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 1339352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 1340437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1341437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1342437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1343352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B); 1344352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in)); 1345352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 1346352a5e7cSSebastian Grimberg if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 1347352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 1348352a5e7cSSebastian Grimberg } 1349352a5e7cSSebastian Grimberg eval_mode_in_prev = data->eval_modes_in[b][e_in]; 1350352a5e7cSSebastian Grimberg B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n]; 1351ed9e99e6SJeremy L Thompson } 1352ed9e99e6SJeremy L Thompson } 1353ed9e99e6SJeremy L Thompson } 1354437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1355437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1356437c7c90SJeremy L Thompson } 1357ed9e99e6SJeremy L Thompson } 1358ed9e99e6SJeremy L Thompson 1359437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1360437c7c90SJeremy L Thompson CeedInt num_qpts; 1361437c7c90SJeremy L Thompson 1362437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1363437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1364352a5e7cSSebastian Grimberg CeedInt num_nodes; 1365ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1366437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1367ed9e99e6SJeremy L Thompson 1368352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes)); 1369352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out)); 1370ed9e99e6SJeremy L Thompson 1371437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1372437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1373ed9e99e6SJeremy L Thompson } 1374ed9e99e6SJeremy L Thompson if (has_eval_none) { 1375352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1376352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1377352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1378ed9e99e6SJeremy L Thompson } 1379ed9e99e6SJeremy L Thompson } 1380ed9e99e6SJeremy L Thompson 1381ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1382352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1383352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 1384352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 1385437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1386437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1387437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1388352a5e7cSSebastian Grimberg CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B); 1389352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out)); 1390352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 1391352a5e7cSSebastian Grimberg if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 1392352a5e7cSSebastian Grimberg else B = &B[(++d_out) * num_qpts * num_nodes]; 1393352a5e7cSSebastian Grimberg } 1394352a5e7cSSebastian Grimberg eval_mode_out_prev = data->eval_modes_out[b][e_out]; 1395352a5e7cSSebastian Grimberg B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n]; 1396ed9e99e6SJeremy L Thompson } 1397ed9e99e6SJeremy L Thompson } 1398ed9e99e6SJeremy L Thompson } 1399437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1400437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1401437c7c90SJeremy L Thompson } 1402ed9e99e6SJeremy L Thompson } 1403ed9e99e6SJeremy L Thompson 1404437c7c90SJeremy L Thompson // Pass out assembled data 1405437c7c90SJeremy L Thompson if (active_bases) *active_bases = data->active_bases; 1406437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1407437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1408437c7c90SJeremy L Thompson 1409437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1410437c7c90SJeremy L Thompson } 1411437c7c90SJeremy L Thompson 1412437c7c90SJeremy L Thompson /** 1413ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1414ba746a46SJeremy L Thompson 1415ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1416437c7c90SJeremy L Thompson 1417437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1418437c7c90SJeremy L Thompson @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL 1419437c7c90SJeremy L Thompson @param[out] active_elem_rstrs Pointer to hold active CeedElemRestrictions, or NULL 1420437c7c90SJeremy L Thompson 1421437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1422437c7c90SJeremy L Thompson 1423437c7c90SJeremy L Thompson @ref Backend 1424437c7c90SJeremy L Thompson **/ 1425437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs, 1426437c7c90SJeremy L Thompson CeedElemRestriction **active_elem_rstrs) { 1427437c7c90SJeremy L Thompson if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases; 1428437c7c90SJeremy L Thompson if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs; 1429ed9e99e6SJeremy L Thompson 1430ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1431ed9e99e6SJeremy L Thompson } 1432ed9e99e6SJeremy L Thompson 1433ed9e99e6SJeremy L Thompson /** 1434ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1435ed9e99e6SJeremy L Thompson 1436ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1437ed9e99e6SJeremy L Thompson 1438ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1439ed9e99e6SJeremy L Thompson 1440ed9e99e6SJeremy L Thompson @ref Backend 1441ed9e99e6SJeremy L Thompson **/ 1442ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1443ad6481ceSJeremy L Thompson if (!*data) { 1444ad6481ceSJeremy L Thompson *data = NULL; 1445ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1446ad6481ceSJeremy L Thompson } 14472b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1448437c7c90SJeremy L Thompson for (CeedInt b = 0; b < (*data)->num_active_bases; b++) { 1449437c7c90SJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->active_bases[b])); 1450437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b])); 1451437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1452437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1453437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1454437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1455437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1456437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1457437c7c90SJeremy L Thompson } 1458437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_bases)); 1459437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_elem_rstrs)); 1460437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1461437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1462437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1463437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1464437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1465437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1466437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1467437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1468ed9e99e6SJeremy L Thompson 14692b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1470ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1471ed9e99e6SJeremy L Thompson } 1472ed9e99e6SJeremy L Thompson 1473480fae85SJeremy L Thompson /// @} 1474480fae85SJeremy L Thompson 1475480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1476eaf62fffSJeremy L Thompson /// CeedOperator Public API 1477eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1478eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1479eaf62fffSJeremy L Thompson /// @{ 1480eaf62fffSJeremy L Thompson 1481eaf62fffSJeremy L Thompson /** 1482eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1483eaf62fffSJeremy L Thompson 1484ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1485859c15bbSJames Wright The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices 1486859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element. 1487859c15bbSJames Wright 14889fd66db6SSebastian Grimberg Inputs and outputs are in the order provided by the user when adding CeedOperator fields. 14899fd66db6SSebastian Grimberg For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction 14909fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v]. 1491eaf62fffSJeremy L Thompson 1492ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1493f04ea552SJeremy L Thompson 1494ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1495ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1496ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1497ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1498eaf62fffSJeremy L Thompson 1499eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1500eaf62fffSJeremy L Thompson 1501eaf62fffSJeremy L Thompson @ref User 1502eaf62fffSJeremy L Thompson **/ 15032b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15042b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1505eaf62fffSJeremy L Thompson 1506eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1507d04bbc78SJeremy L Thompson // Backend version 15082b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1509eaf62fffSJeremy L Thompson } else { 1510d04bbc78SJeremy L Thompson // Operator fallback 1511d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1512d04bbc78SJeremy L Thompson 15132b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15146574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 15156574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 151670a7ffb3SJeremy L Thompson } 1517eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1518eaf62fffSJeremy L Thompson } 151970a7ffb3SJeremy L Thompson 152070a7ffb3SJeremy L Thompson /** 1521ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 15224385fb7fSSebastian Grimberg 1523ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1524ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1525ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 152670a7ffb3SJeremy L Thompson 1527c5f45aeaSJeremy L Thompson Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers. 1528c5f45aeaSJeremy L Thompson These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object. 1529c5f45aeaSJeremy L Thompson 1530ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1531ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1532ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1533ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 153470a7ffb3SJeremy L Thompson 153570a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 153670a7ffb3SJeremy L Thompson 153770a7ffb3SJeremy L Thompson @ref User 153870a7ffb3SJeremy L Thompson **/ 15392b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15402b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 154170a7ffb3SJeremy L Thompson 154270a7ffb3SJeremy L Thompson if (op->LinearAssembleQFunctionUpdate) { 1543d04bbc78SJeremy L Thompson // Backend version 1544480fae85SJeremy L Thompson bool qf_assembled_is_setup; 15452efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 15462efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1547480fae85SJeremy L Thompson 15482b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1549480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1550d04bbc78SJeremy L Thompson bool update_needed; 1551d04bbc78SJeremy L Thompson 15522b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 15532b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 1554c5f45aeaSJeremy L Thompson if (update_needed) CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request)); 155570a7ffb3SJeremy L Thompson } else { 15562b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request)); 15572b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 155870a7ffb3SJeremy L Thompson } 15592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 15602efa2d85SJeremy L Thompson 1561d04bbc78SJeremy L Thompson // Copy reference from internally held copy 15622b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 15632b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 1564c5f45aeaSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 15652b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 156670a7ffb3SJeremy L Thompson } else { 1567d04bbc78SJeremy L Thompson // Operator fallback 1568d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1569d04bbc78SJeremy L Thompson 15702b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 15716574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 15726574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 157370a7ffb3SJeremy L Thompson } 157470a7ffb3SJeremy L Thompson 157570a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1576eaf62fffSJeremy L Thompson } 1577eaf62fffSJeremy L Thompson 1578eaf62fffSJeremy L Thompson /** 1579eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1580eaf62fffSJeremy L Thompson 1581eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1582eaf62fffSJeremy L Thompson 1583ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1584eaf62fffSJeremy L Thompson 1585ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1586f04ea552SJeremy L Thompson 1587ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1588eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1589ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1590eaf62fffSJeremy L Thompson 1591eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1592eaf62fffSJeremy L Thompson 1593eaf62fffSJeremy L Thompson @ref User 1594eaf62fffSJeremy L Thompson **/ 15952b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1596f3d47e36SJeremy L Thompson bool is_composite; 15972b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1598f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1599eaf62fffSJeremy L Thompson 1600c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16012b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16026574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1603c9366a6bSJeremy L Thompson 1604f3d47e36SJeremy L Thompson // Early exit for empty operator 1605f3d47e36SJeremy L Thompson if (!is_composite) { 1606f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1607f3d47e36SJeremy L Thompson 1608f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1609f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1610f3d47e36SJeremy L Thompson } 1611f3d47e36SJeremy L Thompson 1612eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1613d04bbc78SJeremy L Thompson // Backend version 16142b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1615eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1616eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1617d04bbc78SJeremy L Thompson // Backend version with zeroing first 16182b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16192b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1620eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1621eaf62fffSJeremy L Thompson } else { 1622d04bbc78SJeremy L Thompson // Operator fallback 1623d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1624d04bbc78SJeremy L Thompson 16252b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1626d04bbc78SJeremy L Thompson if (op_fallback) { 16272b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1628eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1629eaf62fffSJeremy L Thompson } 1630eaf62fffSJeremy L Thompson } 1631eaf62fffSJeremy L Thompson // Default interface implementation 16322b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16332b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1634d04bbc78SJeremy L Thompson 1635eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1636eaf62fffSJeremy L Thompson } 1637eaf62fffSJeremy L Thompson 1638eaf62fffSJeremy L Thompson /** 1639eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1640eaf62fffSJeremy L Thompson 1641eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1642eaf62fffSJeremy L Thompson 1643ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1644eaf62fffSJeremy L Thompson 1645ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1646f04ea552SJeremy L Thompson 1647ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1648eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1649ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1650eaf62fffSJeremy L Thompson 1651eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1652eaf62fffSJeremy L Thompson 1653eaf62fffSJeremy L Thompson @ref User 1654eaf62fffSJeremy L Thompson **/ 16552b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1656f3d47e36SJeremy L Thompson bool is_composite; 16572b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1658f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1659eaf62fffSJeremy L Thompson 1660c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16612b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16626574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1663c9366a6bSJeremy L Thompson 1664f3d47e36SJeremy L Thompson // Early exit for empty operator 1665f3d47e36SJeremy L Thompson if (!is_composite) { 1666f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1667f3d47e36SJeremy L Thompson 1668f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1669f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1670f3d47e36SJeremy L Thompson } 1671f3d47e36SJeremy L Thompson 1672eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1673d04bbc78SJeremy L Thompson // Backend version 16742b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1675eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1676eaf62fffSJeremy L Thompson } else { 1677d04bbc78SJeremy L Thompson // Operator fallback 1678d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1679d04bbc78SJeremy L Thompson 16802b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1681d04bbc78SJeremy L Thompson if (op_fallback) { 16822b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1683eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1684eaf62fffSJeremy L Thompson } 1685eaf62fffSJeremy L Thompson } 1686eaf62fffSJeremy L Thompson // Default interface implementation 1687eaf62fffSJeremy L Thompson if (is_composite) { 16882b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1689eaf62fffSJeremy L Thompson } else { 16902b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1691eaf62fffSJeremy L Thompson } 1692d04bbc78SJeremy L Thompson 1693d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1694eaf62fffSJeremy L Thompson } 1695eaf62fffSJeremy L Thompson 1696eaf62fffSJeremy L Thompson /** 1697eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1698eaf62fffSJeremy L Thompson 1699ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1700eaf62fffSJeremy L Thompson 1701ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1702eaf62fffSJeremy L Thompson 1703ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1704f04ea552SJeremy L Thompson 1705ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1706ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1707ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1708ea61e9acSJeremy L Thompson component in]. 1709ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1710eaf62fffSJeremy L Thompson 1711eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1712eaf62fffSJeremy L Thompson 1713eaf62fffSJeremy L Thompson @ref User 1714eaf62fffSJeremy L Thompson **/ 17152b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1716f3d47e36SJeremy L Thompson bool is_composite; 17172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1718f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1719eaf62fffSJeremy L Thompson 1720c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17212b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17226574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1723c9366a6bSJeremy L Thompson 1724f3d47e36SJeremy L Thompson // Early exit for empty operator 1725f3d47e36SJeremy L Thompson if (!is_composite) { 1726f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1727f3d47e36SJeremy L Thompson 1728f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1729f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1730f3d47e36SJeremy L Thompson } 1731f3d47e36SJeremy L Thompson 1732eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1733d04bbc78SJeremy L Thompson // Backend version 17342b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1735eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1736eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1737d04bbc78SJeremy L Thompson // Backend version with zeroing first 17382b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17392b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1740eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1741eaf62fffSJeremy L Thompson } else { 1742d04bbc78SJeremy L Thompson // Operator fallback 1743d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1744d04bbc78SJeremy L Thompson 17452b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1746d04bbc78SJeremy L Thompson if (op_fallback) { 17472b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1748eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1749eaf62fffSJeremy L Thompson } 1750eaf62fffSJeremy L Thompson } 1751eaf62fffSJeremy L Thompson // Default interface implementation 17522b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17532b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1754d04bbc78SJeremy L Thompson 1755eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1756eaf62fffSJeremy L Thompson } 1757eaf62fffSJeremy L Thompson 1758eaf62fffSJeremy L Thompson /** 1759eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1760eaf62fffSJeremy L Thompson 1761ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1762eaf62fffSJeremy L Thompson 1763ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1764eaf62fffSJeremy L Thompson 1765ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1766f04ea552SJeremy L Thompson 1767ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1768ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1769ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1770ea61e9acSJeremy L Thompson component in]. 1771ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1772eaf62fffSJeremy L Thompson 1773eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1774eaf62fffSJeremy L Thompson 1775eaf62fffSJeremy L Thompson @ref User 1776eaf62fffSJeremy L Thompson **/ 17772b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1778f3d47e36SJeremy L Thompson bool is_composite; 17792b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1780f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1781eaf62fffSJeremy L Thompson 1782c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17832b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17846574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1785c9366a6bSJeremy L Thompson 1786f3d47e36SJeremy L Thompson // Early exit for empty operator 1787f3d47e36SJeremy L Thompson if (!is_composite) { 1788f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1789f3d47e36SJeremy L Thompson 1790f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1791f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1792f3d47e36SJeremy L Thompson } 1793f3d47e36SJeremy L Thompson 1794eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1795d04bbc78SJeremy L Thompson // Backend version 17962b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1797eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1798eaf62fffSJeremy L Thompson } else { 1799d04bbc78SJeremy L Thompson // Operator fallback 1800d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1801d04bbc78SJeremy L Thompson 18022b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1803d04bbc78SJeremy L Thompson if (op_fallback) { 18042b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1805eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1806eaf62fffSJeremy L Thompson } 1807eaf62fffSJeremy L Thompson } 1808ea61e9acSJeremy L Thompson // Default interface implementation 1809eaf62fffSJeremy L Thompson if (is_composite) { 18102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1811eaf62fffSJeremy L Thompson } else { 18122b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1813eaf62fffSJeremy L Thompson } 1814d04bbc78SJeremy L Thompson 1815d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1816eaf62fffSJeremy L Thompson } 1817eaf62fffSJeremy L Thompson 1818eaf62fffSJeremy L Thompson /** 1819eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1820eaf62fffSJeremy L Thompson 1821ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1822eaf62fffSJeremy L Thompson 1823ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 18249fd66db6SSebastian Grimberg matrix in entry (i, j). 18259fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 18269fd66db6SSebastian Grimberg This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1827eaf62fffSJeremy L Thompson 1828eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1829eaf62fffSJeremy L Thompson 1830ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1831f04ea552SJeremy L Thompson 1832eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1833eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1834eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1835eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1836eaf62fffSJeremy L Thompson 1837eaf62fffSJeremy L Thompson @ref User 1838eaf62fffSJeremy L Thompson **/ 18392b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1840b94338b9SJed Brown CeedInt num_suboperators; 1841b94338b9SJed Brown CeedSize single_entries; 1842eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1843eaf62fffSJeremy L Thompson bool is_composite; 18442b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1845f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1846eaf62fffSJeremy L Thompson 1847eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1848d04bbc78SJeremy L Thompson // Backend version 18492b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1850eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1851eaf62fffSJeremy L Thompson } else { 1852d04bbc78SJeremy L Thompson // Operator fallback 1853d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1854d04bbc78SJeremy L Thompson 18552b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1856d04bbc78SJeremy L Thompson if (op_fallback) { 18572b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1858eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1859eaf62fffSJeremy L Thompson } 1860eaf62fffSJeremy L Thompson } 1861eaf62fffSJeremy L Thompson 1862eaf62fffSJeremy L Thompson // Default interface implementation 1863eaf62fffSJeremy L Thompson 1864eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1865eaf62fffSJeremy L Thompson *num_entries = 0; 1866eaf62fffSJeremy L Thompson if (is_composite) { 1867c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1868c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 186992ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18702b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1871eaf62fffSJeremy L Thompson *num_entries += single_entries; 1872eaf62fffSJeremy L Thompson } 1873eaf62fffSJeremy L Thompson } else { 18742b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1875eaf62fffSJeremy L Thompson *num_entries += single_entries; 1876eaf62fffSJeremy L Thompson } 18772b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 18782b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1879eaf62fffSJeremy L Thompson 1880eaf62fffSJeremy L Thompson // assemble nonzero locations 1881eaf62fffSJeremy L Thompson CeedInt offset = 0; 1882eaf62fffSJeremy L Thompson if (is_composite) { 1883c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1884c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 188592ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 18862b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 18872b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1888eaf62fffSJeremy L Thompson offset += single_entries; 1889eaf62fffSJeremy L Thompson } 1890eaf62fffSJeremy L Thompson } else { 18912b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1892eaf62fffSJeremy L Thompson } 1893eaf62fffSJeremy L Thompson 1894eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1895eaf62fffSJeremy L Thompson } 1896eaf62fffSJeremy L Thompson 1897eaf62fffSJeremy L Thompson /** 1898eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1899eaf62fffSJeremy L Thompson 1900ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1901eaf62fffSJeremy L Thompson 1902ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 19039fd66db6SSebastian Grimberg matrix in entry (i, j). 19049fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 19059fd66db6SSebastian Grimberg This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1906eaf62fffSJeremy L Thompson 1907eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1908eaf62fffSJeremy L Thompson 1909ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1910f04ea552SJeremy L Thompson 1911eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1912eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1913eaf62fffSJeremy L Thompson 1914eaf62fffSJeremy L Thompson @ref User 1915eaf62fffSJeremy L Thompson **/ 1916eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1917b94338b9SJed Brown CeedInt num_suboperators; 1918b94338b9SJed Brown CeedSize single_entries = 0; 1919eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1920f3d47e36SJeremy L Thompson bool is_composite; 19212b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1922f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1923f3d47e36SJeremy L Thompson 1924f3d47e36SJeremy L Thompson // Early exit for empty operator 1925f3d47e36SJeremy L Thompson if (!is_composite) { 1926f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1927f3d47e36SJeremy L Thompson 1928f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1929f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1930f3d47e36SJeremy L Thompson } 1931eaf62fffSJeremy L Thompson 1932eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1933d04bbc78SJeremy L Thompson // Backend version 19342b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1935eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1936eaf62fffSJeremy L Thompson } else { 1937d04bbc78SJeremy L Thompson // Operator fallback 1938d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1939d04bbc78SJeremy L Thompson 19402b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1941d04bbc78SJeremy L Thompson if (op_fallback) { 19422b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1943eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1944eaf62fffSJeremy L Thompson } 1945eaf62fffSJeremy L Thompson } 1946eaf62fffSJeremy L Thompson 1947eaf62fffSJeremy L Thompson // Default interface implementation 1948eaf62fffSJeremy L Thompson CeedInt offset = 0; 194928ec399dSJeremy L Thompson CeedCall(CeedVectorSetValue(values, 0.0)); 1950eaf62fffSJeremy L Thompson if (is_composite) { 1951c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1952c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1953cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 19542b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 19552b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1956eaf62fffSJeremy L Thompson offset += single_entries; 1957eaf62fffSJeremy L Thompson } 1958eaf62fffSJeremy L Thompson } else { 19592b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1960eaf62fffSJeremy L Thompson } 1961eaf62fffSJeremy L Thompson 1962eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1963eaf62fffSJeremy L Thompson } 1964eaf62fffSJeremy L Thompson 1965eaf62fffSJeremy L Thompson /** 196675f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 196775f0d5a4SJeremy L Thompson 196875f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 196975f0d5a4SJeremy L Thompson 197075f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 197175f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 197275f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 197375f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 197475f0d5a4SJeremy L Thompson 197575f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 197675f0d5a4SJeremy L Thompson 197775f0d5a4SJeremy L Thompson @ref User 197875f0d5a4SJeremy L Thompson **/ 197975f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 198075f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 198175f0d5a4SJeremy L Thompson 198275f0d5a4SJeremy L Thompson Ceed ceed; 1983b275c451SJeremy L Thompson CeedInt num_suboperators; 198475f0d5a4SJeremy L Thompson CeedSize l_vec_len; 198575f0d5a4SJeremy L Thompson CeedScalar *mult_array; 198675f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 1987437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr; 1988b275c451SJeremy L Thompson CeedOperator *sub_operators; 198975f0d5a4SJeremy L Thompson 199075f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 199175f0d5a4SJeremy L Thompson 199275f0d5a4SJeremy L Thompson // Zero mult vector 199375f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 199475f0d5a4SJeremy L Thompson 199575f0d5a4SJeremy L Thompson // Get suboperators 1996b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1997b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1998b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 199975f0d5a4SJeremy L Thompson 200075f0d5a4SJeremy L Thompson // Work vector 200175f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 200275f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 200375f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 200475f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 200575f0d5a4SJeremy L Thompson 200675f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 2007b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 200875f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 200975f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 201075f0d5a4SJeremy L Thompson 201175f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 201275f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 201375f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 201475f0d5a4SJeremy L Thompson } 201575f0d5a4SJeremy L Thompson 201675f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2017437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 2018437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 201975f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 2020437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 2021437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 202275f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 202375f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 202475f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 202575f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 202675f0d5a4SJeremy L Thompson } 202775f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 202875f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 202975f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 203075f0d5a4SJeremy L Thompson } 203175f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2032811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 203375f0d5a4SJeremy L Thompson 203475f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 203575f0d5a4SJeremy L Thompson } 203675f0d5a4SJeremy L Thompson 203775f0d5a4SJeremy L Thompson /** 2038ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2039ea61e9acSJeremy L Thompson grid interpolation 2040eaf62fffSJeremy L Thompson 204158e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2042f04ea552SJeremy L Thompson 2043eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 204485bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2045eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2046eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2047eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 204885bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 204985bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2050eaf62fffSJeremy L Thompson 2051eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2052eaf62fffSJeremy L Thompson 2053eaf62fffSJeremy L Thompson @ref User 2054eaf62fffSJeremy L Thompson **/ 20552b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20562b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 20572b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2058eaf62fffSJeremy L Thompson 205983d6adf3SZach Atkins // Build prolongation matrix, if required 206083d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 206183d6adf3SZach Atkins if (op_prolong || op_restrict) { 206283d6adf3SZach Atkins CeedBasis basis_fine; 20632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 20642b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 206583d6adf3SZach Atkins } 2066eaf62fffSJeremy L Thompson 2067f113e5dcSJeremy L Thompson // Core code 20682b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2069f113e5dcSJeremy L Thompson 2070eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2071eaf62fffSJeremy L Thompson } 2072eaf62fffSJeremy L Thompson 2073eaf62fffSJeremy L Thompson /** 2074ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2075eaf62fffSJeremy L Thompson 207658e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2077f04ea552SJeremy L Thompson 2078eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 207985bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2080eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2081eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 208285bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2083eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 208485bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 208585bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2086eaf62fffSJeremy L Thompson 2087eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2088eaf62fffSJeremy L Thompson 2089eaf62fffSJeremy L Thompson @ref User 2090eaf62fffSJeremy L Thompson **/ 20912b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20922b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 20932b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 20942b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2095eaf62fffSJeremy L Thompson Ceed ceed; 20962b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2097eaf62fffSJeremy L Thompson 2098eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2099eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21002b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2101eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21022b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21032b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21046574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2105eaf62fffSJeremy L Thompson 210683d6adf3SZach Atkins // Create coarse to fine basis, if required 210783d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 210883d6adf3SZach Atkins if (op_prolong || op_restrict) { 210983d6adf3SZach Atkins // Check if interpolation matrix is provided 21106574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21116574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2112eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 21132b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21142b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21152b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 21162b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 21172b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2118eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21192b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 21202b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 21212b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 21222b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21232b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21242b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21252b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 212683d6adf3SZach Atkins } 2127eaf62fffSJeremy L Thompson 2128eaf62fffSJeremy L Thompson // Core code 21292b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2130eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2131eaf62fffSJeremy L Thompson } 2132eaf62fffSJeremy L Thompson 2133eaf62fffSJeremy L Thompson /** 2134ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2135eaf62fffSJeremy L Thompson 213658e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2137f04ea552SJeremy L Thompson 2138eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 213985bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2140eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2141eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 214285bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2143eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 214485bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 214585bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2146eaf62fffSJeremy L Thompson 2147eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2148eaf62fffSJeremy L Thompson 2149eaf62fffSJeremy L Thompson @ref User 2150eaf62fffSJeremy L Thompson **/ 21512b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21522b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2153eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 21542b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2155eaf62fffSJeremy L Thompson Ceed ceed; 21562b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2157eaf62fffSJeremy L Thompson 2158eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2159eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21602b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2161eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21622b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21632b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21646574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2165eaf62fffSJeremy L Thompson 2166eaf62fffSJeremy L Thompson // Coarse to fine basis 216783d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 216883d6adf3SZach Atkins if (op_prolong || op_restrict) { 216983d6adf3SZach Atkins // Check if interpolation matrix is provided 21706574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 21716574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 2172eaf62fffSJeremy L Thompson CeedElemTopology topo; 21732b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2174eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 21752b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21762b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21772b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 21782b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2179eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21802b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 21812b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 21822b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 21832b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21842b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21852b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21862b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 218783d6adf3SZach Atkins } 2188eaf62fffSJeremy L Thompson 2189eaf62fffSJeremy L Thompson // Core code 21902b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2191eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2192eaf62fffSJeremy L Thompson } 2193eaf62fffSJeremy L Thompson 2194eaf62fffSJeremy L Thompson /** 2195ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2196eaf62fffSJeremy L Thompson 2197ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2198859c15bbSJames Wright This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$. 2199859c15bbSJames Wright The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T 22009fd66db6SSebastian Grimberg \hat S V\f$. 22019fd66db6SSebastian Grimberg The CeedOperator must be linear and non-composite. 22029fd66db6SSebastian Grimberg The associated CeedQFunction must therefore also be linear. 2203eaf62fffSJeremy L Thompson 2204ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2205f04ea552SJeremy L Thompson 2206ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2207ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2208ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2209eaf62fffSJeremy L Thompson 2210eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2211eaf62fffSJeremy L Thompson 2212480fae85SJeremy L Thompson @ref User 2213eaf62fffSJeremy L Thompson **/ 22142b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 22152b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2216eaf62fffSJeremy L Thompson 2217eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2218d04bbc78SJeremy L Thompson // Backend version 22192b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2220eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2221eaf62fffSJeremy L Thompson } else { 2222d04bbc78SJeremy L Thompson // Operator fallback 2223d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2224d04bbc78SJeremy L Thompson 22252b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2226d04bbc78SJeremy L Thompson if (op_fallback) { 22272b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2228eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2229eaf62fffSJeremy L Thompson } 2230eaf62fffSJeremy L Thompson } 2231eaf62fffSJeremy L Thompson 2232d04bbc78SJeremy L Thompson // Default interface implementation 2233eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 22342b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 22352b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2236eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2237eaf62fffSJeremy L Thompson CeedQFunction qf; 22382b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2239eaf62fffSJeremy L Thompson 2240eaf62fffSJeremy L Thompson // Determine active input basis 2241eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2242eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2243eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2244eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2245eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2246eaf62fffSJeremy L Thompson CeedInt num_input_fields; 22472b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 22482b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2249eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2250eaf62fffSJeremy L Thompson CeedVector vec; 22512b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2252eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2253eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 22542b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2255eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2256eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 22572b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 22582b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2259eaf62fffSJeremy L Thompson } 2260eaf62fffSJeremy L Thompson } 22616574a04fSJeremy L Thompson CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set"); 2262e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2263352a5e7cSSebastian Grimberg CeedInt P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1; 22642b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 2265352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(basis, &num_nodes)); 22662b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 22672b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 22682b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 22692b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 22702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 22712b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2272eaf62fffSJeremy L Thompson 2273eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 22746574a04fSJeremy L Thompson bool is_tensor_basis; 22756574a04fSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis)); 22766574a04fSJeremy L Thompson CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2277eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 22782b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 22792b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 22802b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 22812b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 22822b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2283eaf62fffSJeremy L Thompson // -- Build matrices 2284eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 22852b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 22862b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 22872b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 22882b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2289eaf62fffSJeremy L Thompson 2290eaf62fffSJeremy L Thompson // -- Diagonalize 22912b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 22922b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 22932b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 22942b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 22952b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 22962b730f8bSJeremy L Thompson } 22972b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2298eaf62fffSJeremy L Thompson 2299eaf62fffSJeremy L Thompson // Assemble QFunction 2300c5f45aeaSJeremy L Thompson CeedVector assembled = NULL; 2301c5f45aeaSJeremy L Thompson CeedElemRestriction rstr_qf = NULL; 23022b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2303eaf62fffSJeremy L Thompson CeedInt layout[3]; 23042b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 23052b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2306eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 23072b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2308eaf62fffSJeremy L Thompson 2309eaf62fffSJeremy L Thompson // Calculate element averages 2310eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2311eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2312eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2313eaf62fffSJeremy L Thompson CeedVector q_weight; 23142b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 23152b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 23162b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 23172b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 23182b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2319eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2320eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2321eaf62fffSJeremy L Thompson CeedInt count = 0; 23222b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 23232b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 23242b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 23252b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2326eaf62fffSJeremy L Thompson count++; 2327eaf62fffSJeremy L Thompson } 23282b730f8bSJeremy L Thompson } 23292b730f8bSJeremy L Thompson } 2330eaf62fffSJeremy L Thompson if (count) { 2331eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2332eaf62fffSJeremy L Thompson } else { 2333eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2334eaf62fffSJeremy L Thompson } 2335eaf62fffSJeremy L Thompson } 23362b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 23372b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 23382b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 23392b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2340eaf62fffSJeremy L Thompson 2341eaf62fffSJeremy L Thompson // Build FDM diagonal 2342eaf62fffSJeremy L Thompson CeedVector q_data; 2343eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 2344352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal)); 2345352a5e7cSSebastian Grimberg const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON; 23462b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2347352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 2348352a5e7cSSebastian Grimberg if (interp) fdm_diagonal[c * num_nodes + n] = 1.0; 23492b730f8bSJeremy L Thompson if (grad) { 2350eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2351eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2352352a5e7cSSebastian Grimberg fdm_diagonal[c * num_nodes + n] += lambda[i]; 2353eaf62fffSJeremy L Thompson } 2354eaf62fffSJeremy L Thompson } 2355352a5e7cSSebastian Grimberg if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound; 23562b730f8bSJeremy L Thompson } 23572b730f8bSJeremy L Thompson } 2358352a5e7cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data)); 23592b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 23602b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 23612b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 23622b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2363352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]); 23642b730f8bSJeremy L Thompson } 23652b730f8bSJeremy L Thompson } 23662b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 23672b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 23682b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2369eaf62fffSJeremy L Thompson 2370eaf62fffSJeremy L Thompson // Setup FDM operator 2371eaf62fffSJeremy L Thompson // -- Basis 2372eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2373eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 23742b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 23752b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 23762b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 23772b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 23782b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 23792b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 23802b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 23812b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 23822b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2383eaf62fffSJeremy L Thompson 2384eaf62fffSJeremy L Thompson // -- Restriction 2385eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2386352a5e7cSSebastian Grimberg CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp}; 2387352a5e7cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i)); 2388eaf62fffSJeremy L Thompson // -- QFunction 2389eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 23902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 23912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 23922b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 23932b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 23942b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2395eaf62fffSJeremy L Thompson // -- QFunction context 2396eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 23972b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2398eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2399eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 24002b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 24012b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 24022b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 24032b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2404eaf62fffSJeremy L Thompson // -- Operator 24052b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 24062b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 24072b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 24082b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2409eaf62fffSJeremy L Thompson 2410eaf62fffSJeremy L Thompson // Cleanup 24112b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 24122b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 24132b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 24142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2415eaf62fffSJeremy L Thompson 2416eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2417eaf62fffSJeremy L Thompson } 2418eaf62fffSJeremy L Thompson 2419eaf62fffSJeremy L Thompson /// @} 2420