13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 8ed9e99e6SJeremy L Thompson #include <assert.h> 92b730f8bSJeremy L Thompson #include <ceed-impl.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 112b730f8bSJeremy L Thompson #include <ceed/ceed.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 449e77b9c8SJeremy L Thompson char *source_path_with_name = ""; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 119437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 123437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127805fe78eSJeremy L Thompson if (op_fallback->num_qpts == 0) { 1282b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 129805fe78eSJeremy L Thompson } 1309e77b9c8SJeremy L Thompson // Cleanup 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1332b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 134805fe78eSJeremy L Thompson } 1352b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1362b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 137805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 138eaf62fffSJeremy L Thompson 139eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 140eaf62fffSJeremy L Thompson } 141eaf62fffSJeremy L Thompson 142eaf62fffSJeremy L Thompson /** 143ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 144d04bbc78SJeremy L Thompson 145d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 146d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 147d04bbc78SJeremy L Thompson 148d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 149d04bbc78SJeremy L Thompson 150d04bbc78SJeremy L Thompson @ref Developer 151d04bbc78SJeremy L Thompson **/ 152d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 153d04bbc78SJeremy L Thompson // Create if needed 154d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1552b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 156d04bbc78SJeremy L Thompson } 157d04bbc78SJeremy L Thompson if (op->op_fallback) { 158d04bbc78SJeremy L Thompson bool is_debug; 159d04bbc78SJeremy L Thompson 1602b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 161d04bbc78SJeremy L Thompson if (is_debug) { 162b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 163d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 164d04bbc78SJeremy L Thompson 165b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 166b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 167b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1682b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 169d04bbc78SJeremy L Thompson 170b275c451SJeremy L Thompson CeedDebug256(ceed, 1, "---------- CeedOperator Fallback ----------\n"); 171b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1722b730f8bSJeremy L Thompson op->op_fallback); 173d04bbc78SJeremy L Thompson } 174d04bbc78SJeremy L Thompson } 175d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 176d04bbc78SJeremy L Thompson 177d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 178d04bbc78SJeremy L Thompson } 179d04bbc78SJeremy L Thompson 180d04bbc78SJeremy L Thompson /** 181eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 182eaf62fffSJeremy L Thompson 183eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 184eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 185eaf62fffSJeremy L Thompson @param[in] interp Pointer to interpolation matrix 186eaf62fffSJeremy L Thompson @param[in] grad Pointer to gradient matrix 187eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 188eaf62fffSJeremy L Thompson 189eaf62fffSJeremy L Thompson @ref Developer 190eaf62fffSJeremy L Thompson **/ 1912b730f8bSJeremy L Thompson static inline void CeedOperatorGetBasisPointer(CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar *interp, const CeedScalar *grad, 1922b730f8bSJeremy L Thompson const CeedScalar **basis_ptr) { 193eaf62fffSJeremy L Thompson switch (eval_mode) { 194eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 195eaf62fffSJeremy L Thompson *basis_ptr = identity; 196eaf62fffSJeremy L Thompson break; 197eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 198eaf62fffSJeremy L Thompson *basis_ptr = interp; 199eaf62fffSJeremy L Thompson break; 200eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 201eaf62fffSJeremy L Thompson *basis_ptr = grad; 202eaf62fffSJeremy L Thompson break; 203eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 204eaf62fffSJeremy L Thompson case CEED_EVAL_DIV: 205eaf62fffSJeremy L Thompson case CEED_EVAL_CURL: 206eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 207eaf62fffSJeremy L Thompson } 208ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 209eaf62fffSJeremy L Thompson } 210eaf62fffSJeremy L Thompson 211eaf62fffSJeremy L Thompson /** 212eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 213eaf62fffSJeremy L Thompson 214eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 215ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 216eaf62fffSJeremy L Thompson 217eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 218eaf62fffSJeremy L Thompson 219eaf62fffSJeremy L Thompson @ref Developer 220eaf62fffSJeremy L Thompson **/ 2212b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 222eaf62fffSJeremy L Thompson Ceed ceed; 2232b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 224eaf62fffSJeremy L Thompson const CeedInt *offsets; 2252b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 226eaf62fffSJeremy L Thompson 227eaf62fffSJeremy L Thompson // Expand offsets 2287b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2297b63f5c6SJed Brown CeedSize l_size; 2302b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2312b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2322b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2332b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 235eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2362b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2372b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 238eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 239eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 240eaf62fffSJeremy L Thompson } 241eaf62fffSJeremy L Thompson 242eaf62fffSJeremy L Thompson // Create new restriction 2432b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2442b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 245eaf62fffSJeremy L Thompson 246eaf62fffSJeremy L Thompson // Cleanup 2472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 248eaf62fffSJeremy L Thompson 249eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 250eaf62fffSJeremy L Thompson } 251eaf62fffSJeremy L Thompson 252eaf62fffSJeremy L Thompson /** 253eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 254eaf62fffSJeremy L Thompson 255eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 256ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 257eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 258eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 259eaf62fffSJeremy L Thompson 260eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 261eaf62fffSJeremy L Thompson 262eaf62fffSJeremy L Thompson @ref Developer 263eaf62fffSJeremy L Thompson **/ 2642b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 265eaf62fffSJeremy L Thompson Ceed ceed; 2662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 267eaf62fffSJeremy L Thompson 268eaf62fffSJeremy L Thompson // Assemble QFunction 269eaf62fffSJeremy L Thompson CeedQFunction qf; 270437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 271eaf62fffSJeremy L Thompson CeedVector assembled_qf; 272437c7c90SJeremy L Thompson CeedElemRestriction assembled_elem_rstr; 273437c7c90SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 274eaf62fffSJeremy L Thompson CeedInt layout[3]; 275437c7c90SJeremy L Thompson 276437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 277437c7c90SJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 278437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 279437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout)); 280437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 281437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 282eaf62fffSJeremy L Thompson 283ed9e99e6SJeremy L Thompson // Get assembly data 284ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 285437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 286437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 287437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 288437c7c90SJeremy L Thompson CeedBasis *active_bases; 289437c7c90SJeremy L Thompson CeedElemRestriction *active_elem_rstrs; 290eaf62fffSJeremy L Thompson 291437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 292437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 293437c7c90SJeremy L Thompson &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components)); 294437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL)); 295437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs)); 296437c7c90SJeremy L Thompson 297437c7c90SJeremy L Thompson // Loop over all active bases 298437c7c90SJeremy L Thompson for (CeedInt b = 0; b < num_active_bases; b++) { 299eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 300437c7c90SJeremy L Thompson CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b]; 301437c7c90SJeremy L Thompson 302eaf62fffSJeremy L Thompson if (is_pointblock) { 303437c7c90SJeremy L Thompson CeedElemRestriction point_block_elem_rstr; 304437c7c90SJeremy L Thompson 305437c7c90SJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr)); 306437c7c90SJeremy L Thompson diag_elem_rstr = point_block_elem_rstr; 307eaf62fffSJeremy L Thompson } 308eaf62fffSJeremy L Thompson 309eaf62fffSJeremy L Thompson // Create diagonal vector 310eaf62fffSJeremy L Thompson CeedVector elem_diag; 311437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 312eaf62fffSJeremy L Thompson 313eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3149c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 315437c7c90SJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts, num_components; 316437c7c90SJeremy L Thompson 3172b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3182b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 319437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 320437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes)); 321437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components)); 322437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts)); 323ed9e99e6SJeremy L Thompson 324eaf62fffSJeremy L Thompson // Basis matrices 325437c7c90SJeremy L Thompson const CeedScalar *interp, *grad; 326eaf62fffSJeremy L Thompson CeedScalar *identity = NULL; 327ed9e99e6SJeremy L Thompson bool has_eval_none = false; 328437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 329437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 330ed9e99e6SJeremy L Thompson } 331437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 332437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 333ed9e99e6SJeremy L Thompson } 334ed9e99e6SJeremy L Thompson if (has_eval_none) { 3352b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3362b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 337eaf62fffSJeremy L Thompson } 338437c7c90SJeremy L Thompson CeedCall(CeedBasisGetInterp(active_bases[b], &interp)); 339437c7c90SJeremy L Thompson CeedCall(CeedBasisGetGrad(active_bases[b], &grad)); 340eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 341eaf62fffSJeremy L Thompson // Each element 342eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 343eaf62fffSJeremy L Thompson CeedInt d_out = -1; 344eaf62fffSJeremy L Thompson // Each basis eval mode pair 345437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 346437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 347437c7c90SJeremy L Thompson if (eval_modes_out[b][e_out] == CEED_EVAL_GRAD) d_out += 1; 348437c7c90SJeremy L Thompson CeedOperatorGetBasisPointer(eval_modes_out[b][e_out], identity, interp, &grad[d_out * num_qpts * num_nodes], &B_t); 349eaf62fffSJeremy L Thompson CeedInt d_in = -1; 350437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 351437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 352437c7c90SJeremy L Thompson if (eval_modes_in[b][e_in] == CEED_EVAL_GRAD) d_in += 1; 353437c7c90SJeremy L Thompson CeedOperatorGetBasisPointer(eval_modes_in[b][e_in], identity, interp, &grad[d_in * num_qpts * num_nodes], &B); 354eaf62fffSJeremy L Thompson // Each component 355437c7c90SJeremy L Thompson for (CeedInt c_out = 0; c_out < num_components; c_out++) { 356437c7c90SJeremy L Thompson // Each qpt/node pair 3572b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 358eaf62fffSJeremy L Thompson if (is_pointblock) { 359eaf62fffSJeremy L Thompson // Point Block Diagonal 360437c7c90SJeremy L Thompson for (CeedInt c_in = 0; c_in < num_components; c_in++) { 361437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 362437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3632b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 364437c7c90SJeremy L Thompson elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] += 365437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 366eaf62fffSJeremy L Thompson } 3672b730f8bSJeremy L Thompson } 368eaf62fffSJeremy L Thompson } else { 369eaf62fffSJeremy L Thompson // Diagonal Only 370437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 371437c7c90SJeremy L Thompson const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]]; 3722b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 373437c7c90SJeremy L Thompson elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 374eaf62fffSJeremy L Thompson } 375eaf62fffSJeremy L Thompson } 376eaf62fffSJeremy L Thompson } 377eaf62fffSJeremy L Thompson } 3782b730f8bSJeremy L Thompson } 3792b730f8bSJeremy L Thompson } 3802b730f8bSJeremy L Thompson } 3812b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 382eaf62fffSJeremy L Thompson 383eaf62fffSJeremy L Thompson // Assemble local operator diagonal 384437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 385eaf62fffSJeremy L Thompson 386eaf62fffSJeremy L Thompson // Cleanup 387437c7c90SJeremy L Thompson if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 3882b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 3892b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 390437c7c90SJeremy L Thompson } 391437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 392437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 393eaf62fffSJeremy L Thompson 394eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 395eaf62fffSJeremy L Thompson } 396eaf62fffSJeremy L Thompson 397eaf62fffSJeremy L Thompson /** 398eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 399eaf62fffSJeremy L Thompson 400eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 401ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 402eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 403eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 404eaf62fffSJeremy L Thompson 405eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 406eaf62fffSJeremy L Thompson 407eaf62fffSJeremy L Thompson @ref Developer 408eaf62fffSJeremy L Thompson **/ 4092b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 410eaf62fffSJeremy L Thompson CeedVector assembled) { 411eaf62fffSJeremy L Thompson CeedInt num_sub; 412eaf62fffSJeremy L Thompson CeedOperator *suboperators; 413c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 414c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 415eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4166aa95790SJeremy L Thompson if (is_pointblock) { 4172b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4186aa95790SJeremy L Thompson } else { 4192b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4206aa95790SJeremy L Thompson } 421eaf62fffSJeremy L Thompson } 422eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 423eaf62fffSJeremy L Thompson } 424eaf62fffSJeremy L Thompson 425eaf62fffSJeremy L Thompson /** 426eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 427eaf62fffSJeremy L Thompson 428eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 429eaf62fffSJeremy L Thompson 430eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 431eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 432eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 433eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 434eaf62fffSJeremy L Thompson 435eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 436eaf62fffSJeremy L Thompson 437eaf62fffSJeremy L Thompson @ref Developer 438eaf62fffSJeremy L Thompson **/ 4392b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 440f3d47e36SJeremy L Thompson Ceed ceed; 441f3d47e36SJeremy L Thompson bool is_composite; 442f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 443f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 444f3d47e36SJeremy L Thompson 445b275c451SJeremy L Thompson if (is_composite) { 446eaf62fffSJeremy L Thompson // LCOV_EXCL_START 4472b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 448eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 4492b730f8bSJeremy L Thompson } 450eaf62fffSJeremy L Thompson 451c9366a6bSJeremy L Thompson CeedSize num_nodes; 4522b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 453eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4542b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 455e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4562b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4572b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4582b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 459eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4602b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 461eaf62fffSJeremy L Thompson 462eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 463eaf62fffSJeremy L Thompson 464eaf62fffSJeremy L Thompson // Determine elem_dof relation 465eaf62fffSJeremy L Thompson CeedVector index_vec; 4662b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 467eaf62fffSJeremy L Thompson CeedScalar *array; 4682b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 469ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4702b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 471eaf62fffSJeremy L Thompson CeedVector elem_dof; 4722b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4732b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4742b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 475eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4762b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4772b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 478eaf62fffSJeremy L Thompson 479eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 480eaf62fffSJeremy L Thompson CeedInt count = 0; 481ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 482ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 483ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 484ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 485ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 4862b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 4872b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 488eaf62fffSJeremy L Thompson 489eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 490eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 491eaf62fffSJeremy L Thompson 492eaf62fffSJeremy L Thompson rows[offset + count] = row; 493eaf62fffSJeremy L Thompson cols[offset + count] = col; 494eaf62fffSJeremy L Thompson count++; 495eaf62fffSJeremy L Thompson } 496eaf62fffSJeremy L Thompson } 497eaf62fffSJeremy L Thompson } 498eaf62fffSJeremy L Thompson } 499eaf62fffSJeremy L Thompson } 5002b730f8bSJeremy L Thompson if (count != local_num_entries) { 501eaf62fffSJeremy L Thompson // LCOV_EXCL_START 502eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 503eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5042b730f8bSJeremy L Thompson } 5052b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5062b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 507eaf62fffSJeremy L Thompson 508eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 509eaf62fffSJeremy L Thompson } 510eaf62fffSJeremy L Thompson 511eaf62fffSJeremy L Thompson /** 512eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 513eaf62fffSJeremy L Thompson 514eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 515eaf62fffSJeremy L Thompson 516eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 517ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 518eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 519eaf62fffSJeremy L Thompson 520eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 521eaf62fffSJeremy L Thompson 522eaf62fffSJeremy L Thompson @ref Developer 523eaf62fffSJeremy L Thompson **/ 5242b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 525f3d47e36SJeremy L Thompson Ceed ceed; 526f3d47e36SJeremy L Thompson bool is_composite; 527f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 528f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 529f3d47e36SJeremy L Thompson 530f3d47e36SJeremy L Thompson if (is_composite) { 531eaf62fffSJeremy L Thompson // LCOV_EXCL_START 5322b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 533eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5342b730f8bSJeremy L Thompson } 535f3d47e36SJeremy L Thompson 536f3d47e36SJeremy L Thompson // Early exit for empty operator 537f3d47e36SJeremy L Thompson { 538f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 539f3d47e36SJeremy L Thompson 540f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 541f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 542f3d47e36SJeremy L Thompson } 543eaf62fffSJeremy L Thompson 544cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 545cefa2673SJeremy L Thompson // Backend version 5462b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 547cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 548cefa2673SJeremy L Thompson } else { 549cefa2673SJeremy L Thompson // Operator fallback 550cefa2673SJeremy L Thompson CeedOperator op_fallback; 551cefa2673SJeremy L Thompson 5522b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 553cefa2673SJeremy L Thompson if (op_fallback) { 5542b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 555cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 556cefa2673SJeremy L Thompson } 557cefa2673SJeremy L Thompson } 558cefa2673SJeremy L Thompson 559eaf62fffSJeremy L Thompson // Assemble QFunction 560eaf62fffSJeremy L Thompson CeedQFunction qf; 5612b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 562eaf62fffSJeremy L Thompson CeedVector assembled_qf; 563eaf62fffSJeremy L Thompson CeedElemRestriction rstr_q; 5642b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5651f9221feSJeremy L Thompson CeedSize qf_length; 5662b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 567eaf62fffSJeremy L Thompson 5687e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 569eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 570eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5712b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 572eaf62fffSJeremy L Thompson 573ed9e99e6SJeremy L Thompson // Get assembly data 574ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5752b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 576437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 577437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases; 578437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out, 579437c7c90SJeremy L Thompson &eval_modes_out, NULL, NULL)); 580437c7c90SJeremy L Thompson CeedBasis *bases; 581437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL)); 582437c7c90SJeremy L Thompson CeedBasis basis_in = bases[0]; 583eaf62fffSJeremy L Thompson 584437c7c90SJeremy L Thompson if (num_active_bases > 1) { 585437c7c90SJeremy L Thompson // LCOV_EXCL_START 586437c7c90SJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases"); 587437c7c90SJeremy L Thompson // LCOV_EXCL_STOP 588437c7c90SJeremy L Thompson } 589437c7c90SJeremy L Thompson if (num_eval_modes_in[0] == 0 || num_eval_modes_out[0] == 0) { 590eaf62fffSJeremy L Thompson // LCOV_EXCL_START 5912b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 592eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5932b730f8bSJeremy L Thompson } 594eaf62fffSJeremy L Thompson 595ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 596eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5972b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5982b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5992b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 6002b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 6012b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 602eaf62fffSJeremy L Thompson 603eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 604eaf62fffSJeremy L Thompson 605eaf62fffSJeremy L Thompson // loop over elements and put in data structure 606eaf62fffSJeremy L Thompson const CeedScalar *interp_in, *grad_in; 6072b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(basis_in, &interp_in)); 6082b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(basis_in, &grad_in)); 609eaf62fffSJeremy L Thompson 610eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6112b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 612eaf62fffSJeremy L Thompson 613eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6142b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6152b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 616eaf62fffSJeremy L Thompson 617eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 618437c7c90SJeremy L Thompson const CeedScalar **B_mats_in, **B_mats_out; 619437c7c90SJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out)); 620437c7c90SJeremy L Thompson const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0]; 621437c7c90SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]]; 622eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 62392ae7e47SJeremy L Thompson CeedInt count = 0; 624eaf62fffSJeremy L Thompson CeedScalar *vals; 6252b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(values, CEED_MEM_HOST, &vals)); 626ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 627ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 628ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 629ed9e99e6SJeremy L Thompson // Compute B^T*D 630ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 631ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 632437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 633437c7c90SJeremy L Thompson const CeedInt btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in); 634067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 635437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 636437c7c90SJeremy L Thompson const CeedInt b_out_index = (num_eval_modes_out[0] * q + e_out) * elem_size + n; 637437c7c90SJeremy L Thompson const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out; 6382b730f8bSJeremy L Thompson const CeedInt qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 639067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 640eaf62fffSJeremy L Thompson } 641067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 642ed9e99e6SJeremy L Thompson } 643ed9e99e6SJeremy L Thompson } 644eaf62fffSJeremy L Thompson } 645eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 646437c7c90SJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0])); 647eaf62fffSJeremy L Thompson 648eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 649ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 650ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 651eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 652eaf62fffSJeremy L Thompson count++; 653eaf62fffSJeremy L Thompson } 654eaf62fffSJeremy L Thompson } 655eaf62fffSJeremy L Thompson } 656eaf62fffSJeremy L Thompson } 657eaf62fffSJeremy L Thompson } 6582b730f8bSJeremy L Thompson if (count != local_num_entries) { 659eaf62fffSJeremy L Thompson // LCOV_EXCL_START 660eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing entries"); 661eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 6622b730f8bSJeremy L Thompson } 6632b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 664eaf62fffSJeremy L Thompson 6652b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6662b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 667eaf62fffSJeremy L Thompson 668eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 669eaf62fffSJeremy L Thompson } 670eaf62fffSJeremy L Thompson 671eaf62fffSJeremy L Thompson /** 672eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 673eaf62fffSJeremy L Thompson 674eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 675eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 676eaf62fffSJeremy L Thompson 677eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 678eaf62fffSJeremy L Thompson 679eaf62fffSJeremy L Thompson @ref Utility 680eaf62fffSJeremy L Thompson **/ 6812b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) { 682b275c451SJeremy L Thompson bool is_composite; 683eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 684eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 685eaf62fffSJeremy L Thompson 686b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 687b275c451SJeremy L Thompson if (is_composite) { 688eaf62fffSJeremy L Thompson // LCOV_EXCL_START 6892b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 690eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 6912b730f8bSJeremy L Thompson } 6922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6932b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6942b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6952b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 696eaf62fffSJeremy L Thompson *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 697eaf62fffSJeremy L Thompson 698eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 699eaf62fffSJeremy L Thompson } 700eaf62fffSJeremy L Thompson 701eaf62fffSJeremy L Thompson /** 702ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 703eaf62fffSJeremy L Thompson 704eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 705eaf62fffSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter 706eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 707eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 708eaf62fffSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation 709eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 710eaf62fffSJeremy L Thompson @param[out] op_prolong Coarse to fine operator 711eaf62fffSJeremy L Thompson @param[out] op_restrict Fine to coarse operator 712eaf62fffSJeremy L Thompson 713eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 714eaf62fffSJeremy L Thompson 715eaf62fffSJeremy L Thompson @ref Developer 716eaf62fffSJeremy L Thompson **/ 7172b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7182b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 719eaf62fffSJeremy L Thompson Ceed ceed; 7202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 721eaf62fffSJeremy L Thompson 722eaf62fffSJeremy L Thompson // Check for composite operator 723eaf62fffSJeremy L Thompson bool is_composite; 7242b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 7252b730f8bSJeremy L Thompson if (is_composite) { 726eaf62fffSJeremy L Thompson // LCOV_EXCL_START 7272b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 728eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 7292b730f8bSJeremy L Thompson } 730eaf62fffSJeremy L Thompson 731eaf62fffSJeremy L Thompson // Coarse Grid 7322b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 733eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 734eaf62fffSJeremy L Thompson // -- Clone input fields 73592ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 736eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 737437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 7382b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 739eaf62fffSJeremy L Thompson } else { 740437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 7412b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 742eaf62fffSJeremy L Thompson } 743eaf62fffSJeremy L Thompson } 744eaf62fffSJeremy L Thompson // -- Clone output fields 74592ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 746eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7472b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 748eaf62fffSJeremy L Thompson } else { 749437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 7502b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 751eaf62fffSJeremy L Thompson } 752eaf62fffSJeremy L Thompson } 753af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7542b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 755eaf62fffSJeremy L Thompson 756eaf62fffSJeremy L Thompson // Multiplicity vector 757eaf62fffSJeremy L Thompson CeedVector mult_vec, mult_e_vec; 7582b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7592b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 7602b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7612b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 7622b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7632b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7642b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 765eaf62fffSJeremy L Thompson 766eaf62fffSJeremy L Thompson // Restriction 767eaf62fffSJeremy L Thompson CeedInt num_comp; 7682b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 769eaf62fffSJeremy L Thompson CeedQFunction qf_restrict; 7702b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 771eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 7722b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 773eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 774eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_r; 7752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7762b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7782b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7802b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7822b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 783eaf62fffSJeremy L Thompson 7842b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7852b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 7862b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 7872b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 788eaf62fffSJeremy L Thompson 789eaf62fffSJeremy L Thompson // Prolongation 790eaf62fffSJeremy L Thompson CeedQFunction qf_prolong; 7912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 792eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 7932b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 794eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 795eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_p; 7962b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 7972b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 7982b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 7992b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8002b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8012b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8022b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8032b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 804eaf62fffSJeremy L Thompson 8052b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8062b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 8072b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8082b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 809eaf62fffSJeremy L Thompson 810ea6b5821SJeremy L Thompson // Clone name 811ea6b5821SJeremy L Thompson bool has_name = op_fine->name; 812ea6b5821SJeremy L Thompson size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 8132b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 814ea6b5821SJeremy L Thompson { 815ea6b5821SJeremy L Thompson char *prolongation_name; 8162b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8172b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8182b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8192b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 820ea6b5821SJeremy L Thompson } 821ea6b5821SJeremy L Thompson { 822ea6b5821SJeremy L Thompson char *restriction_name; 8232b730f8bSJeremy L Thompson CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 8242b730f8bSJeremy L Thompson sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8252b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 8262b730f8bSJeremy L Thompson CeedCall(CeedFree(&restriction_name)); 827ea6b5821SJeremy L Thompson } 828ea6b5821SJeremy L Thompson 82958e4b056SJeremy L Thompson // Check 83058e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 83158e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_prolong)); 83258e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_restrict)); 83358e4b056SJeremy L Thompson 834eaf62fffSJeremy L Thompson // Cleanup 8352b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 8362b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 8372b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_restrict)); 8382b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_prolong)); 839805fe78eSJeremy L Thompson 840eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 841eaf62fffSJeremy L Thompson } 842eaf62fffSJeremy L Thompson 843eaf62fffSJeremy L Thompson /** 844eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 845eaf62fffSJeremy L Thompson 846eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 847eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 848eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 849eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 850eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 851eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 852eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 853eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 854eaf62fffSJeremy L Thompson 855eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 856eaf62fffSJeremy L Thompson 857eaf62fffSJeremy L Thompson @ref Developer 858eaf62fffSJeremy L Thompson **/ 8592b730f8bSJeremy L Thompson CeedPragmaOptimizeOff static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, 8602b730f8bSJeremy L Thompson CeedInt P_1d, CeedInt Q_1d, CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8612b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 862eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 863eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8642b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 865eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 866eaf62fffSJeremy L Thompson } 8672b730f8bSJeremy L Thompson } 868eaf62fffSJeremy L Thompson // -- Laplacian 8692b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 870eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 871eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8722b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 873eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 874eaf62fffSJeremy L Thompson } 8752b730f8bSJeremy L Thompson } 876eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8772b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 878eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 879eaf62fffSJeremy L Thompson } 880ea61e9acSJeremy L Thompson CeedPragmaOptimizeOn; 881eaf62fffSJeremy L Thompson 882eaf62fffSJeremy L Thompson /// @} 883eaf62fffSJeremy L Thompson 884eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 885480fae85SJeremy L Thompson /// CeedOperator Backend API 886480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 887480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 888480fae85SJeremy L Thompson /// @{ 889480fae85SJeremy L Thompson 890480fae85SJeremy L Thompson /** 891480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 892480fae85SJeremy L Thompson 893480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 894ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 895480fae85SJeremy L Thompson 896480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 897480fae85SJeremy L Thompson 898480fae85SJeremy L Thompson @ref Backend 899480fae85SJeremy L Thompson **/ 900ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9012b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 902480fae85SJeremy L Thompson (*data)->ref_count = 1; 903480fae85SJeremy L Thompson (*data)->ceed = ceed; 9042b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 905480fae85SJeremy L Thompson 906480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 907480fae85SJeremy L Thompson } 908480fae85SJeremy L Thompson 909480fae85SJeremy L Thompson /** 910480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 911480fae85SJeremy L Thompson 912ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 913480fae85SJeremy L Thompson 914480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 915480fae85SJeremy L Thompson 916480fae85SJeremy L Thompson @ref Backend 917480fae85SJeremy L Thompson **/ 918480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 919480fae85SJeremy L Thompson data->ref_count++; 920480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 921480fae85SJeremy L Thompson } 922480fae85SJeremy L Thompson 923480fae85SJeremy L Thompson /** 924beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9258b919e6bSJeremy L Thompson 926ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 927ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9288b919e6bSJeremy L Thompson 9298b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9308b919e6bSJeremy L Thompson 9318b919e6bSJeremy L Thompson @ref Backend 9328b919e6bSJeremy L Thompson **/ 9332b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 934beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 935beecbf24SJeremy L Thompson data->needs_data_update = true; 936beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 937beecbf24SJeremy L Thompson } 938beecbf24SJeremy L Thompson 939beecbf24SJeremy L Thompson /** 940beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 941beecbf24SJeremy L Thompson 942ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 943ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 944beecbf24SJeremy L Thompson 945beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 946beecbf24SJeremy L Thompson 947beecbf24SJeremy L Thompson @ref Backend 948beecbf24SJeremy L Thompson **/ 9492b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 950beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9518b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9528b919e6bSJeremy L Thompson } 9538b919e6bSJeremy L Thompson 9548b919e6bSJeremy L Thompson /** 9558b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9568b919e6bSJeremy L Thompson 9578b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9588b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9598b919e6bSJeremy L Thompson 9608b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9618b919e6bSJeremy L Thompson 9628b919e6bSJeremy L Thompson @ref Backend 9638b919e6bSJeremy L Thompson **/ 9642b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 965beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9668b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9678b919e6bSJeremy L Thompson } 9688b919e6bSJeremy L Thompson 9698b919e6bSJeremy L Thompson /** 970ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 971ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 972ea61e9acSJeremy L Thompson Note: If `*data_copy` is non-NULL, then it is assumed that `*data_copy` is a pointer to a CeedQFunctionAssemblyData. 973ea61e9acSJeremy L Thompson This CeedQFunctionAssemblyData will be destroyed if `*data_copy` is the only reference to this CeedQFunctionAssemblyData. 974480fae85SJeremy L Thompson 975ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 976ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 977480fae85SJeremy L Thompson 978480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 979480fae85SJeremy L Thompson 980480fae85SJeremy L Thompson @ref Backend 981480fae85SJeremy L Thompson **/ 9822b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 9832b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 9842b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 985480fae85SJeremy L Thompson *data_copy = data; 986480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 987480fae85SJeremy L Thompson } 988480fae85SJeremy L Thompson 989480fae85SJeremy L Thompson /** 990480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 991480fae85SJeremy L Thompson 992ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 993480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 994480fae85SJeremy L Thompson 995480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 996480fae85SJeremy L Thompson 997480fae85SJeremy L Thompson @ref Backend 998480fae85SJeremy L Thompson **/ 9992b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1000480fae85SJeremy L Thompson *is_setup = data->is_setup; 1001480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1002480fae85SJeremy L Thompson } 1003480fae85SJeremy L Thompson 1004480fae85SJeremy L Thompson /** 1005480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1006480fae85SJeremy L Thompson 1007ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1008480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1009480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1010480fae85SJeremy L Thompson 1011480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1012480fae85SJeremy L Thompson 1013480fae85SJeremy L Thompson @ref Backend 1014480fae85SJeremy L Thompson **/ 10152b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10162b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10172b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1018480fae85SJeremy L Thompson 1019480fae85SJeremy L Thompson data->is_setup = true; 1020480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1021480fae85SJeremy L Thompson } 1022480fae85SJeremy L Thompson 10232b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 10242b730f8bSJeremy L Thompson if (!data->is_setup) { 1025480fae85SJeremy L Thompson // LCOV_EXCL_START 10262b730f8bSJeremy L Thompson return CeedError(data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1027480fae85SJeremy L Thompson // LCOV_EXCL_STOP 10282b730f8bSJeremy L Thompson } 1029480fae85SJeremy L Thompson 10302b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10312b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1032480fae85SJeremy L Thompson 1033480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1034480fae85SJeremy L Thompson } 1035480fae85SJeremy L Thompson 1036480fae85SJeremy L Thompson /** 1037480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1038480fae85SJeremy L Thompson 1039ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1040480fae85SJeremy L Thompson 1041480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1042480fae85SJeremy L Thompson 1043480fae85SJeremy L Thompson @ref Backend 1044480fae85SJeremy L Thompson **/ 1045480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1046480fae85SJeremy L Thompson if (!*data || --(*data)->ref_count > 0) return CEED_ERROR_SUCCESS; 1047480fae85SJeremy L Thompson 10482b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10492b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10502b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1051480fae85SJeremy L Thompson 10522b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1053480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1054480fae85SJeremy L Thompson } 1055480fae85SJeremy L Thompson 1056ed9e99e6SJeremy L Thompson /** 1057ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1058ed9e99e6SJeremy L Thompson 1059ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1060ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1061ed9e99e6SJeremy L Thompson 1062ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1063ed9e99e6SJeremy L Thompson 1064ed9e99e6SJeremy L Thompson @ref Backend 1065ed9e99e6SJeremy L Thompson **/ 10662b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1067ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1068ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1069ed9e99e6SJeremy L Thompson 10702b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1071ed9e99e6SJeremy L Thompson op->op_assembled = data; 1072ed9e99e6SJeremy L Thompson } 1073ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1074ed9e99e6SJeremy L Thompson 1075ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1076ed9e99e6SJeremy L Thompson } 1077ed9e99e6SJeremy L Thompson 1078ed9e99e6SJeremy L Thompson /** 1079*ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1080*ba746a46SJeremy L Thompson 1081*ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1082*ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1083*ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1084*ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1085*ba746a46SJeremy L Thompson CeedEvalMode. 1086*ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1087*ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1088ed9e99e6SJeremy L Thompson 1089ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1090ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1091ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1092ed9e99e6SJeremy L Thompson 1093ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1094ed9e99e6SJeremy L Thompson 1095ed9e99e6SJeremy L Thompson @ref Backend 1096ed9e99e6SJeremy L Thompson **/ 10972b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1098437c7c90SJeremy L Thompson CeedInt num_active_bases = 0; 1099437c7c90SJeremy L Thompson 1100437c7c90SJeremy L Thompson // Allocate 11012b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1102ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11032b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1104ed9e99e6SJeremy L Thompson 1105ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1106ed9e99e6SJeremy L Thompson CeedQFunction qf; 1107ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1108ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1109ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11102b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11112b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11122b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1113ed9e99e6SJeremy L Thompson 1114ed9e99e6SJeremy L Thompson // Determine active input basis 1115437c7c90SJeremy L Thompson CeedInt *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0; 1116437c7c90SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 1117437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 1118437c7c90SJeremy L Thompson 1119ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1120ed9e99e6SJeremy L Thompson CeedVector vec; 1121437c7c90SJeremy L Thompson 11222b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1123ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1124437c7c90SJeremy L Thompson CeedInt index = -1, dim = 1, num_components; 1125437c7c90SJeremy L Thompson CeedBasis basis_in = NULL; 1126437c7c90SJeremy L Thompson CeedEvalMode eval_mode; 1127437c7c90SJeremy L Thompson 11282b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11292b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1130437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_in, &num_components)); 11312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1132437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1133437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_in) index = i; 1134437c7c90SJeremy L Thompson } 1135437c7c90SJeremy L Thompson if (index == -1) { 1136437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 1137437c7c90SJeremy L Thompson 1138437c7c90SJeremy L Thompson index = num_active_bases; 1139437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1140437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1141437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases])); 1142437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1143437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1144437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1145437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases])); 1146437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1147437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1148437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1149437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1150437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1151437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1152437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1153437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1154437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1155437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1156437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1157437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1158437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1159437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1160437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1161437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1162437c7c90SJeremy L Thompson num_active_bases++; 1163437c7c90SJeremy L Thompson } 1164ed9e99e6SJeremy L Thompson switch (eval_mode) { 1165ed9e99e6SJeremy L Thompson case CEED_EVAL_NONE: 1166ed9e99e6SJeremy L Thompson case CEED_EVAL_INTERP: 1167437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_in[index] + 1, &eval_modes_in[index])); 1168437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_in[index] + 1, &eval_mode_offsets_in[index])); 1169437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index]] = eval_mode; 1170437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index]] = offset; 1171437c7c90SJeremy L Thompson offset += num_components; 1172437c7c90SJeremy L Thompson num_eval_modes_in[index] += 1; 1173ed9e99e6SJeremy L Thompson break; 1174ed9e99e6SJeremy L Thompson case CEED_EVAL_GRAD: 1175437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_in[index] + dim, &eval_modes_in[index])); 1176437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_in[index] + dim, &eval_mode_offsets_in[index])); 1177ed9e99e6SJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 1178437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1179437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1180437c7c90SJeremy L Thompson offset += num_components; 1181ed9e99e6SJeremy L Thompson } 1182437c7c90SJeremy L Thompson num_eval_modes_in[index] += dim; 1183ed9e99e6SJeremy L Thompson break; 1184ed9e99e6SJeremy L Thompson case CEED_EVAL_WEIGHT: 1185ed9e99e6SJeremy L Thompson case CEED_EVAL_DIV: 1186ed9e99e6SJeremy L Thompson case CEED_EVAL_CURL: 1187ed9e99e6SJeremy L Thompson break; // Caught by QF Assembly 1188ed9e99e6SJeremy L Thompson } 1189ed9e99e6SJeremy L Thompson } 1190ed9e99e6SJeremy L Thompson } 1191437c7c90SJeremy L Thompson (*data)->num_eval_modes_in = num_eval_modes_in; 1192437c7c90SJeremy L Thompson (*data)->eval_modes_in = eval_modes_in; 1193437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1194ed9e99e6SJeremy L Thompson 1195ed9e99e6SJeremy L Thompson // Determine active output basis 1196ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 1197437c7c90SJeremy L Thompson 11982b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11992b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1200437c7c90SJeremy L Thompson offset = 0; 1201ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1202ed9e99e6SJeremy L Thompson CeedVector vec; 1203437c7c90SJeremy L Thompson 12042b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1205ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 1206437c7c90SJeremy L Thompson CeedInt index = -1, dim = 1, num_components; 1207437c7c90SJeremy L Thompson CeedBasis basis_out = NULL; 1208ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 1209437c7c90SJeremy L Thompson 1210437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 1211437c7c90SJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_out, &dim)); 1212437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_out, &num_components)); 12132b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1214437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_active_bases; i++) { 1215437c7c90SJeremy L Thompson if ((*data)->active_bases[i] == basis_out) index = i; 1216437c7c90SJeremy L Thompson } 1217437c7c90SJeremy L Thompson if (index == -1) { 1218437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 1219437c7c90SJeremy L Thompson 1220437c7c90SJeremy L Thompson index = num_active_bases; 1221437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases)); 1222437c7c90SJeremy L Thompson (*data)->active_bases[num_active_bases] = NULL; 1223437c7c90SJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases])); 1224437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs)); 1225437c7c90SJeremy L Thompson (*data)->active_elem_rstrs[num_active_bases] = NULL; 1226437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1227437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases])); 1228437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in)); 1229437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out)); 1230437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1231437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1232437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in)); 1233437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out)); 1234437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1235437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1236437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in)); 1237437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out)); 1238437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1239437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1240437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in)); 1241437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out)); 1242437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1243437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1244437c7c90SJeremy L Thompson num_active_bases++; 1245437c7c90SJeremy L Thompson } 1246ed9e99e6SJeremy L Thompson switch (eval_mode) { 1247ed9e99e6SJeremy L Thompson case CEED_EVAL_NONE: 1248ed9e99e6SJeremy L Thompson case CEED_EVAL_INTERP: 1249437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_out[index] + 1, &eval_modes_out[index])); 1250437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_out[index] + 1, &eval_mode_offsets_out[index])); 1251437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index]] = eval_mode; 1252437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index]] = offset; 1253437c7c90SJeremy L Thompson offset += num_components; 1254437c7c90SJeremy L Thompson num_eval_modes_out[index] += 1; 1255ed9e99e6SJeremy L Thompson break; 1256ed9e99e6SJeremy L Thompson case CEED_EVAL_GRAD: 1257437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_out[index] + dim, &eval_modes_out[index])); 1258437c7c90SJeremy L Thompson CeedCall(CeedRealloc(num_eval_modes_out[index] + dim, &eval_mode_offsets_out[index])); 1259ed9e99e6SJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 1260437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1261437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1262437c7c90SJeremy L Thompson offset += num_components; 1263ed9e99e6SJeremy L Thompson } 1264437c7c90SJeremy L Thompson num_eval_modes_out[index] += dim; 1265ed9e99e6SJeremy L Thompson break; 1266ed9e99e6SJeremy L Thompson case CEED_EVAL_WEIGHT: 1267ed9e99e6SJeremy L Thompson case CEED_EVAL_DIV: 1268ed9e99e6SJeremy L Thompson case CEED_EVAL_CURL: 1269ed9e99e6SJeremy L Thompson break; // Caught by QF Assembly 1270ed9e99e6SJeremy L Thompson } 1271ed9e99e6SJeremy L Thompson } 1272ed9e99e6SJeremy L Thompson } 1273437c7c90SJeremy L Thompson (*data)->num_output_components = offset; 1274437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1275437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1276437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1277437c7c90SJeremy L Thompson (*data)->num_active_bases = num_active_bases; 1278ed9e99e6SJeremy L Thompson 1279ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1280ed9e99e6SJeremy L Thompson } 1281ed9e99e6SJeremy L Thompson 1282ed9e99e6SJeremy L Thompson /** 1283*ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1284*ba746a46SJeremy L Thompson 1285*ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1286ed9e99e6SJeremy L Thompson 1287ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1288*ba746a46SJeremy L Thompson @param[out] num_active_bases Total number of active bases 1289*ba746a46SJeremy L Thompson @param[out] num_eval_mode_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1290*ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1291*ba746a46SJeremy L Thompson @param[out] eval_mode_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1292*ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1293437c7c90SJeremy L Thompson @param[out] num_eval_mode_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1294*ba746a46SJeremy L Thompson @param[out] eval_mode_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1295437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1296*ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1297*ba746a46SJeremy L Thompson including contributions of all active bases 1298ed9e99e6SJeremy L Thompson 1299ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1300ed9e99e6SJeremy L Thompson 1301ed9e99e6SJeremy L Thompson @ref Backend 1302ed9e99e6SJeremy L Thompson **/ 1303437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in, 1304437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out, 1305437c7c90SJeremy L Thompson const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) { 1306437c7c90SJeremy L Thompson if (num_active_bases) *num_active_bases = data->num_active_bases; 1307437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1308437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1309437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1310437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1311437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1312437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1313437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1314ed9e99e6SJeremy L Thompson 1315ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1316ed9e99e6SJeremy L Thompson } 1317ed9e99e6SJeremy L Thompson 1318ed9e99e6SJeremy L Thompson /** 1319*ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1320*ba746a46SJeremy L Thompson 1321*ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1322ed9e99e6SJeremy L Thompson 1323ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1324437c7c90SJeremy L Thompson @param[out] num_active_bases Number of active bases, or NULL 1325437c7c90SJeremy L Thompson @param[out] active_bases Pointer to hold active CeedBasis, or NULL 1326437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1327437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1328ed9e99e6SJeremy L Thompson 1329ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1330ed9e99e6SJeremy L Thompson 1331ed9e99e6SJeremy L Thompson @ref Backend 1332ed9e99e6SJeremy L Thompson **/ 1333437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases, 1334437c7c90SJeremy L Thompson const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) { 1335ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1336437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1337437c7c90SJeremy L Thompson CeedInt num_qpts; 1338437c7c90SJeremy L Thompson 1339437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1340437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1341437c7c90SJeremy L Thompson CeedInt elem_size; 1342437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1343ed9e99e6SJeremy L Thompson const CeedScalar *interp_in, *grad_in; 1344ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1345ed9e99e6SJeremy L Thompson 1346437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &elem_size)); 1347437c7c90SJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_modes_in[b], &B_in)); 1348ed9e99e6SJeremy L Thompson 1349437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1350437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1351ed9e99e6SJeremy L Thompson } 1352ed9e99e6SJeremy L Thompson if (has_eval_none) { 13532b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size, &identity)); 1354ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) { 1355ed9e99e6SJeremy L Thompson identity[i * elem_size + i] = 1.0; 1356ed9e99e6SJeremy L Thompson } 1357ed9e99e6SJeremy L Thompson } 1358437c7c90SJeremy L Thompson CeedCall(CeedBasisGetInterp(data->active_bases[b], &interp_in)); 1359437c7c90SJeremy L Thompson CeedCall(CeedBasisGetGrad(data->active_bases[b], &grad_in)); 1360ed9e99e6SJeremy L Thompson 1361ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1362ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 1363ed9e99e6SJeremy L Thompson CeedInt d_in = -1; 1364437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1365437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1366437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1367ed9e99e6SJeremy L Thompson 1368437c7c90SJeremy L Thompson if (data->eval_modes_in[b][e_in] == CEED_EVAL_GRAD) d_in++; 1369437c7c90SJeremy L Thompson CeedOperatorGetBasisPointer(data->eval_modes_in[b][e_in], identity, interp_in, &grad_in[d_in * num_qpts * elem_size], &B); 1370437c7c90SJeremy L Thompson B_in[(qq + e_in) * elem_size + n] = B[q * elem_size + n]; 1371ed9e99e6SJeremy L Thompson } 1372ed9e99e6SJeremy L Thompson } 1373ed9e99e6SJeremy L Thompson } 1374437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1375437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1376437c7c90SJeremy L Thompson } 1377ed9e99e6SJeremy L Thompson } 1378ed9e99e6SJeremy L Thompson 1379437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1380437c7c90SJeremy L Thompson CeedInt num_qpts; 1381437c7c90SJeremy L Thompson 1382437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts)); 1383437c7c90SJeremy L Thompson for (CeedInt b = 0; b < data->num_active_bases; b++) { 1384437c7c90SJeremy L Thompson CeedInt elem_size; 1385ed9e99e6SJeremy L Thompson const CeedScalar *interp_out, *grad_out; 1386ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1387437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1388ed9e99e6SJeremy L Thompson 1389437c7c90SJeremy L Thompson CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &elem_size)); 1390437c7c90SJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_modes_out[b], &B_out)); 1391ed9e99e6SJeremy L Thompson 1392437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1393437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1394ed9e99e6SJeremy L Thompson } 1395ed9e99e6SJeremy L Thompson if (has_eval_none) { 13962b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size, &identity)); 1397ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) { 1398ed9e99e6SJeremy L Thompson identity[i * elem_size + i] = 1.0; 1399ed9e99e6SJeremy L Thompson } 1400ed9e99e6SJeremy L Thompson } 1401437c7c90SJeremy L Thompson CeedCall(CeedBasisGetInterp(data->active_bases[b], &interp_out)); 1402437c7c90SJeremy L Thompson CeedCall(CeedBasisGetGrad(data->active_bases[b], &grad_out)); 1403ed9e99e6SJeremy L Thompson 1404ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1405ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 1406ed9e99e6SJeremy L Thompson CeedInt d_out = -1; 1407437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1408437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1409437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 1410ed9e99e6SJeremy L Thompson 1411437c7c90SJeremy L Thompson if (data->eval_modes_out[b][e_out] == CEED_EVAL_GRAD) d_out++; 1412437c7c90SJeremy L Thompson CeedOperatorGetBasisPointer(data->eval_modes_out[b][e_out], identity, interp_out, &grad_out[d_out * num_qpts * elem_size], &B); 1413437c7c90SJeremy L Thompson B_out[(qq + e_out) * elem_size + n] = B[q * elem_size + n]; 1414ed9e99e6SJeremy L Thompson } 1415ed9e99e6SJeremy L Thompson } 1416ed9e99e6SJeremy L Thompson } 1417437c7c90SJeremy L Thompson if (identity) CeedCall(CeedFree(identity)); 1418437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1419437c7c90SJeremy L Thompson } 1420ed9e99e6SJeremy L Thompson } 1421ed9e99e6SJeremy L Thompson 1422437c7c90SJeremy L Thompson // Pass out assembled data 1423437c7c90SJeremy L Thompson if (active_bases) *active_bases = data->active_bases; 1424437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1425437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1426437c7c90SJeremy L Thompson 1427437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1428437c7c90SJeremy L Thompson } 1429437c7c90SJeremy L Thompson 1430437c7c90SJeremy L Thompson /** 1431*ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1432*ba746a46SJeremy L Thompson 1433*ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1434437c7c90SJeremy L Thompson 1435437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1436437c7c90SJeremy L Thompson @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL 1437437c7c90SJeremy L Thompson @param[out] active_elem_rstrs Pointer to hold active CeedElemRestrictions, or NULL 1438437c7c90SJeremy L Thompson 1439437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1440437c7c90SJeremy L Thompson 1441437c7c90SJeremy L Thompson @ref Backend 1442437c7c90SJeremy L Thompson **/ 1443437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs, 1444437c7c90SJeremy L Thompson CeedElemRestriction **active_elem_rstrs) { 1445437c7c90SJeremy L Thompson if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases; 1446437c7c90SJeremy L Thompson if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs; 1447ed9e99e6SJeremy L Thompson 1448ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1449ed9e99e6SJeremy L Thompson } 1450ed9e99e6SJeremy L Thompson 1451ed9e99e6SJeremy L Thompson /** 1452ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1453ed9e99e6SJeremy L Thompson 1454ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1455ed9e99e6SJeremy L Thompson 1456ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1457ed9e99e6SJeremy L Thompson 1458ed9e99e6SJeremy L Thompson @ref Backend 1459ed9e99e6SJeremy L Thompson **/ 1460ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1461ed9e99e6SJeremy L Thompson if (!*data) return CEED_ERROR_SUCCESS; 1462ed9e99e6SJeremy L Thompson 14632b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1464437c7c90SJeremy L Thompson for (CeedInt b = 0; b < (*data)->num_active_bases; b++) { 1465437c7c90SJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->active_bases[b])); 1466437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b])); 1467437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1468437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1469437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1470437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1471437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1472437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1473437c7c90SJeremy L Thompson } 1474437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_bases)); 1475437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->active_elem_rstrs)); 1476437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1477437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1478437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1479437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1480437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1481437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1482437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1483437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1484ed9e99e6SJeremy L Thompson 14852b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1486ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1487ed9e99e6SJeremy L Thompson } 1488ed9e99e6SJeremy L Thompson 1489480fae85SJeremy L Thompson /// @} 1490480fae85SJeremy L Thompson 1491480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1492eaf62fffSJeremy L Thompson /// CeedOperator Public API 1493eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1494eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1495eaf62fffSJeremy L Thompson /// @{ 1496eaf62fffSJeremy L Thompson 1497eaf62fffSJeremy L Thompson /** 1498eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1499eaf62fffSJeremy L Thompson 1500ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1501ea61e9acSJeremy L Thompson The vector 'assembled' is of shape [num_elements, num_input_fields, num_output_fields, num_quad_points] and contains column-major matrices 1502ea61e9acSJeremy L Thompson representing the action of the CeedQFunction for a corresponding quadrature point on an element. Inputs and outputs are in the order provided by the 1503ea61e9acSJeremy L Thompson user when adding CeedOperator fields. For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, 1504ea61e9acSJeremy L Thompson would result in an assembled QFunction that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] 1505ea61e9acSJeremy L Thompson and producing the output [dv_0, dv_1, v]. 1506eaf62fffSJeremy L Thompson 1507ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1508f04ea552SJeremy L Thompson 1509ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1510ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1511ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1512ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1513eaf62fffSJeremy L Thompson 1514eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1515eaf62fffSJeremy L Thompson 1516eaf62fffSJeremy L Thompson @ref User 1517eaf62fffSJeremy L Thompson **/ 15182b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15192b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1520eaf62fffSJeremy L Thompson 1521eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1522d04bbc78SJeremy L Thompson // Backend version 15232b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1524eaf62fffSJeremy L Thompson } else { 1525d04bbc78SJeremy L Thompson // Operator fallback 1526d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1527d04bbc78SJeremy L Thompson 15282b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1529d04bbc78SJeremy L Thompson if (op_fallback) { 15302b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 1531d04bbc78SJeremy L Thompson } else { 1532d04bbc78SJeremy L Thompson // LCOV_EXCL_START 15332b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 1534d04bbc78SJeremy L Thompson // LCOV_EXCL_STOP 1535d04bbc78SJeremy L Thompson } 153670a7ffb3SJeremy L Thompson } 1537eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1538eaf62fffSJeremy L Thompson } 153970a7ffb3SJeremy L Thompson 154070a7ffb3SJeremy L Thompson /** 1541ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 1542ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1543ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1544ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 154570a7ffb3SJeremy L Thompson 1546ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1547ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1548ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1549ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 155070a7ffb3SJeremy L Thompson 155170a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 155270a7ffb3SJeremy L Thompson 155370a7ffb3SJeremy L Thompson @ref User 155470a7ffb3SJeremy L Thompson **/ 15552b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 15562b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 155770a7ffb3SJeremy L Thompson 155870a7ffb3SJeremy L Thompson if (op->LinearAssembleQFunctionUpdate) { 1559d04bbc78SJeremy L Thompson // Backend version 1560480fae85SJeremy L Thompson bool qf_assembled_is_setup; 15612efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 15622efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1563480fae85SJeremy L Thompson 15642b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1565480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1566d04bbc78SJeremy L Thompson bool update_needed; 1567d04bbc78SJeremy L Thompson 15682b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 15692b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 15708b919e6bSJeremy L Thompson if (update_needed) { 15712b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request)); 15728b919e6bSJeremy L Thompson } 157370a7ffb3SJeremy L Thompson } else { 15742b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request)); 15752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 157670a7ffb3SJeremy L Thompson } 15772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 15782efa2d85SJeremy L Thompson 1579d04bbc78SJeremy L Thompson // Copy reference from internally held copy 158070a7ffb3SJeremy L Thompson *assembled = NULL; 158170a7ffb3SJeremy L Thompson *rstr = NULL; 15822b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 15832b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 15842b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 15852b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 158670a7ffb3SJeremy L Thompson } else { 1587d04bbc78SJeremy L Thompson // Operator fallback 1588d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1589d04bbc78SJeremy L Thompson 15902b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1591d04bbc78SJeremy L Thompson if (op_fallback) { 15922b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 1593d04bbc78SJeremy L Thompson } else { 1594d04bbc78SJeremy L Thompson // LCOV_EXCL_START 15952b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 1596d04bbc78SJeremy L Thompson // LCOV_EXCL_STOP 159770a7ffb3SJeremy L Thompson } 159870a7ffb3SJeremy L Thompson } 159970a7ffb3SJeremy L Thompson 160070a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1601eaf62fffSJeremy L Thompson } 1602eaf62fffSJeremy L Thompson 1603eaf62fffSJeremy L Thompson /** 1604eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1605eaf62fffSJeremy L Thompson 1606eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1607eaf62fffSJeremy L Thompson 1608ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1609eaf62fffSJeremy L Thompson 1610ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1611f04ea552SJeremy L Thompson 1612ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1613eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1614ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1615eaf62fffSJeremy L Thompson 1616eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1617eaf62fffSJeremy L Thompson 1618eaf62fffSJeremy L Thompson @ref User 1619eaf62fffSJeremy L Thompson **/ 16202b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1621f3d47e36SJeremy L Thompson bool is_composite; 16222b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1623f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1624eaf62fffSJeremy L Thompson 1625c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16262b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16272b730f8bSJeremy L Thompson if (input_size != output_size) { 1628c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1629c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1630c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 16312b730f8bSJeremy L Thompson } 1632c9366a6bSJeremy L Thompson 1633f3d47e36SJeremy L Thompson // Early exit for empty operator 1634f3d47e36SJeremy L Thompson if (!is_composite) { 1635f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1636f3d47e36SJeremy L Thompson 1637f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1638f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1639f3d47e36SJeremy L Thompson } 1640f3d47e36SJeremy L Thompson 1641eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1642d04bbc78SJeremy L Thompson // Backend version 16432b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1644eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1645eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1646d04bbc78SJeremy L Thompson // Backend version with zeroing first 16472b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16482b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1649eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1650eaf62fffSJeremy L Thompson } else { 1651d04bbc78SJeremy L Thompson // Operator fallback 1652d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1653d04bbc78SJeremy L Thompson 16542b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1655d04bbc78SJeremy L Thompson if (op_fallback) { 16562b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1657eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1658eaf62fffSJeremy L Thompson } 1659eaf62fffSJeremy L Thompson } 1660eaf62fffSJeremy L Thompson // Default interface implementation 16612b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16622b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1663d04bbc78SJeremy L Thompson 1664eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1665eaf62fffSJeremy L Thompson } 1666eaf62fffSJeremy L Thompson 1667eaf62fffSJeremy L Thompson /** 1668eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1669eaf62fffSJeremy L Thompson 1670eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1671eaf62fffSJeremy L Thompson 1672ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1673eaf62fffSJeremy L Thompson 1674ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1675f04ea552SJeremy L Thompson 1676ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1677eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1678ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1679eaf62fffSJeremy L Thompson 1680eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1681eaf62fffSJeremy L Thompson 1682eaf62fffSJeremy L Thompson @ref User 1683eaf62fffSJeremy L Thompson **/ 16842b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1685f3d47e36SJeremy L Thompson bool is_composite; 16862b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1687f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1688eaf62fffSJeremy L Thompson 1689c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16902b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16912b730f8bSJeremy L Thompson if (input_size != output_size) { 1692c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1693c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1694c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 16952b730f8bSJeremy L Thompson } 1696c9366a6bSJeremy L Thompson 1697f3d47e36SJeremy L Thompson // Early exit for empty operator 1698f3d47e36SJeremy L Thompson if (!is_composite) { 1699f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1700f3d47e36SJeremy L Thompson 1701f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1702f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1703f3d47e36SJeremy L Thompson } 1704f3d47e36SJeremy L Thompson 1705eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1706d04bbc78SJeremy L Thompson // Backend version 17072b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1708eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1709eaf62fffSJeremy L Thompson } else { 1710d04bbc78SJeremy L Thompson // Operator fallback 1711d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1712d04bbc78SJeremy L Thompson 17132b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1714d04bbc78SJeremy L Thompson if (op_fallback) { 17152b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1716eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1717eaf62fffSJeremy L Thompson } 1718eaf62fffSJeremy L Thompson } 1719eaf62fffSJeremy L Thompson // Default interface implementation 1720eaf62fffSJeremy L Thompson if (is_composite) { 17212b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1722eaf62fffSJeremy L Thompson } else { 17232b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1724eaf62fffSJeremy L Thompson } 1725d04bbc78SJeremy L Thompson 1726d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1727eaf62fffSJeremy L Thompson } 1728eaf62fffSJeremy L Thompson 1729eaf62fffSJeremy L Thompson /** 1730eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1731eaf62fffSJeremy L Thompson 1732ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1733eaf62fffSJeremy L Thompson 1734ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1735eaf62fffSJeremy L Thompson 1736ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1737f04ea552SJeremy L Thompson 1738ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1739ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1740ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1741ea61e9acSJeremy L Thompson component in]. 1742ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1743eaf62fffSJeremy L Thompson 1744eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1745eaf62fffSJeremy L Thompson 1746eaf62fffSJeremy L Thompson @ref User 1747eaf62fffSJeremy L Thompson **/ 17482b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1749f3d47e36SJeremy L Thompson bool is_composite; 17502b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1751f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1752eaf62fffSJeremy L Thompson 1753c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 17542b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 17552b730f8bSJeremy L Thompson if (input_size != output_size) { 1756c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1757c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1758c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 17592b730f8bSJeremy L Thompson } 1760c9366a6bSJeremy L Thompson 1761f3d47e36SJeremy L Thompson // Early exit for empty operator 1762f3d47e36SJeremy L Thompson if (!is_composite) { 1763f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1764f3d47e36SJeremy L Thompson 1765f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1766f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1767f3d47e36SJeremy L Thompson } 1768f3d47e36SJeremy L Thompson 1769eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1770d04bbc78SJeremy L Thompson // Backend version 17712b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1772eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1773eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1774d04bbc78SJeremy L Thompson // Backend version with zeroing first 17752b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17762b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1777eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1778eaf62fffSJeremy L Thompson } else { 1779d04bbc78SJeremy L Thompson // Operator fallback 1780d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1781d04bbc78SJeremy L Thompson 17822b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1783d04bbc78SJeremy L Thompson if (op_fallback) { 17842b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1785eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1786eaf62fffSJeremy L Thompson } 1787eaf62fffSJeremy L Thompson } 1788eaf62fffSJeremy L Thompson // Default interface implementation 17892b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 17902b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1791d04bbc78SJeremy L Thompson 1792eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1793eaf62fffSJeremy L Thompson } 1794eaf62fffSJeremy L Thompson 1795eaf62fffSJeremy L Thompson /** 1796eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1797eaf62fffSJeremy L Thompson 1798ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1799eaf62fffSJeremy L Thompson 1800ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1801eaf62fffSJeremy L Thompson 1802ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1803f04ea552SJeremy L Thompson 1804ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1805ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1806ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1807ea61e9acSJeremy L Thompson component in]. 1808ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1809eaf62fffSJeremy L Thompson 1810eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1811eaf62fffSJeremy L Thompson 1812eaf62fffSJeremy L Thompson @ref User 1813eaf62fffSJeremy L Thompson **/ 18142b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1815f3d47e36SJeremy L Thompson bool is_composite; 18162b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1817f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1818eaf62fffSJeremy L Thompson 1819c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 18202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 18212b730f8bSJeremy L Thompson if (input_size != output_size) { 1822c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1823c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1824c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 18252b730f8bSJeremy L Thompson } 1826c9366a6bSJeremy L Thompson 1827f3d47e36SJeremy L Thompson // Early exit for empty operator 1828f3d47e36SJeremy L Thompson if (!is_composite) { 1829f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1830f3d47e36SJeremy L Thompson 1831f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1832f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1833f3d47e36SJeremy L Thompson } 1834f3d47e36SJeremy L Thompson 1835eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1836d04bbc78SJeremy L Thompson // Backend version 18372b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1838eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1839eaf62fffSJeremy L Thompson } else { 1840d04bbc78SJeremy L Thompson // Operator fallback 1841d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1842d04bbc78SJeremy L Thompson 18432b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1844d04bbc78SJeremy L Thompson if (op_fallback) { 18452b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1846eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1847eaf62fffSJeremy L Thompson } 1848eaf62fffSJeremy L Thompson } 1849ea61e9acSJeremy L Thompson // Default interface implementation 1850eaf62fffSJeremy L Thompson if (is_composite) { 18512b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1852eaf62fffSJeremy L Thompson } else { 18532b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1854eaf62fffSJeremy L Thompson } 1855d04bbc78SJeremy L Thompson 1856d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1857eaf62fffSJeremy L Thompson } 1858eaf62fffSJeremy L Thompson 1859eaf62fffSJeremy L Thompson /** 1860eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1861eaf62fffSJeremy L Thompson 1862ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1863eaf62fffSJeremy L Thompson 1864ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1865ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the number of entries and their (i, j) 1866ea61e9acSJeremy L Thompson locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1867eaf62fffSJeremy L Thompson 1868eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1869eaf62fffSJeremy L Thompson 1870ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1871f04ea552SJeremy L Thompson 1872eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1873eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1874eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1875eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1876eaf62fffSJeremy L Thompson 1877eaf62fffSJeremy L Thompson @ref User 1878eaf62fffSJeremy L Thompson **/ 18792b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1880eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries; 1881eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1882eaf62fffSJeremy L Thompson bool is_composite; 18832b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1884f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1885eaf62fffSJeremy L Thompson 1886eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1887d04bbc78SJeremy L Thompson // Backend version 18882b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1889eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1890eaf62fffSJeremy L Thompson } else { 1891d04bbc78SJeremy L Thompson // Operator fallback 1892d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1893d04bbc78SJeremy L Thompson 18942b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1895d04bbc78SJeremy L Thompson if (op_fallback) { 18962b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1897eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1898eaf62fffSJeremy L Thompson } 1899eaf62fffSJeremy L Thompson } 1900eaf62fffSJeremy L Thompson 1901eaf62fffSJeremy L Thompson // Default interface implementation 1902eaf62fffSJeremy L Thompson 1903eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1904eaf62fffSJeremy L Thompson *num_entries = 0; 1905eaf62fffSJeremy L Thompson if (is_composite) { 1906c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1907c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 190892ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 19092b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1910eaf62fffSJeremy L Thompson *num_entries += single_entries; 1911eaf62fffSJeremy L Thompson } 1912eaf62fffSJeremy L Thompson } else { 19132b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1914eaf62fffSJeremy L Thompson *num_entries += single_entries; 1915eaf62fffSJeremy L Thompson } 19162b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 19172b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1918eaf62fffSJeremy L Thompson 1919eaf62fffSJeremy L Thompson // assemble nonzero locations 1920eaf62fffSJeremy L Thompson CeedInt offset = 0; 1921eaf62fffSJeremy L Thompson if (is_composite) { 1922c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1923c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 192492ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 19252b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 19262b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1927eaf62fffSJeremy L Thompson offset += single_entries; 1928eaf62fffSJeremy L Thompson } 1929eaf62fffSJeremy L Thompson } else { 19302b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1931eaf62fffSJeremy L Thompson } 1932eaf62fffSJeremy L Thompson 1933eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1934eaf62fffSJeremy L Thompson } 1935eaf62fffSJeremy L Thompson 1936eaf62fffSJeremy L Thompson /** 1937eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1938eaf62fffSJeremy L Thompson 1939ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1940eaf62fffSJeremy L Thompson 1941ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1942ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the values of the nonzero entries to be added, 1943ea61e9acSJeremy L Thompson their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1944eaf62fffSJeremy L Thompson 1945eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1946eaf62fffSJeremy L Thompson 1947ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1948f04ea552SJeremy L Thompson 1949eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1950eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1951eaf62fffSJeremy L Thompson 1952eaf62fffSJeremy L Thompson @ref User 1953eaf62fffSJeremy L Thompson **/ 1954eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1955eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries = 0; 1956eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1957f3d47e36SJeremy L Thompson bool is_composite; 19582b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1959f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1960f3d47e36SJeremy L Thompson 1961f3d47e36SJeremy L Thompson // Early exit for empty operator 1962f3d47e36SJeremy L Thompson if (!is_composite) { 1963f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1964f3d47e36SJeremy L Thompson 1965f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1966f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1967f3d47e36SJeremy L Thompson } 1968eaf62fffSJeremy L Thompson 1969eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1970d04bbc78SJeremy L Thompson // Backend version 19712b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1972eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1973eaf62fffSJeremy L Thompson } else { 1974d04bbc78SJeremy L Thompson // Operator fallback 1975d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1976d04bbc78SJeremy L Thompson 19772b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1978d04bbc78SJeremy L Thompson if (op_fallback) { 19792b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1980eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1981eaf62fffSJeremy L Thompson } 1982eaf62fffSJeremy L Thompson } 1983eaf62fffSJeremy L Thompson 1984eaf62fffSJeremy L Thompson // Default interface implementation 1985eaf62fffSJeremy L Thompson CeedInt offset = 0; 1986eaf62fffSJeremy L Thompson if (is_composite) { 1987c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1988c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1989cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 19902b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 19912b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1992eaf62fffSJeremy L Thompson offset += single_entries; 1993eaf62fffSJeremy L Thompson } 1994eaf62fffSJeremy L Thompson } else { 19952b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1996eaf62fffSJeremy L Thompson } 1997eaf62fffSJeremy L Thompson 1998eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1999eaf62fffSJeremy L Thompson } 2000eaf62fffSJeremy L Thompson 2001eaf62fffSJeremy L Thompson /** 200275f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 200375f0d5a4SJeremy L Thompson 200475f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 200575f0d5a4SJeremy L Thompson 200675f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 200775f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 200875f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 200975f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 201075f0d5a4SJeremy L Thompson 201175f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 201275f0d5a4SJeremy L Thompson 201375f0d5a4SJeremy L Thompson @ref User 201475f0d5a4SJeremy L Thompson **/ 201575f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 201675f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 201775f0d5a4SJeremy L Thompson 201875f0d5a4SJeremy L Thompson Ceed ceed; 2019b275c451SJeremy L Thompson CeedInt num_suboperators; 202075f0d5a4SJeremy L Thompson CeedSize l_vec_len; 202175f0d5a4SJeremy L Thompson CeedScalar *mult_array; 202275f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 2023437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr; 2024b275c451SJeremy L Thompson CeedOperator *sub_operators; 202575f0d5a4SJeremy L Thompson 202675f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 202775f0d5a4SJeremy L Thompson 202875f0d5a4SJeremy L Thompson // Zero mult vector 202975f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 203075f0d5a4SJeremy L Thompson 203175f0d5a4SJeremy L Thompson // Get suboperators 2032b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2033b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 2034b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 203575f0d5a4SJeremy L Thompson 203675f0d5a4SJeremy L Thompson // Work vector 203775f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 203875f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 203975f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 204075f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 204175f0d5a4SJeremy L Thompson 204275f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 2043b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 204475f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 204575f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 204675f0d5a4SJeremy L Thompson 204775f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 204875f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 204975f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 205075f0d5a4SJeremy L Thompson } 205175f0d5a4SJeremy L Thompson 205275f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2053437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 2054437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 205575f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 2056437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 2057437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 205875f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 205975f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 206075f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 206175f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 206275f0d5a4SJeremy L Thompson } 206375f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 206475f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 206575f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 206675f0d5a4SJeremy L Thompson } 206775f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2068811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 206975f0d5a4SJeremy L Thompson 207075f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 207175f0d5a4SJeremy L Thompson } 207275f0d5a4SJeremy L Thompson 207375f0d5a4SJeremy L Thompson /** 2074ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2075ea61e9acSJeremy L Thompson grid interpolation 2076eaf62fffSJeremy L Thompson 207758e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2078f04ea552SJeremy L Thompson 2079eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 2080eaf62fffSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter 2081eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2082eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2083eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 2084eaf62fffSJeremy L Thompson @param[out] op_prolong Coarse to fine operator 2085eaf62fffSJeremy L Thompson @param[out] op_restrict Fine to coarse operator 2086eaf62fffSJeremy L Thompson 2087eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2088eaf62fffSJeremy L Thompson 2089eaf62fffSJeremy L Thompson @ref User 2090eaf62fffSJeremy L Thompson **/ 20912b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20922b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 20932b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2094eaf62fffSJeremy L Thompson 2095f113e5dcSJeremy L Thompson // Build prolongation matrix 2096f113e5dcSJeremy L Thompson CeedBasis basis_fine, basis_c_to_f; 20972b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 20982b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 2099eaf62fffSJeremy L Thompson 2100f113e5dcSJeremy L Thompson // Core code 21012b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2102f113e5dcSJeremy L Thompson 2103eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2104eaf62fffSJeremy L Thompson } 2105eaf62fffSJeremy L Thompson 2106eaf62fffSJeremy L Thompson /** 2107ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2108eaf62fffSJeremy L Thompson 210958e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2110f04ea552SJeremy L Thompson 2111eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 2112eaf62fffSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter 2113eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2114eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2115eaf62fffSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation 2116eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 2117eaf62fffSJeremy L Thompson @param[out] op_prolong Coarse to fine operator 2118eaf62fffSJeremy L Thompson @param[out] op_restrict Fine to coarse operator 2119eaf62fffSJeremy L Thompson 2120eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2121eaf62fffSJeremy L Thompson 2122eaf62fffSJeremy L Thompson @ref User 2123eaf62fffSJeremy L Thompson **/ 21242b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21252b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 21262b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 21272b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2128eaf62fffSJeremy L Thompson Ceed ceed; 21292b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2130eaf62fffSJeremy L Thompson 2131eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2132eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21332b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2134eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21352b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21362b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21372b730f8bSJeremy L Thompson if (Q_f != Q_c) { 2138eaf62fffSJeremy L Thompson // LCOV_EXCL_START 21392b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2140eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 21412b730f8bSJeremy L Thompson } 2142eaf62fffSJeremy L Thompson 2143eaf62fffSJeremy L Thompson // Coarse to fine basis 2144eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 21452b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 21462b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 21472b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 21482b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 21492b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2150eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 21512b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 21522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 21532b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 2154eaf62fffSJeremy L Thompson CeedBasis basis_c_to_f; 21552b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 21562b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 21572b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 21582b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 2159eaf62fffSJeremy L Thompson 2160eaf62fffSJeremy L Thompson // Core code 21612b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2162eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2163eaf62fffSJeremy L Thompson } 2164eaf62fffSJeremy L Thompson 2165eaf62fffSJeremy L Thompson /** 2166ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2167eaf62fffSJeremy L Thompson 216858e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2169f04ea552SJeremy L Thompson 2170eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 2171eaf62fffSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter 2172eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2173eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2174eaf62fffSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation 2175eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 2176eaf62fffSJeremy L Thompson @param[out] op_prolong Coarse to fine operator 2177eaf62fffSJeremy L Thompson @param[out] op_restrict Fine to coarse operator 2178eaf62fffSJeremy L Thompson 2179eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2180eaf62fffSJeremy L Thompson 2181eaf62fffSJeremy L Thompson @ref User 2182eaf62fffSJeremy L Thompson **/ 21832b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 21842b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2185eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 21862b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2187eaf62fffSJeremy L Thompson Ceed ceed; 21882b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2189eaf62fffSJeremy L Thompson 2190eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2191eaf62fffSJeremy L Thompson CeedBasis basis_fine; 21922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2193eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 21942b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 21952b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 21962b730f8bSJeremy L Thompson if (Q_f != Q_c) { 2197eaf62fffSJeremy L Thompson // LCOV_EXCL_START 21982b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2199eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 22002b730f8bSJeremy L Thompson } 2201eaf62fffSJeremy L Thompson 2202eaf62fffSJeremy L Thompson // Coarse to fine basis 2203eaf62fffSJeremy L Thompson CeedElemTopology topo; 22042b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2205eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 22062b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 22072b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 22082b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 22092b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2210eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 22112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 22122b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 22132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 2214eaf62fffSJeremy L Thompson CeedBasis basis_c_to_f; 22152b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 22162b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 22172b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 22182b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 2219eaf62fffSJeremy L Thompson 2220eaf62fffSJeremy L Thompson // Core code 22212b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2222eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2223eaf62fffSJeremy L Thompson } 2224eaf62fffSJeremy L Thompson 2225eaf62fffSJeremy L Thompson /** 2226ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2227eaf62fffSJeremy L Thompson 2228ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2229ea61e9acSJeremy L Thompson This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, M = V^T V, K = V^T S V. 2230ea61e9acSJeremy L Thompson The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form V^T 2231ea61e9acSJeremy L Thompson S^hat V. The CeedOperator must be linear and non-composite. The associated CeedQFunction must therefore also be linear. 2232eaf62fffSJeremy L Thompson 2233ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2234f04ea552SJeremy L Thompson 2235ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2236ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2237ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2238eaf62fffSJeremy L Thompson 2239eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2240eaf62fffSJeremy L Thompson 2241480fae85SJeremy L Thompson @ref User 2242eaf62fffSJeremy L Thompson **/ 22432b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 22442b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2245eaf62fffSJeremy L Thompson 2246eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2247d04bbc78SJeremy L Thompson // Backend version 22482b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2249eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2250eaf62fffSJeremy L Thompson } else { 2251d04bbc78SJeremy L Thompson // Operator fallback 2252d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2253d04bbc78SJeremy L Thompson 22542b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2255d04bbc78SJeremy L Thompson if (op_fallback) { 22562b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2257eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2258eaf62fffSJeremy L Thompson } 2259eaf62fffSJeremy L Thompson } 2260eaf62fffSJeremy L Thompson 2261d04bbc78SJeremy L Thompson // Default interface implementation 2262eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 22632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 22642b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2265eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2266eaf62fffSJeremy L Thompson CeedQFunction qf; 22672b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2268eaf62fffSJeremy L Thompson 2269eaf62fffSJeremy L Thompson // Determine active input basis 2270eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2271eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2272eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2273eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2274eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2275eaf62fffSJeremy L Thompson CeedInt num_input_fields; 22762b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 22772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2278eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2279eaf62fffSJeremy L Thompson CeedVector vec; 22802b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2281eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2282eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 22832b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2284eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2285eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 22862b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 22872b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2288eaf62fffSJeremy L Thompson } 2289eaf62fffSJeremy L Thompson } 22902b730f8bSJeremy L Thompson if (!basis) { 2291eaf62fffSJeremy L Thompson // LCOV_EXCL_START 2292eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "No active field set"); 2293eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 22942b730f8bSJeremy L Thompson } 2295e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2296e79b91d9SJeremy L Thompson CeedInt P_1d, Q_1d, elem_size, num_qpts, dim, num_comp = 1, num_elem = 1; 22972b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 22982b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis, &elem_size)); 22992b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 23002b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 23012b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 23022b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 23032b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 23042b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2305eaf62fffSJeremy L Thompson 2306eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 2307eaf62fffSJeremy L Thompson bool tensor_basis; 23082b730f8bSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &tensor_basis)); 23092b730f8bSJeremy L Thompson if (!tensor_basis) { 2310eaf62fffSJeremy L Thompson // LCOV_EXCL_START 23112b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2312eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 23132b730f8bSJeremy L Thompson } 2314eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 23152b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 23162b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 23172b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 23182b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 23192b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2320eaf62fffSJeremy L Thompson // -- Build matrices 2321eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 23222b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 23232b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 23242b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 23252b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2326eaf62fffSJeremy L Thompson 2327eaf62fffSJeremy L Thompson // -- Diagonalize 23282b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 23292b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 23302b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 23312b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 23322b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 23332b730f8bSJeremy L Thompson } 23342b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2335eaf62fffSJeremy L Thompson 2336eaf62fffSJeremy L Thompson // Assemble QFunction 2337eaf62fffSJeremy L Thompson CeedVector assembled; 2338eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qf; 23392b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2340eaf62fffSJeremy L Thompson CeedInt layout[3]; 23412b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 23422b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2343eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 23442b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2345eaf62fffSJeremy L Thompson 2346eaf62fffSJeremy L Thompson // Calculate element averages 2347eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2348eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2349eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2350eaf62fffSJeremy L Thompson CeedVector q_weight; 23512b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 23522b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 23532b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 23542b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 23552b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2356eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2357eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2358eaf62fffSJeremy L Thompson CeedInt count = 0; 23592b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 23602b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 23612b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 23622b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2363eaf62fffSJeremy L Thompson count++; 2364eaf62fffSJeremy L Thompson } 23652b730f8bSJeremy L Thompson } 23662b730f8bSJeremy L Thompson } 2367eaf62fffSJeremy L Thompson if (count) { 2368eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2369eaf62fffSJeremy L Thompson } else { 2370eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2371eaf62fffSJeremy L Thompson } 2372eaf62fffSJeremy L Thompson } 23732b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 23742b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 23752b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 23762b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2377eaf62fffSJeremy L Thompson 2378eaf62fffSJeremy L Thompson // Build FDM diagonal 2379eaf62fffSJeremy L Thompson CeedVector q_data; 2380eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 23812b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_comp * elem_size, &fdm_diagonal)); 2382eaf62fffSJeremy L Thompson const CeedScalar fdm_diagonal_bound = elem_size * CEED_EPSILON; 23832b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2384eaf62fffSJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 23852b730f8bSJeremy L Thompson if (interp) fdm_diagonal[c * elem_size + n] = 1.0; 23862b730f8bSJeremy L Thompson if (grad) { 2387eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2388eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2389eaf62fffSJeremy L Thompson fdm_diagonal[c * elem_size + n] += lambda[i]; 2390eaf62fffSJeremy L Thompson } 2391eaf62fffSJeremy L Thompson } 23922b730f8bSJeremy L Thompson if (fabs(fdm_diagonal[c * elem_size + n]) < fdm_diagonal_bound) fdm_diagonal[c * elem_size + n] = fdm_diagonal_bound; 23932b730f8bSJeremy L Thompson } 23942b730f8bSJeremy L Thompson } 23952b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * elem_size, &q_data)); 23962b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 23972b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 23982b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 23992b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 24002b730f8bSJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) q_data_array[(e * num_comp + c) * elem_size + n] = 1. / (elem_avg[e] * fdm_diagonal[c * elem_size + n]); 24012b730f8bSJeremy L Thompson } 24022b730f8bSJeremy L Thompson } 24032b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 24042b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 24052b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2406eaf62fffSJeremy L Thompson 2407eaf62fffSJeremy L Thompson // Setup FDM operator 2408eaf62fffSJeremy L Thompson // -- Basis 2409eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2410eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 24112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 24122b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 24132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 24142b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 24152b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 24162b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 24172b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 24182b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 24192b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2420eaf62fffSJeremy L Thompson 2421eaf62fffSJeremy L Thompson // -- Restriction 2422eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2423eaf62fffSJeremy L Thompson CeedInt strides[3] = {1, elem_size, elem_size * num_comp}; 24242b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, elem_size, num_comp, num_elem * num_comp * elem_size, strides, &rstr_qd_i)); 2425eaf62fffSJeremy L Thompson // -- QFunction 2426eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 24272b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 24282b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 24292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 24302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 24312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2432eaf62fffSJeremy L Thompson // -- QFunction context 2433eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 24342b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2435eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2436eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 24372b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 24382b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 24392b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 24402b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2441eaf62fffSJeremy L Thompson // -- Operator 24422b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 24432b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 24442b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 24452b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2446eaf62fffSJeremy L Thompson 2447eaf62fffSJeremy L Thompson // Cleanup 24482b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 24492b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 24502b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 24512b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2452eaf62fffSJeremy L Thompson 2453eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2454eaf62fffSJeremy L Thompson } 2455eaf62fffSJeremy L Thompson 2456eaf62fffSJeremy L Thompson /// @} 2457