13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 82b730f8bSJeremy L Thompson #include <ceed-impl.h> 949aac155SJeremy L Thompson #include <ceed.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 11c85e8640SSebastian Grimberg #include <assert.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 381c66c397SJeremy L Thompson char *source_path_with_name = NULL; 391c66c397SJeremy L Thompson 409e77b9c8SJeremy L Thompson // Check if NULL qf passed in 419e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 429e77b9c8SJeremy L Thompson 43d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4413f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 45d04bbc78SJeremy L Thompson 469e77b9c8SJeremy L Thompson if (qf->source_path) { 472b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 482b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 499e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 519e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 529e77b9c8SJeremy L Thompson } else { 532b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 549e77b9c8SJeremy L Thompson } 559e77b9c8SJeremy L Thompson 562b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 579e77b9c8SJeremy L Thompson { 589e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 599e77b9c8SJeremy L Thompson 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 612b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 629e77b9c8SJeremy L Thompson } 639e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 642b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 659e77b9c8SJeremy L Thompson } 669e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 672b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 689e77b9c8SJeremy L Thompson } 692b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 839e77b9c8SJeremy L Thompson Ceed ceed_fallback; 841c66c397SJeremy L Thompson bool is_composite; 851c66c397SJeremy L Thompson CeedOperator op_fallback; 86eaf62fffSJeremy L Thompson 87805fe78eSJeremy L Thompson // Check not already created 88805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 89805fe78eSJeremy L Thompson 90eaf62fffSJeremy L Thompson // Fallback Ceed 912b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 92d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 93d04bbc78SJeremy L Thompson 94d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9513f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 96eaf62fffSJeremy L Thompson 97eaf62fffSJeremy L Thompson // Clone Op 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1141c66c397SJeremy L Thompson 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1182b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 119805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 120437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis, 1212b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 122805fe78eSJeremy L Thompson } 123805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 124437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis, 1252b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 126805fe78eSJeremy L Thompson } 1272b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 128febe2972SJeremy L Thompson if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 1299e77b9c8SJeremy L Thompson // Cleanup 1302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 133805fe78eSJeremy L Thompson } 1342b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1352b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 136b05f7e9fSJeremy L Thompson // Note: No ref-counting here so we don't get caught in a reference loop. 137b05f7e9fSJeremy L Thompson // The op holds the only reference to op_fallback and is responsible for deleting itself and op_fallback. 138805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 139b05f7e9fSJeremy L Thompson op_fallback->op_fallback_parent = op; 140eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 141eaf62fffSJeremy L Thompson } 142eaf62fffSJeremy L Thompson 143eaf62fffSJeremy L Thompson /** 144ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 145d04bbc78SJeremy L Thompson 146d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 147d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 148d04bbc78SJeremy L Thompson 149d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 150d04bbc78SJeremy L Thompson 151d04bbc78SJeremy L Thompson @ref Developer 152d04bbc78SJeremy L Thompson **/ 153d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 154d04bbc78SJeremy L Thompson // Create if needed 1551c66c397SJeremy L Thompson if (!op->op_fallback) CeedCall(CeedOperatorCreateFallback(op)); 156d04bbc78SJeremy L Thompson if (op->op_fallback) { 157d04bbc78SJeremy L Thompson bool is_debug; 158d04bbc78SJeremy L Thompson 1592b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 160d04bbc78SJeremy L Thompson if (is_debug) { 161b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 162d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 163d04bbc78SJeremy L Thompson 164b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 165b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 166b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1672b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 168d04bbc78SJeremy L Thompson 16923d4529eSJeremy L Thompson CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n"); 170b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1712b730f8bSJeremy L Thompson op->op_fallback); 172d04bbc78SJeremy L Thompson } 173d04bbc78SJeremy L Thompson } 174d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 175d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 176d04bbc78SJeremy L Thompson } 177d04bbc78SJeremy L Thompson 178d04bbc78SJeremy L Thompson /** 1792e8f5c67SJeremy L Thompson @brief Get the parent CeedOperator for a fallback CeedOperator 180bb229da9SJeremy L Thompson 181bb229da9SJeremy L Thompson @param[in] op CeedOperator context 182bb229da9SJeremy L Thompson @param[out] parent Variable to store parent CeedOperator context 183bb229da9SJeremy L Thompson 184bb229da9SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 185bb229da9SJeremy L Thompson 186bb229da9SJeremy L Thompson @ref Developer 187bb229da9SJeremy L Thompson **/ 188bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParent(CeedOperator op, CeedOperator *parent) { 189bb229da9SJeremy L Thompson *parent = op->op_fallback_parent ? op->op_fallback_parent : NULL; 190bb229da9SJeremy L Thompson return CEED_ERROR_SUCCESS; 191bb229da9SJeremy L Thompson } 192bb229da9SJeremy L Thompson 193bb229da9SJeremy L Thompson /** 1942e8f5c67SJeremy L Thompson @brief Get the Ceed context of the parent CeedOperator for a fallback CeedOperator 195bb229da9SJeremy L Thompson 196bb229da9SJeremy L Thompson @param[in] op CeedOperator context 197bb229da9SJeremy L Thompson @param[out] parent Variable to store parent Ceed context 198bb229da9SJeremy L Thompson 199bb229da9SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 200bb229da9SJeremy L Thompson 201bb229da9SJeremy L Thompson @ref Developer 202bb229da9SJeremy L Thompson **/ 203bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParentCeed(CeedOperator op, Ceed *parent) { 204e984cf9aSJeremy L Thompson *parent = op->op_fallback_parent ? op->op_fallback_parent->ceed : op->ceed; 205bb229da9SJeremy L Thompson return CEED_ERROR_SUCCESS; 206bb229da9SJeremy L Thompson } 207bb229da9SJeremy L Thompson 208bb229da9SJeremy L Thompson /** 209eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 210eaf62fffSJeremy L Thompson 211352a5e7cSSebastian Grimberg @param[in] basis CeedBasis from which to get the basis matrix 212eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 213eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 214eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 215eaf62fffSJeremy L Thompson 216eaf62fffSJeremy L Thompson @ref Developer 217eaf62fffSJeremy L Thompson **/ 218352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) { 219eaf62fffSJeremy L Thompson switch (eval_mode) { 220eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 221eaf62fffSJeremy L Thompson *basis_ptr = identity; 222eaf62fffSJeremy L Thompson break; 223eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 224352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetInterp(basis, basis_ptr)); 225eaf62fffSJeremy L Thompson break; 226eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 227352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetGrad(basis, basis_ptr)); 228352a5e7cSSebastian Grimberg break; 229352a5e7cSSebastian Grimberg case CEED_EVAL_DIV: 230352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetDiv(basis, basis_ptr)); 231352a5e7cSSebastian Grimberg break; 232352a5e7cSSebastian Grimberg case CEED_EVAL_CURL: 233352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetCurl(basis, basis_ptr)); 234eaf62fffSJeremy L Thompson break; 235eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 236eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 237eaf62fffSJeremy L Thompson } 238ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 239352a5e7cSSebastian Grimberg return CEED_ERROR_SUCCESS; 240eaf62fffSJeremy L Thompson } 241eaf62fffSJeremy L Thompson 242eaf62fffSJeremy L Thompson /** 243eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 244eaf62fffSJeremy L Thompson 245eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 246ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 247bd83916cSSebastian Grimberg @param[in] is_point_block Boolean flag to assemble diagonal or point block diagonal 248eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 249eaf62fffSJeremy L Thompson 250eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 251eaf62fffSJeremy L Thompson 252eaf62fffSJeremy L Thompson @ref Developer 253eaf62fffSJeremy L Thompson **/ 254bd83916cSSebastian Grimberg static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_point_block, CeedVector assembled) { 255eaf62fffSJeremy L Thompson Ceed ceed; 256506b1a0cSSebastian Grimberg bool is_composite; 257506b1a0cSSebastian Grimberg 258506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetCeed(op, &ceed)); 259506b1a0cSSebastian Grimberg CeedCall(CeedOperatorIsComposite(op, &is_composite)); 260506b1a0cSSebastian Grimberg CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 261506b1a0cSSebastian Grimberg 262506b1a0cSSebastian Grimberg // Assemble QFunction 263506b1a0cSSebastian Grimberg CeedInt layout_qf[3]; 264437c7c90SJeremy L Thompson const CeedScalar *assembled_qf_array; 265c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 266c5f45aeaSJeremy L Thompson CeedElemRestriction assembled_elem_rstr = NULL; 267437c7c90SJeremy L Thompson 268437c7c90SJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request)); 269506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout_qf)); 270437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 271437c7c90SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 272eaf62fffSJeremy L Thompson 273ed9e99e6SJeremy L Thompson // Get assembly data 274437c7c90SJeremy L Thompson const CeedEvalMode **eval_modes_in, **eval_modes_out; 275506b1a0cSSebastian Grimberg CeedInt num_active_bases_in, *num_eval_modes_in, num_active_bases_out, *num_eval_modes_out; 276437c7c90SJeremy L Thompson CeedSize **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components; 277506b1a0cSSebastian Grimberg CeedBasis *active_bases_in, *active_bases_out; 278506b1a0cSSebastian Grimberg CeedElemRestriction *active_elem_rstrs_in, *active_elem_rstrs_out; 2791c66c397SJeremy L Thompson CeedOperatorAssemblyData data; 2801c66c397SJeremy L Thompson 281437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 282506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases_in, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in, 283506b1a0cSSebastian Grimberg &num_active_bases_out, &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, 284506b1a0cSSebastian Grimberg &num_output_components)); 285506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases_in, NULL, NULL, &active_bases_out, NULL)); 286506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs_in, NULL, &active_elem_rstrs_out)); 287506b1a0cSSebastian Grimberg 288506b1a0cSSebastian Grimberg CeedCheck(num_active_bases_in == num_active_bases_out, ceed, CEED_ERROR_UNSUPPORTED, 289506b1a0cSSebastian Grimberg "Cannot assemble operator diagonal with different numbers of input and output active bases"); 290437c7c90SJeremy L Thompson 291437c7c90SJeremy L Thompson // Loop over all active bases 292506b1a0cSSebastian Grimberg for (CeedInt b = 0; b < num_active_bases_in; b++) { 2931c66c397SJeremy L Thompson bool has_eval_none = false; 294506b1a0cSSebastian Grimberg CeedInt num_elem, num_nodes, num_qpts, num_comp; 2951c66c397SJeremy L Thompson CeedScalar *elem_diag_array, *identity = NULL; 2961c66c397SJeremy L Thompson CeedVector elem_diag; 2977c1dbaffSSebastian Grimberg CeedElemRestriction diag_elem_rstr; 2981c66c397SJeremy L Thompson 299506b1a0cSSebastian Grimberg CeedCheck(active_elem_rstrs_in[b] == active_elem_rstrs_out[b], ceed, CEED_ERROR_UNSUPPORTED, 300506b1a0cSSebastian Grimberg "Cannot assemble operator diagonal with different input and output active element restrictions"); 301506b1a0cSSebastian Grimberg 3021c66c397SJeremy L Thompson // Assemble point block diagonal restriction, if needed 303bd83916cSSebastian Grimberg if (is_point_block) { 304506b1a0cSSebastian Grimberg CeedCall(CeedOperatorCreateActivePointBlockRestriction(active_elem_rstrs_in[b], &diag_elem_rstr)); 3057c1dbaffSSebastian Grimberg } else { 306506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateUnsignedCopy(active_elem_rstrs_in[b], &diag_elem_rstr)); 307eaf62fffSJeremy L Thompson } 308eaf62fffSJeremy L Thompson 309eaf62fffSJeremy L Thompson // Create diagonal vector 310437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag)); 311eaf62fffSJeremy L Thompson 312eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3132b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3142b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 315437c7c90SJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem)); 316506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(active_bases_in[b], &num_nodes)); 317506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(active_bases_in[b], &num_comp)); 318506b1a0cSSebastian Grimberg if (active_bases_in[b] == CEED_BASIS_NONE) num_qpts = num_nodes; 319506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(active_bases_in[b], &num_qpts)); 320506b1a0cSSebastian Grimberg 321506b1a0cSSebastian Grimberg if (active_bases_in[b] != active_bases_out[b]) { 322506b1a0cSSebastian Grimberg CeedInt num_nodes_out, num_qpts_out, num_comp_out; 323506b1a0cSSebastian Grimberg 324506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(active_bases_out[b], &num_nodes_out)); 325506b1a0cSSebastian Grimberg CeedCheck(num_nodes == num_nodes_out, ceed, CEED_ERROR_UNSUPPORTED, "Active input and output bases must have the same number of nodes"); 326506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(active_bases_out[b], &num_comp_out)); 327506b1a0cSSebastian Grimberg CeedCheck(num_comp == num_comp_out, ceed, CEED_ERROR_UNSUPPORTED, "Active input and output bases must have the same number of components"); 328506b1a0cSSebastian Grimberg if (active_bases_out[b] == CEED_BASIS_NONE) num_qpts_out = num_nodes_out; 329506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(active_bases_out[b], &num_qpts_out)); 330506b1a0cSSebastian Grimberg CeedCheck(num_qpts == num_qpts_out, ceed, CEED_ERROR_UNSUPPORTED, 331506b1a0cSSebastian Grimberg "Active input and output bases must have the same number of quadrature points"); 332506b1a0cSSebastian Grimberg } 333ed9e99e6SJeremy L Thompson 334352a5e7cSSebastian Grimberg // Construct identity matrix for basis if required 335437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) { 336437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE); 337ed9e99e6SJeremy L Thompson } 338437c7c90SJeremy L Thompson for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) { 339437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE); 340ed9e99e6SJeremy L Thompson } 341ed9e99e6SJeremy L Thompson if (has_eval_none) { 3422b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3432b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 344eaf62fffSJeremy L Thompson } 345352a5e7cSSebastian Grimberg 346eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 347eaf62fffSJeremy L Thompson // Each element 348b94338b9SJed Brown for (CeedSize e = 0; e < num_elem; e++) { 349eaf62fffSJeremy L Thompson // Each basis eval mode pair 350352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 351352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 3521c66c397SJeremy L Thompson 353437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) { 3541c66c397SJeremy L Thompson CeedInt d_in = 0, q_comp_in; 355437c7c90SJeremy L Thompson const CeedScalar *B_t = NULL; 3561c66c397SJeremy L Thompson CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 3571c66c397SJeremy L Thompson 358506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetBasisPointer(active_bases_out[b], eval_modes_out[b][e_out], identity, &B_t)); 359506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases_out[b], eval_modes_out[b][e_out], &q_comp_out)); 360352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 361352a5e7cSSebastian Grimberg if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 362352a5e7cSSebastian Grimberg else B_t = &B_t[(++d_out) * num_qpts * num_nodes]; 363352a5e7cSSebastian Grimberg } 364352a5e7cSSebastian Grimberg eval_mode_out_prev = eval_modes_out[b][e_out]; 365352a5e7cSSebastian Grimberg 366437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) { 367437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 3681c66c397SJeremy L Thompson 369506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetBasisPointer(active_bases_in[b], eval_modes_in[b][e_in], identity, &B)); 370506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(active_bases_in[b], eval_modes_in[b][e_in], &q_comp_in)); 371352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 372352a5e7cSSebastian Grimberg if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 373352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 374352a5e7cSSebastian Grimberg } 375352a5e7cSSebastian Grimberg eval_mode_in_prev = eval_modes_in[b][e_in]; 376352a5e7cSSebastian Grimberg 377eaf62fffSJeremy L Thompson // Each component 378506b1a0cSSebastian Grimberg for (CeedInt c_out = 0; c_out < num_comp; c_out++) { 379437c7c90SJeremy L Thompson // Each qpt/node pair 3802b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 381bd83916cSSebastian Grimberg if (is_point_block) { 382eaf62fffSJeremy L Thompson // Point Block Diagonal 383506b1a0cSSebastian Grimberg for (CeedInt c_in = 0; c_in < num_comp; c_in++) { 384b94338b9SJed Brown const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 385506b1a0cSSebastian Grimberg const CeedScalar qf_value = assembled_qf_array[q * layout_qf[0] + c_offset * layout_qf[1] + e * layout_qf[2]]; 3861c66c397SJeremy L Thompson 3872b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 388506b1a0cSSebastian Grimberg elem_diag_array[((e * num_comp + c_out) * num_comp + c_in) * num_nodes + n] += 389437c7c90SJeremy L Thompson B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 390eaf62fffSJeremy L Thompson } 3912b730f8bSJeremy L Thompson } 392eaf62fffSJeremy L Thompson } else { 393eaf62fffSJeremy L Thompson // Diagonal Only 394437c7c90SJeremy L Thompson const CeedInt c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out; 395506b1a0cSSebastian Grimberg const CeedScalar qf_value = assembled_qf_array[q * layout_qf[0] + c_offset * layout_qf[1] + e * layout_qf[2]]; 3961c66c397SJeremy L Thompson 3972b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 398506b1a0cSSebastian Grimberg elem_diag_array[(e * num_comp + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n]; 399eaf62fffSJeremy L Thompson } 400eaf62fffSJeremy L Thompson } 401eaf62fffSJeremy L Thompson } 402eaf62fffSJeremy L Thompson } 4032b730f8bSJeremy L Thompson } 4042b730f8bSJeremy L Thompson } 4052b730f8bSJeremy L Thompson } 4062b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 407eaf62fffSJeremy L Thompson 408eaf62fffSJeremy L Thompson // Assemble local operator diagonal 4097c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionApply(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 410eaf62fffSJeremy L Thompson 411eaf62fffSJeremy L Thompson // Cleanup 4127c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr)); 4132b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 4142b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 415437c7c90SJeremy L Thompson } 416437c7c90SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 417437c7c90SJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 418eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 419eaf62fffSJeremy L Thompson } 420eaf62fffSJeremy L Thompson 421eaf62fffSJeremy L Thompson /** 422eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 423eaf62fffSJeremy L Thompson 424eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 425ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 426bd83916cSSebastian Grimberg @param[in] is_point_block Boolean flag to assemble diagonal or point block diagonal 427eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 428eaf62fffSJeremy L Thompson 429eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 430eaf62fffSJeremy L Thompson 431eaf62fffSJeremy L Thompson @ref Developer 432eaf62fffSJeremy L Thompson **/ 433bd83916cSSebastian Grimberg static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_point_block, 434eaf62fffSJeremy L Thompson CeedVector assembled) { 435eaf62fffSJeremy L Thompson CeedInt num_sub; 436eaf62fffSJeremy L Thompson CeedOperator *suboperators; 4371c66c397SJeremy L Thompson 438c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 439c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 440eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 441bd83916cSSebastian Grimberg if (is_point_block) { 4422b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4436aa95790SJeremy L Thompson } else { 4442b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4456aa95790SJeremy L Thompson } 446eaf62fffSJeremy L Thompson } 447eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 448eaf62fffSJeremy L Thompson } 449eaf62fffSJeremy L Thompson 450eaf62fffSJeremy L Thompson /** 451eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 452eaf62fffSJeremy L Thompson 453eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 454eaf62fffSJeremy L Thompson 455eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 456eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 457eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 458eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 459eaf62fffSJeremy L Thompson 460eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 461eaf62fffSJeremy L Thompson 462eaf62fffSJeremy L Thompson @ref Developer 463eaf62fffSJeremy L Thompson **/ 4642b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 465f3d47e36SJeremy L Thompson Ceed ceed; 466f3d47e36SJeremy L Thompson bool is_composite; 467506b1a0cSSebastian Grimberg CeedSize num_nodes_in, num_nodes_out, count = 0; 468506b1a0cSSebastian Grimberg CeedInt num_elem_in, elem_size_in, num_comp_in, layout_er_in[3]; 469506b1a0cSSebastian Grimberg CeedInt num_elem_out, elem_size_out, num_comp_out, layout_er_out[3], local_num_entries; 4701c66c397SJeremy L Thompson CeedScalar *array; 471506b1a0cSSebastian Grimberg const CeedScalar *elem_dof_a_in, *elem_dof_a_out; 472506b1a0cSSebastian Grimberg CeedVector index_vec_in, index_vec_out, elem_dof_in, elem_dof_out; 473506b1a0cSSebastian Grimberg CeedElemRestriction elem_rstr_in, elem_rstr_out, index_elem_rstr_in, index_elem_rstr_out; 4741c66c397SJeremy L Thompson 475f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 476f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 4776574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 478eaf62fffSJeremy L Thompson 479506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes_in, &num_nodes_out)); 480506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetActiveElemRestrictions(op, &elem_rstr_in, &elem_rstr_out)); 481506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_in, &num_elem_in)); 482506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_in, &elem_size_in)); 483506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_in, &num_comp_in)); 484506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetELayout(elem_rstr_in, &layout_er_in)); 485eaf62fffSJeremy L Thompson 486506b1a0cSSebastian Grimberg // Determine elem_dof relation for input 487506b1a0cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed, num_nodes_in, &index_vec_in)); 488506b1a0cSSebastian Grimberg CeedCall(CeedVectorGetArrayWrite(index_vec_in, CEED_MEM_HOST, &array)); 489506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < num_nodes_in; i++) array[i] = i; 490506b1a0cSSebastian Grimberg CeedCall(CeedVectorRestoreArray(index_vec_in, &array)); 491506b1a0cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed, num_elem_in * elem_size_in * num_comp_in, &elem_dof_in)); 492506b1a0cSSebastian Grimberg CeedCall(CeedVectorSetValue(elem_dof_in, 0.0)); 493506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr_in, &index_elem_rstr_in)); 494506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionApply(index_elem_rstr_in, CEED_NOTRANSPOSE, index_vec_in, elem_dof_in, CEED_REQUEST_IMMEDIATE)); 495506b1a0cSSebastian Grimberg CeedCall(CeedVectorGetArrayRead(elem_dof_in, CEED_MEM_HOST, &elem_dof_a_in)); 496506b1a0cSSebastian Grimberg CeedCall(CeedVectorDestroy(&index_vec_in)); 497506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&index_elem_rstr_in)); 498506b1a0cSSebastian Grimberg 499506b1a0cSSebastian Grimberg if (elem_rstr_in != elem_rstr_out) { 500506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_out, &num_elem_out)); 501506b1a0cSSebastian Grimberg CeedCheck(num_elem_in == num_elem_out, ceed, CEED_ERROR_UNSUPPORTED, 502506b1a0cSSebastian Grimberg "Active input and output operator restrictions must have the same number of elements"); 503506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_out, &elem_size_out)); 504506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_out, &num_comp_out)); 505506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetELayout(elem_rstr_out, &layout_er_out)); 506506b1a0cSSebastian Grimberg 507506b1a0cSSebastian Grimberg // Determine elem_dof relation for output 508506b1a0cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed, num_nodes_out, &index_vec_out)); 509506b1a0cSSebastian Grimberg CeedCall(CeedVectorGetArrayWrite(index_vec_out, CEED_MEM_HOST, &array)); 510506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < num_nodes_out; i++) array[i] = i; 511506b1a0cSSebastian Grimberg CeedCall(CeedVectorRestoreArray(index_vec_out, &array)); 512506b1a0cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed, num_elem_out * elem_size_out * num_comp_out, &elem_dof_out)); 513506b1a0cSSebastian Grimberg CeedCall(CeedVectorSetValue(elem_dof_out, 0.0)); 514506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr_out, &index_elem_rstr_out)); 515506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionApply(index_elem_rstr_out, CEED_NOTRANSPOSE, index_vec_out, elem_dof_out, CEED_REQUEST_IMMEDIATE)); 516506b1a0cSSebastian Grimberg CeedCall(CeedVectorGetArrayRead(elem_dof_out, CEED_MEM_HOST, &elem_dof_a_out)); 517506b1a0cSSebastian Grimberg CeedCall(CeedVectorDestroy(&index_vec_out)); 518506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&index_elem_rstr_out)); 519506b1a0cSSebastian Grimberg } else { 520506b1a0cSSebastian Grimberg num_elem_out = num_elem_in; 521506b1a0cSSebastian Grimberg elem_size_out = elem_size_in; 522506b1a0cSSebastian Grimberg num_comp_out = num_comp_in; 523506b1a0cSSebastian Grimberg layout_er_out[0] = layout_er_in[0]; 524506b1a0cSSebastian Grimberg layout_er_out[1] = layout_er_in[1]; 525506b1a0cSSebastian Grimberg layout_er_out[2] = layout_er_in[2]; 526506b1a0cSSebastian Grimberg elem_dof_a_out = elem_dof_a_in; 527506b1a0cSSebastian Grimberg } 528506b1a0cSSebastian Grimberg local_num_entries = elem_size_out * num_comp_out * elem_size_in * num_comp_in * num_elem_in; 529eaf62fffSJeremy L Thompson 530eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 531506b1a0cSSebastian Grimberg for (CeedInt e = 0; e < num_elem_in; e++) { 532506b1a0cSSebastian Grimberg for (CeedInt comp_in = 0; comp_in < num_comp_in; comp_in++) { 533506b1a0cSSebastian Grimberg for (CeedInt comp_out = 0; comp_out < num_comp_out; comp_out++) { 534506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 535506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 536506b1a0cSSebastian Grimberg const CeedInt elem_dof_index_row = i * layout_er_out[0] + comp_out * layout_er_out[1] + e * layout_er_out[2]; 537506b1a0cSSebastian Grimberg const CeedInt elem_dof_index_col = j * layout_er_in[0] + comp_in * layout_er_in[1] + e * layout_er_in[2]; 538506b1a0cSSebastian Grimberg const CeedInt row = elem_dof_a_out[elem_dof_index_row]; 539506b1a0cSSebastian Grimberg const CeedInt col = elem_dof_a_in[elem_dof_index_col]; 540eaf62fffSJeremy L Thompson 541eaf62fffSJeremy L Thompson rows[offset + count] = row; 542eaf62fffSJeremy L Thompson cols[offset + count] = col; 543eaf62fffSJeremy L Thompson count++; 544eaf62fffSJeremy L Thompson } 545eaf62fffSJeremy L Thompson } 546eaf62fffSJeremy L Thompson } 547eaf62fffSJeremy L Thompson } 548eaf62fffSJeremy L Thompson } 5496574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 550506b1a0cSSebastian Grimberg CeedCall(CeedVectorRestoreArrayRead(elem_dof_in, &elem_dof_a_in)); 551506b1a0cSSebastian Grimberg CeedCall(CeedVectorDestroy(&elem_dof_in)); 552506b1a0cSSebastian Grimberg if (elem_rstr_in != elem_rstr_out) { 553506b1a0cSSebastian Grimberg CeedCall(CeedVectorRestoreArrayRead(elem_dof_out, &elem_dof_a_out)); 554506b1a0cSSebastian Grimberg CeedCall(CeedVectorDestroy(&elem_dof_out)); 555506b1a0cSSebastian Grimberg } 556eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 557eaf62fffSJeremy L Thompson } 558eaf62fffSJeremy L Thompson 559eaf62fffSJeremy L Thompson /** 560eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 561eaf62fffSJeremy L Thompson 562eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 563eaf62fffSJeremy L Thompson 564eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 565ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 566eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 567eaf62fffSJeremy L Thompson 568eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 569eaf62fffSJeremy L Thompson 570eaf62fffSJeremy L Thompson @ref Developer 571eaf62fffSJeremy L Thompson **/ 5722b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 573f3d47e36SJeremy L Thompson Ceed ceed; 574f3d47e36SJeremy L Thompson bool is_composite; 5751c66c397SJeremy L Thompson 576f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 577f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 5786574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 579f3d47e36SJeremy L Thompson 580f3d47e36SJeremy L Thompson // Early exit for empty operator 581f3d47e36SJeremy L Thompson { 582f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 583f3d47e36SJeremy L Thompson 584f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 585f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 586f3d47e36SJeremy L Thompson } 587eaf62fffSJeremy L Thompson 588cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 589cefa2673SJeremy L Thompson // Backend version 5902b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 591cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 592cefa2673SJeremy L Thompson } else { 593cefa2673SJeremy L Thompson // Operator fallback 594cefa2673SJeremy L Thompson CeedOperator op_fallback; 595cefa2673SJeremy L Thompson 5962b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 597cefa2673SJeremy L Thompson if (op_fallback) { 5982b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 599cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 600cefa2673SJeremy L Thompson } 601cefa2673SJeremy L Thompson } 602cefa2673SJeremy L Thompson 603eaf62fffSJeremy L Thompson // Assemble QFunction 604506b1a0cSSebastian Grimberg CeedInt layout_qf[3]; 6051c66c397SJeremy L Thompson const CeedScalar *assembled_qf_array; 606c5f45aeaSJeremy L Thompson CeedVector assembled_qf = NULL; 607506b1a0cSSebastian Grimberg CeedElemRestriction assembled_elem_rstr = NULL; 608eaf62fffSJeremy L Thompson 609506b1a0cSSebastian Grimberg CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, CEED_REQUEST_IMMEDIATE)); 610506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout_qf)); 611506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr)); 612506b1a0cSSebastian Grimberg CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 613eaf62fffSJeremy L Thompson 614ed9e99e6SJeremy L Thompson // Get assembly data 615506b1a0cSSebastian Grimberg CeedInt num_elem_in, elem_size_in, num_comp_in, num_qpts_in; 616506b1a0cSSebastian Grimberg CeedInt num_elem_out, elem_size_out, num_comp_out, num_qpts_out, local_num_entries; 617506b1a0cSSebastian Grimberg const CeedEvalMode **eval_modes_in, **eval_modes_out; 618506b1a0cSSebastian Grimberg CeedInt num_active_bases_in, *num_eval_modes_in, num_active_bases_out, *num_eval_modes_out; 619506b1a0cSSebastian Grimberg CeedBasis *active_bases_in, *active_bases_out, basis_in, basis_out; 620506b1a0cSSebastian Grimberg const CeedScalar **B_mats_in, **B_mats_out, *B_mat_in, *B_mat_out; 621506b1a0cSSebastian Grimberg CeedElemRestriction elem_rstr_in, elem_rstr_out; 622506b1a0cSSebastian Grimberg CeedRestrictionType elem_rstr_type_in, elem_rstr_type_out; 623506b1a0cSSebastian Grimberg const bool *elem_rstr_orients_in = NULL, *elem_rstr_orients_out = NULL; 624506b1a0cSSebastian Grimberg const CeedInt8 *elem_rstr_curl_orients_in = NULL, *elem_rstr_curl_orients_out = NULL; 625506b1a0cSSebastian Grimberg CeedOperatorAssemblyData data; 626eaf62fffSJeremy L Thompson 627506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 628506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases_in, &num_eval_modes_in, &eval_modes_in, NULL, &num_active_bases_out, 629506b1a0cSSebastian Grimberg &num_eval_modes_out, &eval_modes_out, NULL, NULL)); 630506b1a0cSSebastian Grimberg 631506b1a0cSSebastian Grimberg CeedCheck(num_active_bases_in == num_active_bases_out && num_active_bases_in == 1, ceed, CEED_ERROR_UNSUPPORTED, 632506b1a0cSSebastian Grimberg "Cannot assemble operator with multiple active bases"); 6336574a04fSJeremy L Thompson CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator without inputs/outputs"); 634eaf62fffSJeremy L Thompson 635506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases_in, &B_mats_in, NULL, &active_bases_out, &B_mats_out)); 636506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetActiveElemRestrictions(op, &elem_rstr_in, &elem_rstr_out)); 637506b1a0cSSebastian Grimberg basis_in = active_bases_in[0]; 638506b1a0cSSebastian Grimberg basis_out = active_bases_out[0]; 639506b1a0cSSebastian Grimberg B_mat_in = B_mats_in[0]; 640506b1a0cSSebastian Grimberg B_mat_out = B_mats_out[0]; 641eaf62fffSJeremy L Thompson 642506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_in, &num_elem_in)); 643506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_in, &elem_size_in)); 644506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_in, &num_comp_in)); 645506b1a0cSSebastian Grimberg if (basis_in == CEED_BASIS_NONE) num_qpts_in = elem_size_in; 646506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts_in)); 647506b1a0cSSebastian Grimberg 648506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetType(elem_rstr_in, &elem_rstr_type_in)); 649506b1a0cSSebastian Grimberg if (elem_rstr_type_in == CEED_RESTRICTION_ORIENTED) { 650506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetOrientations(elem_rstr_in, CEED_MEM_HOST, &elem_rstr_orients_in)); 651506b1a0cSSebastian Grimberg } else if (elem_rstr_type_in == CEED_RESTRICTION_CURL_ORIENTED) { 652506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetCurlOrientations(elem_rstr_in, CEED_MEM_HOST, &elem_rstr_curl_orients_in)); 6537c1dbaffSSebastian Grimberg } 6547c1dbaffSSebastian Grimberg 655506b1a0cSSebastian Grimberg if (elem_rstr_in != elem_rstr_out) { 656506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_out, &num_elem_out)); 657506b1a0cSSebastian Grimberg CeedCheck(num_elem_in == num_elem_out, ceed, CEED_ERROR_UNSUPPORTED, 658506b1a0cSSebastian Grimberg "Active input and output operator restrictions must have the same number of elements"); 659506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_out, &elem_size_out)); 660506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_out, &num_comp_out)); 661506b1a0cSSebastian Grimberg if (basis_out == CEED_BASIS_NONE) num_qpts_out = elem_size_out; 662506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(basis_out, &num_qpts_out)); 663506b1a0cSSebastian Grimberg CeedCheck(num_qpts_in == num_qpts_out, ceed, CEED_ERROR_UNSUPPORTED, 664506b1a0cSSebastian Grimberg "Active input and output bases must have the same number of quadrature points"); 665eaf62fffSJeremy L Thompson 666506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetType(elem_rstr_out, &elem_rstr_type_out)); 667506b1a0cSSebastian Grimberg if (elem_rstr_type_out == CEED_RESTRICTION_ORIENTED) { 668506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetOrientations(elem_rstr_out, CEED_MEM_HOST, &elem_rstr_orients_out)); 669506b1a0cSSebastian Grimberg } else if (elem_rstr_type_out == CEED_RESTRICTION_CURL_ORIENTED) { 670506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetCurlOrientations(elem_rstr_out, CEED_MEM_HOST, &elem_rstr_curl_orients_out)); 671506b1a0cSSebastian Grimberg } 672506b1a0cSSebastian Grimberg } else { 673506b1a0cSSebastian Grimberg num_elem_out = num_elem_in; 674506b1a0cSSebastian Grimberg elem_size_out = elem_size_in; 675506b1a0cSSebastian Grimberg num_comp_out = num_comp_in; 676506b1a0cSSebastian Grimberg num_qpts_out = num_qpts_in; 677506b1a0cSSebastian Grimberg 678506b1a0cSSebastian Grimberg elem_rstr_orients_out = elem_rstr_orients_in; 679506b1a0cSSebastian Grimberg elem_rstr_curl_orients_out = elem_rstr_curl_orients_in; 680506b1a0cSSebastian Grimberg } 681506b1a0cSSebastian Grimberg local_num_entries = elem_size_out * num_comp_out * elem_size_in * num_comp_in * num_elem_in; 682506b1a0cSSebastian Grimberg 683506b1a0cSSebastian Grimberg // Loop over elements and put in data structure 6847c1dbaffSSebastian Grimberg // We store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 6851c66c397SJeremy L Thompson CeedSize count = 0; 686*123d890dSSebastian Grimberg CeedScalar *vals, *BTD_mat = NULL, *elem_mat = NULL, *elem_mat_b = NULL; 687506b1a0cSSebastian Grimberg 688*123d890dSSebastian Grimberg CeedCall(CeedCalloc(elem_size_out * num_qpts_in * num_eval_modes_in[0], &BTD_mat)); 689*123d890dSSebastian Grimberg CeedCall(CeedCalloc(elem_size_out * elem_size_in, &elem_mat)); 690506b1a0cSSebastian Grimberg if (elem_rstr_curl_orients_in || elem_rstr_curl_orients_out) CeedCall(CeedCalloc(elem_size_out * elem_size_in, &elem_mat_b)); 6911c66c397SJeremy L Thompson 69228ec399dSJeremy L Thompson CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals)); 693506b1a0cSSebastian Grimberg for (CeedSize e = 0; e < num_elem_in; e++) { 694506b1a0cSSebastian Grimberg for (CeedInt comp_in = 0; comp_in < num_comp_in; comp_in++) { 695506b1a0cSSebastian Grimberg for (CeedInt comp_out = 0; comp_out < num_comp_out; comp_out++) { 696ed9e99e6SJeremy L Thompson // Compute B^T*D 697506b1a0cSSebastian Grimberg for (CeedSize n = 0; n < elem_size_out; n++) { 698506b1a0cSSebastian Grimberg for (CeedSize q = 0; q < num_qpts_in; q++) { 699437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) { 700506b1a0cSSebastian Grimberg const CeedSize btd_index = n * (num_qpts_in * num_eval_modes_in[0]) + q * num_eval_modes_in[0] + e_in; 701067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 7021c66c397SJeremy L Thompson 703437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) { 704506b1a0cSSebastian Grimberg const CeedSize b_out_index = (q * num_eval_modes_out[0] + e_out) * elem_size_out + n; 705506b1a0cSSebastian Grimberg const CeedSize eval_mode_index = ((e_in * num_comp_in + comp_in) * num_eval_modes_out[0] + e_out) * num_comp_out + comp_out; 706b94338b9SJed Brown const CeedSize qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 7071c66c397SJeremy L Thompson 708067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 709eaf62fffSJeremy L Thompson } 710067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 711ed9e99e6SJeremy L Thompson } 712ed9e99e6SJeremy L Thompson } 713eaf62fffSJeremy L Thompson } 7147c1dbaffSSebastian Grimberg 7157c1dbaffSSebastian Grimberg // Form element matrix itself (for each block component) 716506b1a0cSSebastian Grimberg CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size_out, elem_size_in, num_qpts_in * num_eval_modes_in[0])); 717eaf62fffSJeremy L Thompson 7187c1dbaffSSebastian Grimberg // Transform the element matrix if required 719506b1a0cSSebastian Grimberg if (elem_rstr_orients_out) { 720506b1a0cSSebastian Grimberg const bool *elem_orients = &elem_rstr_orients_out[e * elem_size_out]; 7211c66c397SJeremy L Thompson 722506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 723506b1a0cSSebastian Grimberg const double orient = elem_orients[i] ? -1.0 : 1.0; 724506b1a0cSSebastian Grimberg 725506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 726506b1a0cSSebastian Grimberg elem_mat[i * elem_size_in + j] *= orient; 7277c1dbaffSSebastian Grimberg } 7287c1dbaffSSebastian Grimberg } 729506b1a0cSSebastian Grimberg } else if (elem_rstr_curl_orients_out) { 730506b1a0cSSebastian Grimberg const CeedInt8 *elem_curl_orients = &elem_rstr_curl_orients_out[e * 3 * elem_size_out]; 7311c66c397SJeremy L Thompson 7327c1dbaffSSebastian Grimberg // T^T*(B^T*D*B) 733506b1a0cSSebastian Grimberg memcpy(elem_mat_b, elem_mat, elem_size_out * elem_size_in * sizeof(CeedScalar)); 734506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 735506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 736506b1a0cSSebastian Grimberg elem_mat[i * elem_size_in + j] = elem_mat_b[i * elem_size_in + j] * elem_curl_orients[3 * i + 1] + 737506b1a0cSSebastian Grimberg (i > 0 ? elem_mat_b[(i - 1) * elem_size_in + j] * elem_curl_orients[3 * i - 1] : 0.0) + 738506b1a0cSSebastian Grimberg (i < elem_size_out - 1 ? elem_mat_b[(i + 1) * elem_size_in + j] * elem_curl_orients[3 * i + 3] : 0.0); 7397c1dbaffSSebastian Grimberg } 7407c1dbaffSSebastian Grimberg } 741506b1a0cSSebastian Grimberg } 742506b1a0cSSebastian Grimberg if (elem_rstr_orients_in) { 743506b1a0cSSebastian Grimberg const bool *elem_orients = &elem_rstr_orients_in[e * elem_size_in]; 744506b1a0cSSebastian Grimberg 745506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 746506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 747506b1a0cSSebastian Grimberg elem_mat[i * elem_size_in + j] *= elem_orients[j] ? -1.0 : 1.0; 748506b1a0cSSebastian Grimberg } 749506b1a0cSSebastian Grimberg } 750506b1a0cSSebastian Grimberg } else if (elem_rstr_curl_orients_in) { 751506b1a0cSSebastian Grimberg const CeedInt8 *elem_curl_orients = &elem_rstr_curl_orients_in[e * 3 * elem_size_in]; 752506b1a0cSSebastian Grimberg 753506b1a0cSSebastian Grimberg // (B^T*D*B)*T 754506b1a0cSSebastian Grimberg memcpy(elem_mat_b, elem_mat, elem_size_out * elem_size_in * sizeof(CeedScalar)); 755506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 756506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 757506b1a0cSSebastian Grimberg elem_mat[i * elem_size_in + j] = elem_mat_b[i * elem_size_in + j] * elem_curl_orients[3 * j + 1] + 758506b1a0cSSebastian Grimberg (j > 0 ? elem_mat_b[i * elem_size_in + j - 1] * elem_curl_orients[3 * j - 1] : 0.0) + 759506b1a0cSSebastian Grimberg (j < elem_size_in - 1 ? elem_mat_b[i * elem_size_in + j + 1] * elem_curl_orients[3 * j + 3] : 0.0); 7607c1dbaffSSebastian Grimberg } 7617c1dbaffSSebastian Grimberg } 7627c1dbaffSSebastian Grimberg } 7637c1dbaffSSebastian Grimberg 7647c1dbaffSSebastian Grimberg // Put element matrix in coordinate data structure 765506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < elem_size_out; i++) { 766506b1a0cSSebastian Grimberg for (CeedInt j = 0; j < elem_size_in; j++) { 767506b1a0cSSebastian Grimberg vals[offset + count] = elem_mat[i * elem_size_in + j]; 768eaf62fffSJeremy L Thompson count++; 769eaf62fffSJeremy L Thompson } 770eaf62fffSJeremy L Thompson } 771eaf62fffSJeremy L Thompson } 772eaf62fffSJeremy L Thompson } 773eaf62fffSJeremy L Thompson } 7746574a04fSJeremy L Thompson CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries"); 7752b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 776eaf62fffSJeremy L Thompson 777506b1a0cSSebastian Grimberg // Cleanup 778*123d890dSSebastian Grimberg CeedCall(CeedFree(&BTD_mat)); 779*123d890dSSebastian Grimberg CeedCall(CeedFree(&elem_mat)); 780506b1a0cSSebastian Grimberg CeedCall(CeedFree(&elem_mat_b)); 781506b1a0cSSebastian Grimberg if (elem_rstr_type_in == CEED_RESTRICTION_ORIENTED) { 782506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreOrientations(elem_rstr_in, &elem_rstr_orients_in)); 783506b1a0cSSebastian Grimberg } else if (elem_rstr_type_in == CEED_RESTRICTION_CURL_ORIENTED) { 784506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreCurlOrientations(elem_rstr_in, &elem_rstr_curl_orients_in)); 785506b1a0cSSebastian Grimberg } 786506b1a0cSSebastian Grimberg if (elem_rstr_in != elem_rstr_out) { 787506b1a0cSSebastian Grimberg if (elem_rstr_type_out == CEED_RESTRICTION_ORIENTED) { 788506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreOrientations(elem_rstr_out, &elem_rstr_orients_out)); 789506b1a0cSSebastian Grimberg } else if (elem_rstr_type_out == CEED_RESTRICTION_CURL_ORIENTED) { 790506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreCurlOrientations(elem_rstr_out, &elem_rstr_curl_orients_out)); 791506b1a0cSSebastian Grimberg } 792506b1a0cSSebastian Grimberg } 7932b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 7942b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 795eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 796eaf62fffSJeremy L Thompson } 797eaf62fffSJeremy L Thompson 798eaf62fffSJeremy L Thompson /** 799eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 800eaf62fffSJeremy L Thompson 801eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 802eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 803eaf62fffSJeremy L Thompson 804eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 805eaf62fffSJeremy L Thompson 806eaf62fffSJeremy L Thompson @ref Utility 807eaf62fffSJeremy L Thompson **/ 808b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) { 809b275c451SJeremy L Thompson bool is_composite; 810506b1a0cSSebastian Grimberg CeedInt num_elem_in, elem_size_in, num_comp_in, num_elem_out, elem_size_out, num_comp_out; 811506b1a0cSSebastian Grimberg CeedElemRestriction rstr_in, rstr_out; 812eaf62fffSJeremy L Thompson 813b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 8146574a04fSJeremy L Thompson CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 815506b1a0cSSebastian Grimberg 816506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetActiveElemRestrictions(op, &rstr_in, &rstr_out)); 817506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem_in)); 818506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size_in)); 819506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp_in)); 820506b1a0cSSebastian Grimberg if (rstr_in != rstr_out) { 821506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(rstr_out, &num_elem_out)); 822506b1a0cSSebastian Grimberg CeedCheck(num_elem_in == num_elem_out, op->ceed, CEED_ERROR_UNSUPPORTED, 823506b1a0cSSebastian Grimberg "Active input and output operator restrictions must have the same number of elements"); 824506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(rstr_out, &elem_size_out)); 825506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(rstr_out, &num_comp_out)); 826506b1a0cSSebastian Grimberg } else { 827506b1a0cSSebastian Grimberg num_elem_out = num_elem_in; 828506b1a0cSSebastian Grimberg elem_size_out = elem_size_in; 829506b1a0cSSebastian Grimberg num_comp_out = num_comp_in; 830506b1a0cSSebastian Grimberg } 831506b1a0cSSebastian Grimberg *num_entries = (CeedSize)elem_size_in * num_comp_in * elem_size_out * num_comp_out * num_elem_in; 832eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 833eaf62fffSJeremy L Thompson } 834eaf62fffSJeremy L Thompson 835eaf62fffSJeremy L Thompson /** 836ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 837eaf62fffSJeremy L Thompson 838eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 83985bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 840eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 841eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 84285bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 843eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 84485bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 8457758292fSSebastian Grimberg @param[out] op_restrict Fine to coarse operator, or NULL 846eaf62fffSJeremy L Thompson 847eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 848eaf62fffSJeremy L Thompson 849eaf62fffSJeremy L Thompson @ref Developer 850eaf62fffSJeremy L Thompson **/ 8512b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 8527758292fSSebastian Grimberg CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 8531c66c397SJeremy L Thompson bool is_composite; 854eaf62fffSJeremy L Thompson Ceed ceed; 8551c66c397SJeremy L Thompson CeedInt num_comp; 85685bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 8571c66c397SJeremy L Thompson CeedElemRestriction rstr_p_mult_fine = NULL, rstr_fine = NULL; 8581c66c397SJeremy L Thompson 8592b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 860eaf62fffSJeremy L Thompson 861eaf62fffSJeremy L Thompson // Check for composite operator 8622b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 8636574a04fSJeremy L Thompson CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 864eaf62fffSJeremy L Thompson 865eaf62fffSJeremy L Thompson // Coarse Grid 8662b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 867eaf62fffSJeremy L Thompson // -- Clone input fields 86892ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 869eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 870437c7c90SJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_rstr; 8712b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 872eaf62fffSJeremy L Thompson } else { 873437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr, 8742b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 875eaf62fffSJeremy L Thompson } 876eaf62fffSJeremy L Thompson } 877eaf62fffSJeremy L Thompson // -- Clone output fields 87892ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 879eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 8802b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 881eaf62fffSJeremy L Thompson } else { 882437c7c90SJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr, 8832b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 884eaf62fffSJeremy L Thompson } 885eaf62fffSJeremy L Thompson } 886af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 8872b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 888eaf62fffSJeremy L Thompson 889eaf62fffSJeremy L Thompson // Multiplicity vector 8907758292fSSebastian Grimberg if (op_restrict || op_prolong) { 89185bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 8921c66c397SJeremy L Thompson CeedRestrictionType rstr_type; 89385bb9dcfSJeremy L Thompson 8947c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionGetType(rstr_fine, &rstr_type)); 8957c1dbaffSSebastian Grimberg CeedCheck(rstr_type != CEED_RESTRICTION_CURL_ORIENTED, ceed, CEED_ERROR_UNSUPPORTED, 8967c1dbaffSSebastian Grimberg "Element restrictions created with CeedElemRestrictionCreateCurlOriented are not supported"); 8976574a04fSJeremy L Thompson CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 8987c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine)); 8992b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 9002b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 901c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 9022b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 903c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 9042b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 9052b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 90685bb9dcfSJeremy L Thompson } 907eaf62fffSJeremy L Thompson 908addd79feSZach Atkins // Clone name 909addd79feSZach Atkins bool has_name = op_fine->name; 910addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 911addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 912addd79feSZach Atkins 9137758292fSSebastian Grimberg // Check that coarse to fine basis is provided if prolong/restrict operators are requested 9147758292fSSebastian Grimberg CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE, 9156574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine basis"); 91683d6adf3SZach Atkins 91785bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 9182b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 919addd79feSZach Atkins 920addd79feSZach Atkins // Restriction 9217758292fSSebastian Grimberg if (op_restrict) { 922eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 92385bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 9247758292fSSebastian Grimberg CeedQFunction qf_restrict; 92585bb9dcfSJeremy L Thompson 9267758292fSSebastian Grimberg CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 9272b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 928eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 9292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 9302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 9317758292fSSebastian Grimberg CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 9322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 9337758292fSSebastian Grimberg CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 9347758292fSSebastian Grimberg CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 9357758292fSSebastian Grimberg CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 9367758292fSSebastian Grimberg CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 937eaf62fffSJeremy L Thompson 9387758292fSSebastian Grimberg CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 9397758292fSSebastian Grimberg CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE)); 9407758292fSSebastian Grimberg CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_NONE, mult_vec)); 9417758292fSSebastian Grimberg CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 942eaf62fffSJeremy L Thompson 943addd79feSZach Atkins // Set name 944addd79feSZach Atkins char *restriction_name; 9451c66c397SJeremy L Thompson 946addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 947addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 9487758292fSSebastian Grimberg CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 949addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 950addd79feSZach Atkins 951addd79feSZach Atkins // Check 9527758292fSSebastian Grimberg CeedCall(CeedOperatorCheckReady(*op_restrict)); 953addd79feSZach Atkins 954addd79feSZach Atkins // Cleanup 9557758292fSSebastian Grimberg CeedCall(CeedQFunctionDestroy(&qf_restrict)); 956addd79feSZach Atkins } 957addd79feSZach Atkins 958eaf62fffSJeremy L Thompson // Prolongation 959addd79feSZach Atkins if (op_prolong) { 960eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 96185bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 9621c66c397SJeremy L Thompson CeedQFunction qf_prolong; 96385bb9dcfSJeremy L Thompson 96485bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 9652b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 966eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 9672b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 9682b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 9692b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 9702b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 9712b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 9722b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 9732b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 9742b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 975eaf62fffSJeremy L Thompson 9762b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 9772b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 978356036faSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_NONE, mult_vec)); 979356036faSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE)); 980eaf62fffSJeremy L Thompson 981addd79feSZach Atkins // Set name 982ea6b5821SJeremy L Thompson char *prolongation_name; 9831c66c397SJeremy L Thompson 9842b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 9852b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 9862b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 9872b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 988addd79feSZach Atkins 989addd79feSZach Atkins // Check 990addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 991addd79feSZach Atkins 992addd79feSZach Atkins // Cleanup 993addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 994ea6b5821SJeremy L Thompson } 995ea6b5821SJeremy L Thompson 99658e4b056SJeremy L Thompson // Check 99758e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 99858e4b056SJeremy L Thompson 999eaf62fffSJeremy L Thompson // Cleanup 10002b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 1001c17ec2beSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine)); 10022b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 1003eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1004eaf62fffSJeremy L Thompson } 1005eaf62fffSJeremy L Thompson 1006eaf62fffSJeremy L Thompson /** 1007eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 1008eaf62fffSJeremy L Thompson 1009eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 1010eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 1011eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 1012eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 1013eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 1014eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 1015eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 1016eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 1017eaf62fffSJeremy L Thompson 1018eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1019eaf62fffSJeremy L Thompson 1020eaf62fffSJeremy L Thompson @ref Developer 1021eaf62fffSJeremy L Thompson **/ 10222c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff 10232c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d, 10242c2ea1dbSJeremy L Thompson CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 10252b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 1026eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 1027eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 10282b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 1029eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 1030eaf62fffSJeremy L Thompson } 10312b730f8bSJeremy L Thompson } 1032eaf62fffSJeremy L Thompson // -- Laplacian 10332b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 1034eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 1035eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 10361c66c397SJeremy L Thompson 10372b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 1038eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 1039eaf62fffSJeremy L Thompson } 10402b730f8bSJeremy L Thompson } 1041eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 10422b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 1043eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1044eaf62fffSJeremy L Thompson } 10452c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn 1046eaf62fffSJeremy L Thompson 1047eaf62fffSJeremy L Thompson /// @} 1048eaf62fffSJeremy L Thompson 1049eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1050480fae85SJeremy L Thompson /// CeedOperator Backend API 1051480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1052480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 1053480fae85SJeremy L Thompson /// @{ 1054480fae85SJeremy L Thompson 1055480fae85SJeremy L Thompson /** 1056506b1a0cSSebastian Grimberg @brief Create point block restriction for active operator field 1057506b1a0cSSebastian Grimberg 1058506b1a0cSSebastian Grimberg @param[in] rstr Original CeedElemRestriction for active field 1059506b1a0cSSebastian Grimberg @param[out] point_block_rstr Address of the variable where the newly created CeedElemRestriction will be stored 1060506b1a0cSSebastian Grimberg 1061506b1a0cSSebastian Grimberg @return An error code: 0 - success, otherwise - failure 1062506b1a0cSSebastian Grimberg 1063506b1a0cSSebastian Grimberg @ref Backend 1064506b1a0cSSebastian Grimberg **/ 1065506b1a0cSSebastian Grimberg int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *point_block_rstr) { 1066506b1a0cSSebastian Grimberg Ceed ceed; 1067506b1a0cSSebastian Grimberg CeedInt num_elem, num_comp, shift, elem_size, comp_stride, *point_block_offsets; 1068506b1a0cSSebastian Grimberg CeedSize l_size; 1069506b1a0cSSebastian Grimberg const CeedInt *offsets; 1070506b1a0cSSebastian Grimberg 1071506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 1072506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 1073506b1a0cSSebastian Grimberg 1074506b1a0cSSebastian Grimberg // Expand offsets 1075506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 1076506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 1077506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 1078506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 1079506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 1080506b1a0cSSebastian Grimberg shift = num_comp; 1081506b1a0cSSebastian Grimberg if (comp_stride != 1) shift *= num_comp; 1082506b1a0cSSebastian Grimberg CeedCall(CeedCalloc(num_elem * elem_size, &point_block_offsets)); 1083506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < num_elem * elem_size; i++) { 1084506b1a0cSSebastian Grimberg point_block_offsets[i] = offsets[i] * shift; 1085506b1a0cSSebastian Grimberg } 1086506b1a0cSSebastian Grimberg 1087506b1a0cSSebastian Grimberg // Create new restriction 1088506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 1089506b1a0cSSebastian Grimberg point_block_offsets, point_block_rstr)); 1090506b1a0cSSebastian Grimberg 1091506b1a0cSSebastian Grimberg // Cleanup 1092506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 1093506b1a0cSSebastian Grimberg return CEED_ERROR_SUCCESS; 1094506b1a0cSSebastian Grimberg } 1095506b1a0cSSebastian Grimberg 1096506b1a0cSSebastian Grimberg /** 1097480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 1098480fae85SJeremy L Thompson 1099480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 1100ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 1101480fae85SJeremy L Thompson 1102480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1103480fae85SJeremy L Thompson 1104480fae85SJeremy L Thompson @ref Backend 1105480fae85SJeremy L Thompson **/ 1106ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 11072b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1108480fae85SJeremy L Thompson (*data)->ref_count = 1; 1109480fae85SJeremy L Thompson (*data)->ceed = ceed; 11102b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1111480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1112480fae85SJeremy L Thompson } 1113480fae85SJeremy L Thompson 1114480fae85SJeremy L Thompson /** 1115480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 1116480fae85SJeremy L Thompson 1117ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 1118480fae85SJeremy L Thompson 1119480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1120480fae85SJeremy L Thompson 1121480fae85SJeremy L Thompson @ref Backend 1122480fae85SJeremy L Thompson **/ 1123480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 1124480fae85SJeremy L Thompson data->ref_count++; 1125480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1126480fae85SJeremy L Thompson } 1127480fae85SJeremy L Thompson 1128480fae85SJeremy L Thompson /** 1129beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 11308b919e6bSJeremy L Thompson 1131ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 1132ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 11338b919e6bSJeremy L Thompson 11348b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 11358b919e6bSJeremy L Thompson 11368b919e6bSJeremy L Thompson @ref Backend 11378b919e6bSJeremy L Thompson **/ 11382b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 1139beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 1140beecbf24SJeremy L Thompson data->needs_data_update = true; 1141beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 1142beecbf24SJeremy L Thompson } 1143beecbf24SJeremy L Thompson 1144beecbf24SJeremy L Thompson /** 1145beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 1146beecbf24SJeremy L Thompson 1147ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 1148ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 1149beecbf24SJeremy L Thompson 1150beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1151beecbf24SJeremy L Thompson 1152beecbf24SJeremy L Thompson @ref Backend 1153beecbf24SJeremy L Thompson **/ 11542b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 1155beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 11568b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 11578b919e6bSJeremy L Thompson } 11588b919e6bSJeremy L Thompson 11598b919e6bSJeremy L Thompson /** 11608b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 11618b919e6bSJeremy L Thompson 11628b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 11638b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 11648b919e6bSJeremy L Thompson 11658b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 11668b919e6bSJeremy L Thompson 11678b919e6bSJeremy L Thompson @ref Backend 11688b919e6bSJeremy L Thompson **/ 11692b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 1170beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 11718b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 11728b919e6bSJeremy L Thompson } 11738b919e6bSJeremy L Thompson 11748b919e6bSJeremy L Thompson /** 1175ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 11764385fb7fSSebastian Grimberg 1177ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 1178512bb800SJeremy L Thompson 1179512bb800SJeremy L Thompson Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a 1180512bb800SJeremy L Thompson CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this 1181512bb800SJeremy L Thompson CeedQFunctionAssemblyData. 1182480fae85SJeremy L Thompson 1183ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 1184ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 1185480fae85SJeremy L Thompson 1186480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1187480fae85SJeremy L Thompson 1188480fae85SJeremy L Thompson @ref Backend 1189480fae85SJeremy L Thompson **/ 11902b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 11912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 11922b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 1193480fae85SJeremy L Thompson *data_copy = data; 1194480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1195480fae85SJeremy L Thompson } 1196480fae85SJeremy L Thompson 1197480fae85SJeremy L Thompson /** 1198480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 1199480fae85SJeremy L Thompson 1200ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1201480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1202480fae85SJeremy L Thompson 1203480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1204480fae85SJeremy L Thompson 1205480fae85SJeremy L Thompson @ref Backend 1206480fae85SJeremy L Thompson **/ 12072b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1208480fae85SJeremy L Thompson *is_setup = data->is_setup; 1209480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1210480fae85SJeremy L Thompson } 1211480fae85SJeremy L Thompson 1212480fae85SJeremy L Thompson /** 1213480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1214480fae85SJeremy L Thompson 1215ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1216480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1217480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1218480fae85SJeremy L Thompson 1219480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1220480fae85SJeremy L Thompson 1221480fae85SJeremy L Thompson @ref Backend 1222480fae85SJeremy L Thompson **/ 12232b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 12242b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 12252b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1226480fae85SJeremy L Thompson 1227480fae85SJeremy L Thompson data->is_setup = true; 1228480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1229480fae85SJeremy L Thompson } 1230480fae85SJeremy L Thompson 12312b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 12326574a04fSJeremy L Thompson CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1233480fae85SJeremy L Thompson 12342b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 12352b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1236480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1237480fae85SJeremy L Thompson } 1238480fae85SJeremy L Thompson 1239480fae85SJeremy L Thompson /** 1240480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1241480fae85SJeremy L Thompson 1242ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1243480fae85SJeremy L Thompson 1244480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1245480fae85SJeremy L Thompson 1246480fae85SJeremy L Thompson @ref Backend 1247480fae85SJeremy L Thompson **/ 1248480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1249ad6481ceSJeremy L Thompson if (!*data || --(*data)->ref_count > 0) { 1250ad6481ceSJeremy L Thompson *data = NULL; 1251ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1252ad6481ceSJeremy L Thompson } 12532b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 12542b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 12552b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1256480fae85SJeremy L Thompson 12572b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1258480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1259480fae85SJeremy L Thompson } 1260480fae85SJeremy L Thompson 1261ed9e99e6SJeremy L Thompson /** 1262ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1263ed9e99e6SJeremy L Thompson 1264ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1265ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1266ed9e99e6SJeremy L Thompson 1267ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1268ed9e99e6SJeremy L Thompson 1269ed9e99e6SJeremy L Thompson @ref Backend 1270ed9e99e6SJeremy L Thompson **/ 12712b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1272ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1273ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1274ed9e99e6SJeremy L Thompson 12752b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1276ed9e99e6SJeremy L Thompson op->op_assembled = data; 1277ed9e99e6SJeremy L Thompson } 1278ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1279ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1280ed9e99e6SJeremy L Thompson } 1281ed9e99e6SJeremy L Thompson 1282ed9e99e6SJeremy L Thompson /** 1283ba746a46SJeremy L Thompson @brief Create object holding CeedOperator assembly data. 1284ba746a46SJeremy L Thompson 1285ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator. 1286ba746a46SJeremy L Thompson An array with references to the corresponding active CeedElemRestrictions is also stored. 1287ba746a46SJeremy L Thompson For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis. 1288ba746a46SJeremy L Thompson The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each 1289ba746a46SJeremy L Thompson CeedEvalMode. 1290ba746a46SJeremy L Thompson The number of input columns across all active bases for the assembled CeedQFunction is also stored. 1291ba746a46SJeremy L Thompson Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes. 1292ed9e99e6SJeremy L Thompson 1293ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1294ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1295ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1296ed9e99e6SJeremy L Thompson 1297ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1298ed9e99e6SJeremy L Thompson 1299ed9e99e6SJeremy L Thompson @ref Backend 1300ed9e99e6SJeremy L Thompson **/ 13012b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 1302506b1a0cSSebastian Grimberg CeedInt num_active_bases_in = 0, num_active_bases_out = 0, offset = 0; 1303506b1a0cSSebastian Grimberg CeedInt num_input_fields, *num_eval_modes_in = NULL, num_output_fields, *num_eval_modes_out = NULL; 13041c66c397SJeremy L Thompson CeedSize **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL; 13051c66c397SJeremy L Thompson CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL; 13061c66c397SJeremy L Thompson CeedQFunctionField *qf_fields; 13071c66c397SJeremy L Thompson CeedQFunction qf; 13081c66c397SJeremy L Thompson CeedOperatorField *op_fields; 130901f0e615SJames Wright bool is_composite; 131001f0e615SJames Wright 131101f0e615SJames Wright CeedCall(CeedOperatorIsComposite(op, &is_composite)); 131201f0e615SJames Wright CeedCheck(!is_composite, ceed, CEED_ERROR_INCOMPATIBLE, "Can only create CeedOperator assembly data for non-composite operators."); 1313437c7c90SJeremy L Thompson 1314437c7c90SJeremy L Thompson // Allocate 13152b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1316ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 13172b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1318ed9e99e6SJeremy L Thompson 1319ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 13202b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 13212b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 13222b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1323ed9e99e6SJeremy L Thompson 1324ed9e99e6SJeremy L Thompson // Determine active input basis 1325ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1326ed9e99e6SJeremy L Thompson CeedVector vec; 13271c66c397SJeremy L Thompson 13282b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1329ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 13307c1dbaffSSebastian Grimberg CeedInt index = -1, num_comp, q_comp; 13311c66c397SJeremy L Thompson CeedEvalMode eval_mode; 13321c66c397SJeremy L Thompson CeedBasis basis_in = NULL; 13331c66c397SJeremy L Thompson 13342b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 13352b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1336352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 1337352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp)); 1338506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < num_active_bases_in; i++) { 1339506b1a0cSSebastian Grimberg if ((*data)->active_bases_in[i] == basis_in) index = i; 1340437c7c90SJeremy L Thompson } 1341437c7c90SJeremy L Thompson if (index == -1) { 1342437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_in; 13431c66c397SJeremy L Thompson 1344506b1a0cSSebastian Grimberg index = num_active_bases_in; 1345506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->active_bases_in)); 1346506b1a0cSSebastian Grimberg (*data)->active_bases_in[num_active_bases_in] = NULL; 1347506b1a0cSSebastian Grimberg CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases_in[num_active_bases_in])); 1348506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->active_elem_rstrs_in)); 1349506b1a0cSSebastian Grimberg (*data)->active_elem_rstrs_in[num_active_bases_in] = NULL; 1350437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in)); 1351506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs_in[num_active_bases_in])); 1352506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &num_eval_modes_in)); 1353437c7c90SJeremy L Thompson num_eval_modes_in[index] = 0; 1354506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &eval_modes_in)); 1355437c7c90SJeremy L Thompson eval_modes_in[index] = NULL; 1356506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &eval_mode_offsets_in)); 1357437c7c90SJeremy L Thompson eval_mode_offsets_in[index] = NULL; 1358506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->assembled_bases_in)); 1359437c7c90SJeremy L Thompson (*data)->assembled_bases_in[index] = NULL; 1360506b1a0cSSebastian Grimberg num_active_bases_in++; 1361437c7c90SJeremy L Thompson } 1362352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1363352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1364352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index])); 1365352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index])); 1366352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1367437c7c90SJeremy L Thompson eval_modes_in[index][num_eval_modes_in[index] + d] = eval_mode; 1368437c7c90SJeremy L Thompson eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset; 1369352a5e7cSSebastian Grimberg offset += num_comp; 1370ed9e99e6SJeremy L Thompson } 1371352a5e7cSSebastian Grimberg num_eval_modes_in[index] += q_comp; 1372ed9e99e6SJeremy L Thompson } 1373ed9e99e6SJeremy L Thompson } 1374ed9e99e6SJeremy L Thompson } 1375ed9e99e6SJeremy L Thompson 1376ed9e99e6SJeremy L Thompson // Determine active output basis 13772b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 13782b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1379437c7c90SJeremy L Thompson offset = 0; 1380ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1381ed9e99e6SJeremy L Thompson CeedVector vec; 13821c66c397SJeremy L Thompson 13832b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1384ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 13857c1dbaffSSebastian Grimberg CeedInt index = -1, num_comp, q_comp; 13861c66c397SJeremy L Thompson CeedEvalMode eval_mode; 13871c66c397SJeremy L Thompson CeedBasis basis_out = NULL; 13881c66c397SJeremy L Thompson 1389437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 13902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1391352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp)); 1392352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp)); 1393506b1a0cSSebastian Grimberg for (CeedInt i = 0; i < num_active_bases_out; i++) { 1394506b1a0cSSebastian Grimberg if ((*data)->active_bases_out[i] == basis_out) index = i; 1395437c7c90SJeremy L Thompson } 1396437c7c90SJeremy L Thompson if (index == -1) { 1397437c7c90SJeremy L Thompson CeedElemRestriction elem_rstr_out; 13981c66c397SJeremy L Thompson 1399506b1a0cSSebastian Grimberg index = num_active_bases_out; 1400506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->active_bases_out)); 1401506b1a0cSSebastian Grimberg (*data)->active_bases_out[num_active_bases_out] = NULL; 1402506b1a0cSSebastian Grimberg CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases_out[num_active_bases_out])); 1403506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->active_elem_rstrs_out)); 1404506b1a0cSSebastian Grimberg (*data)->active_elem_rstrs_out[num_active_bases_out] = NULL; 1405437c7c90SJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out)); 1406506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs_out[num_active_bases_out])); 1407506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &num_eval_modes_out)); 1408437c7c90SJeremy L Thompson num_eval_modes_out[index] = 0; 1409506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &eval_modes_out)); 1410437c7c90SJeremy L Thompson eval_modes_out[index] = NULL; 1411506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &eval_mode_offsets_out)); 1412437c7c90SJeremy L Thompson eval_mode_offsets_out[index] = NULL; 1413506b1a0cSSebastian Grimberg CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->assembled_bases_out)); 1414437c7c90SJeremy L Thompson (*data)->assembled_bases_out[index] = NULL; 1415506b1a0cSSebastian Grimberg num_active_bases_out++; 1416437c7c90SJeremy L Thompson } 1417352a5e7cSSebastian Grimberg if (eval_mode != CEED_EVAL_WEIGHT) { 1418352a5e7cSSebastian Grimberg // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly 1419352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index])); 1420352a5e7cSSebastian Grimberg CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index])); 1421352a5e7cSSebastian Grimberg for (CeedInt d = 0; d < q_comp; d++) { 1422437c7c90SJeremy L Thompson eval_modes_out[index][num_eval_modes_out[index] + d] = eval_mode; 1423437c7c90SJeremy L Thompson eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset; 1424352a5e7cSSebastian Grimberg offset += num_comp; 1425ed9e99e6SJeremy L Thompson } 1426352a5e7cSSebastian Grimberg num_eval_modes_out[index] += q_comp; 1427ed9e99e6SJeremy L Thompson } 1428ed9e99e6SJeremy L Thompson } 1429ed9e99e6SJeremy L Thompson } 1430506b1a0cSSebastian Grimberg (*data)->num_active_bases_in = num_active_bases_in; 143127789c4aSJed Brown (*data)->num_eval_modes_in = num_eval_modes_in; 143227789c4aSJed Brown (*data)->eval_modes_in = eval_modes_in; 143327789c4aSJed Brown (*data)->eval_mode_offsets_in = eval_mode_offsets_in; 1434506b1a0cSSebastian Grimberg (*data)->num_active_bases_out = num_active_bases_out; 1435437c7c90SJeremy L Thompson (*data)->num_eval_modes_out = num_eval_modes_out; 1436437c7c90SJeremy L Thompson (*data)->eval_modes_out = eval_modes_out; 1437437c7c90SJeremy L Thompson (*data)->eval_mode_offsets_out = eval_mode_offsets_out; 1438506b1a0cSSebastian Grimberg (*data)->num_output_components = offset; 1439ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1440ed9e99e6SJeremy L Thompson } 1441ed9e99e6SJeremy L Thompson 1442ed9e99e6SJeremy L Thompson /** 1443ba746a46SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly. 1444ba746a46SJeremy L Thompson 1445ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1446ed9e99e6SJeremy L Thompson 1447ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1448506b1a0cSSebastian Grimberg @param[out] num_active_bases_in Total number of active bases for input 1449c5d0f995SJed Brown @param[out] num_eval_modes_in Pointer to hold array of numbers of input CeedEvalModes, or NULL. 1450ba746a46SJeremy L Thompson `eval_modes_in[0]` holds an array of eval modes for the first active basis. 1451c5d0f995SJed Brown @param[out] eval_modes_in Pointer to hold arrays of input CeedEvalModes, or NULL. 1452ba746a46SJeremy L Thompson @param[out] eval_mode_offsets_in Pointer to hold arrays of input offsets at each quadrature point. 1453506b1a0cSSebastian Grimberg @param[out] num_active_bases_out Total number of active bases for output 1454c5d0f995SJed Brown @param[out] num_eval_modes_out Pointer to hold array of numbers of output CeedEvalModes, or NULL 1455c5d0f995SJed Brown @param[out] eval_modes_out Pointer to hold arrays of output CeedEvalModes, or NULL. 1456437c7c90SJeremy L Thompson @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point 1457ba746a46SJeremy L Thompson @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point, 1458ba746a46SJeremy L Thompson including contributions of all active bases 1459ed9e99e6SJeremy L Thompson 1460ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1461ed9e99e6SJeremy L Thompson 1462ed9e99e6SJeremy L Thompson @ref Backend 1463ed9e99e6SJeremy L Thompson **/ 1464506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases_in, CeedInt **num_eval_modes_in, 1465506b1a0cSSebastian Grimberg const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt *num_active_bases_out, 1466506b1a0cSSebastian Grimberg CeedInt **num_eval_modes_out, const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, 1467506b1a0cSSebastian Grimberg CeedSize *num_output_components) { 1468506b1a0cSSebastian Grimberg if (num_active_bases_in) *num_active_bases_in = data->num_active_bases_in; 1469437c7c90SJeremy L Thompson if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in; 1470437c7c90SJeremy L Thompson if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in; 1471437c7c90SJeremy L Thompson if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in; 1472506b1a0cSSebastian Grimberg if (num_active_bases_out) *num_active_bases_out = data->num_active_bases_out; 1473437c7c90SJeremy L Thompson if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out; 1474437c7c90SJeremy L Thompson if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out; 1475437c7c90SJeremy L Thompson if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out; 1476437c7c90SJeremy L Thompson if (num_output_components) *num_output_components = data->num_output_components; 1477ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1478ed9e99e6SJeremy L Thompson } 1479ed9e99e6SJeremy L Thompson 1480ed9e99e6SJeremy L Thompson /** 1481ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1482ba746a46SJeremy L Thompson 1483ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1484ed9e99e6SJeremy L Thompson 1485ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1486506b1a0cSSebastian Grimberg @param[out] num_active_bases_in Number of active input bases, or NULL 1487506b1a0cSSebastian Grimberg @param[out] active_bases_in Pointer to hold active input CeedBasis, or NULL 1488437c7c90SJeremy L Thompson @param[out] assembled_bases_in Pointer to hold assembled active input B, or NULL 1489506b1a0cSSebastian Grimberg @param[out] num_active_bases_out Number of active output bases, or NULL 1490506b1a0cSSebastian Grimberg @param[out] active_bases_out Pointer to hold active output CeedBasis, or NULL 1491437c7c90SJeremy L Thompson @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL 1492ed9e99e6SJeremy L Thompson 1493ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1494ed9e99e6SJeremy L Thompson 1495ed9e99e6SJeremy L Thompson @ref Backend 1496ed9e99e6SJeremy L Thompson **/ 1497506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases_in, CeedBasis **active_bases_in, 1498506b1a0cSSebastian Grimberg const CeedScalar ***assembled_bases_in, CeedInt *num_active_bases_out, CeedBasis **active_bases_out, 1499506b1a0cSSebastian Grimberg const CeedScalar ***assembled_bases_out) { 1500ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1501437c7c90SJeremy L Thompson if (assembled_bases_in && !data->assembled_bases_in[0]) { 1502437c7c90SJeremy L Thompson CeedInt num_qpts; 1503437c7c90SJeremy L Thompson 1504506b1a0cSSebastian Grimberg if (data->active_bases_in[0] == CEED_BASIS_NONE) CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_in[0], &num_qpts)); 1505506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases_in[0], &num_qpts)); 1506506b1a0cSSebastian Grimberg for (CeedInt b = 0; b < data->num_active_bases_in; b++) { 15071c66c397SJeremy L Thompson bool has_eval_none = false; 1508352a5e7cSSebastian Grimberg CeedInt num_nodes; 1509437c7c90SJeremy L Thompson CeedScalar *B_in = NULL, *identity = NULL; 1510ed9e99e6SJeremy L Thompson 1511506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_in[b], &num_nodes)); 1512352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in)); 1513ed9e99e6SJeremy L Thompson 1514437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) { 1515437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE); 1516ed9e99e6SJeremy L Thompson } 1517ed9e99e6SJeremy L Thompson if (has_eval_none) { 1518352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1519352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1520352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1521ed9e99e6SJeremy L Thompson } 1522ed9e99e6SJeremy L Thompson } 1523ed9e99e6SJeremy L Thompson 1524ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1525352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1526352a5e7cSSebastian Grimberg CeedInt d_in = 0, q_comp_in; 1527352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE; 15281c66c397SJeremy L Thompson 1529437c7c90SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) { 1530437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_in[b] * q; 1531437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 15321c66c397SJeremy L Thompson 1533506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetBasisPointer(data->active_bases_in[b], data->eval_modes_in[b][e_in], identity, &B)); 1534506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases_in[b], data->eval_modes_in[b][e_in], &q_comp_in)); 1535352a5e7cSSebastian Grimberg if (q_comp_in > 1) { 1536352a5e7cSSebastian Grimberg if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0; 1537352a5e7cSSebastian Grimberg else B = &B[(++d_in) * num_qpts * num_nodes]; 1538352a5e7cSSebastian Grimberg } 1539352a5e7cSSebastian Grimberg eval_mode_in_prev = data->eval_modes_in[b][e_in]; 1540352a5e7cSSebastian Grimberg B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n]; 1541ed9e99e6SJeremy L Thompson } 1542ed9e99e6SJeremy L Thompson } 1543ed9e99e6SJeremy L Thompson } 15447c1dbaffSSebastian Grimberg if (identity) CeedCall(CeedFree(&identity)); 1545437c7c90SJeremy L Thompson data->assembled_bases_in[b] = B_in; 1546437c7c90SJeremy L Thompson } 1547ed9e99e6SJeremy L Thompson } 1548ed9e99e6SJeremy L Thompson 1549437c7c90SJeremy L Thompson if (assembled_bases_out && !data->assembled_bases_out[0]) { 1550437c7c90SJeremy L Thompson CeedInt num_qpts; 1551437c7c90SJeremy L Thompson 1552506b1a0cSSebastian Grimberg if (data->active_bases_out[0] == CEED_BASIS_NONE) CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_out[0], &num_qpts)); 1553506b1a0cSSebastian Grimberg else CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases_out[0], &num_qpts)); 1554506b1a0cSSebastian Grimberg for (CeedInt b = 0; b < data->num_active_bases_out; b++) { 1555ed9e99e6SJeremy L Thompson bool has_eval_none = false; 15561c66c397SJeremy L Thompson CeedInt num_nodes; 1557437c7c90SJeremy L Thompson CeedScalar *B_out = NULL, *identity = NULL; 1558ed9e99e6SJeremy L Thompson 1559506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_out[b], &num_nodes)); 1560352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out)); 1561ed9e99e6SJeremy L Thompson 1562437c7c90SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) { 1563437c7c90SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE); 1564ed9e99e6SJeremy L Thompson } 1565ed9e99e6SJeremy L Thompson if (has_eval_none) { 1566352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 1567352a5e7cSSebastian Grimberg for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) { 1568352a5e7cSSebastian Grimberg identity[i * num_nodes + i] = 1.0; 1569ed9e99e6SJeremy L Thompson } 1570ed9e99e6SJeremy L Thompson } 1571ed9e99e6SJeremy L Thompson 1572ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1573352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 1574352a5e7cSSebastian Grimberg CeedInt d_out = 0, q_comp_out; 1575352a5e7cSSebastian Grimberg CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE; 15761c66c397SJeremy L Thompson 1577437c7c90SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) { 1578437c7c90SJeremy L Thompson const CeedInt qq = data->num_eval_modes_out[b] * q; 1579437c7c90SJeremy L Thompson const CeedScalar *B = NULL; 15801c66c397SJeremy L Thompson 1581506b1a0cSSebastian Grimberg CeedCall(CeedOperatorGetBasisPointer(data->active_bases_out[b], data->eval_modes_out[b][e_out], identity, &B)); 1582506b1a0cSSebastian Grimberg CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases_out[b], data->eval_modes_out[b][e_out], &q_comp_out)); 1583352a5e7cSSebastian Grimberg if (q_comp_out > 1) { 1584352a5e7cSSebastian Grimberg if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0; 1585352a5e7cSSebastian Grimberg else B = &B[(++d_out) * num_qpts * num_nodes]; 1586352a5e7cSSebastian Grimberg } 1587352a5e7cSSebastian Grimberg eval_mode_out_prev = data->eval_modes_out[b][e_out]; 1588352a5e7cSSebastian Grimberg B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n]; 1589ed9e99e6SJeremy L Thompson } 1590ed9e99e6SJeremy L Thompson } 1591ed9e99e6SJeremy L Thompson } 15927c1dbaffSSebastian Grimberg if (identity) CeedCall(CeedFree(&identity)); 1593437c7c90SJeremy L Thompson data->assembled_bases_out[b] = B_out; 1594437c7c90SJeremy L Thompson } 1595ed9e99e6SJeremy L Thompson } 1596ed9e99e6SJeremy L Thompson 1597437c7c90SJeremy L Thompson // Pass out assembled data 1598506b1a0cSSebastian Grimberg if (num_active_bases_in) *num_active_bases_in = data->num_active_bases_in; 1599506b1a0cSSebastian Grimberg if (active_bases_in) *active_bases_in = data->active_bases_in; 1600437c7c90SJeremy L Thompson if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in; 1601506b1a0cSSebastian Grimberg if (num_active_bases_out) *num_active_bases_out = data->num_active_bases_out; 1602506b1a0cSSebastian Grimberg if (active_bases_out) *active_bases_out = data->active_bases_out; 1603437c7c90SJeremy L Thompson if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out; 1604437c7c90SJeremy L Thompson return CEED_ERROR_SUCCESS; 1605437c7c90SJeremy L Thompson } 1606437c7c90SJeremy L Thompson 1607437c7c90SJeremy L Thompson /** 1608ba746a46SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly. 1609ba746a46SJeremy L Thompson 1610ba746a46SJeremy L Thompson Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object. 1611437c7c90SJeremy L Thompson 1612437c7c90SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1613506b1a0cSSebastian Grimberg @param[out] num_active_elem_rstrs_in Number of active input element restrictions, or NULL 1614506b1a0cSSebastian Grimberg @param[out] active_elem_rstrs_in Pointer to hold active input CeedElemRestrictions, or NULL 1615506b1a0cSSebastian Grimberg @param[out] num_active_elem_rstrs_out Number of active output element restrictions, or NULL 1616506b1a0cSSebastian Grimberg @param[out] active_elem_rstrs_out Pointer to hold active output CeedElemRestrictions, or NULL 1617437c7c90SJeremy L Thompson 1618437c7c90SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1619437c7c90SJeremy L Thompson 1620437c7c90SJeremy L Thompson @ref Backend 1621437c7c90SJeremy L Thompson **/ 1622506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs_in, 1623506b1a0cSSebastian Grimberg CeedElemRestriction **active_elem_rstrs_in, CeedInt *num_active_elem_rstrs_out, 1624506b1a0cSSebastian Grimberg CeedElemRestriction **active_elem_rstrs_out) { 1625506b1a0cSSebastian Grimberg if (num_active_elem_rstrs_in) *num_active_elem_rstrs_in = data->num_active_bases_in; 1626506b1a0cSSebastian Grimberg if (active_elem_rstrs_in) *active_elem_rstrs_in = data->active_elem_rstrs_in; 1627506b1a0cSSebastian Grimberg if (num_active_elem_rstrs_out) *num_active_elem_rstrs_out = data->num_active_bases_out; 1628506b1a0cSSebastian Grimberg if (active_elem_rstrs_out) *active_elem_rstrs_out = data->active_elem_rstrs_out; 1629ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1630ed9e99e6SJeremy L Thompson } 1631ed9e99e6SJeremy L Thompson 1632ed9e99e6SJeremy L Thompson /** 1633ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1634ed9e99e6SJeremy L Thompson 1635ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1636ed9e99e6SJeremy L Thompson 1637ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1638ed9e99e6SJeremy L Thompson 1639ed9e99e6SJeremy L Thompson @ref Backend 1640ed9e99e6SJeremy L Thompson **/ 1641ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1642ad6481ceSJeremy L Thompson if (!*data) { 1643ad6481ceSJeremy L Thompson *data = NULL; 1644ad6481ceSJeremy L Thompson return CEED_ERROR_SUCCESS; 1645ad6481ceSJeremy L Thompson } 16462b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 1647506b1a0cSSebastian Grimberg for (CeedInt b = 0; b < (*data)->num_active_bases_in; b++) { 1648506b1a0cSSebastian Grimberg CeedCall(CeedBasisDestroy(&(*data)->active_bases_in[b])); 1649506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs_in[b])); 1650437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in[b])); 1651437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b])); 1652437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in[b])); 1653506b1a0cSSebastian Grimberg } 1654506b1a0cSSebastian Grimberg for (CeedInt b = 0; b < (*data)->num_active_bases_out; b++) { 1655506b1a0cSSebastian Grimberg CeedCall(CeedBasisDestroy(&(*data)->active_bases_out[b])); 1656506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs_out[b])); 1657506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->eval_modes_out[b])); 1658506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b])); 1659437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out[b])); 1660437c7c90SJeremy L Thompson } 1661506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->active_bases_in)); 1662506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->active_bases_out)); 1663506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->active_elem_rstrs_in)); 1664506b1a0cSSebastian Grimberg CeedCall(CeedFree(&(*data)->active_elem_rstrs_out)); 1665437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_in)); 1666437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->num_eval_modes_out)); 1667437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_in)); 1668437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_modes_out)); 1669437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_in)); 1670437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_offsets_out)); 1671437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_in)); 1672437c7c90SJeremy L Thompson CeedCall(CeedFree(&(*data)->assembled_bases_out)); 1673ed9e99e6SJeremy L Thompson 16742b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1675ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1676ed9e99e6SJeremy L Thompson } 1677ed9e99e6SJeremy L Thompson 1678480fae85SJeremy L Thompson /// @} 1679480fae85SJeremy L Thompson 1680480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1681eaf62fffSJeremy L Thompson /// CeedOperator Public API 1682eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1683eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1684eaf62fffSJeremy L Thompson /// @{ 1685eaf62fffSJeremy L Thompson 1686eaf62fffSJeremy L Thompson /** 1687eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1688eaf62fffSJeremy L Thompson 1689ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1690859c15bbSJames Wright The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices 1691859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element. 1692859c15bbSJames Wright 16939fd66db6SSebastian Grimberg Inputs and outputs are in the order provided by the user when adding CeedOperator fields. 16949fd66db6SSebastian Grimberg For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction 16959fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v]. 1696eaf62fffSJeremy L Thompson 1697ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1698f04ea552SJeremy L Thompson 1699ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1700ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1701ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1702ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1703eaf62fffSJeremy L Thompson 1704eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1705eaf62fffSJeremy L Thompson 1706eaf62fffSJeremy L Thompson @ref User 1707eaf62fffSJeremy L Thompson **/ 17082b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 17092b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1710eaf62fffSJeremy L Thompson 1711eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1712d04bbc78SJeremy L Thompson // Backend version 17132b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1714eaf62fffSJeremy L Thompson } else { 1715d04bbc78SJeremy L Thompson // Operator fallback 1716d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1717d04bbc78SJeremy L Thompson 17182b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 17196574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 17206574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 172170a7ffb3SJeremy L Thompson } 1722eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1723eaf62fffSJeremy L Thompson } 172470a7ffb3SJeremy L Thompson 172570a7ffb3SJeremy L Thompson /** 1726ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 17274385fb7fSSebastian Grimberg 1728ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1729ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1730ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 173170a7ffb3SJeremy L Thompson 1732c5f45aeaSJeremy L Thompson Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers. 1733c5f45aeaSJeremy L Thompson These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object. 1734c5f45aeaSJeremy L Thompson 1735ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1736ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1737ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1738ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 173970a7ffb3SJeremy L Thompson 174070a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 174170a7ffb3SJeremy L Thompson 174270a7ffb3SJeremy L Thompson @ref User 174370a7ffb3SJeremy L Thompson **/ 17442b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 1745b05f7e9fSJeremy L Thompson int (*LinearAssembleQFunctionUpdate)(CeedOperator, CeedVector, CeedElemRestriction, CeedRequest *) = NULL; 1746b05f7e9fSJeremy L Thompson CeedOperator op_assemble = NULL; 1747bb229da9SJeremy L Thompson CeedOperator op_fallback_parent = NULL; 1748b05f7e9fSJeremy L Thompson 17492b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 175070a7ffb3SJeremy L Thompson 1751b05f7e9fSJeremy L Thompson // Determine if fallback parent or operator has implementation 1752bb229da9SJeremy L Thompson CeedCall(CeedOperatorGetFallbackParent(op, &op_fallback_parent)); 1753bb229da9SJeremy L Thompson if (op_fallback_parent && op_fallback_parent->LinearAssembleQFunctionUpdate) { 1754b05f7e9fSJeremy L Thompson // -- Backend version for op fallback parent is faster, if it exists 1755bb229da9SJeremy L Thompson LinearAssembleQFunctionUpdate = op_fallback_parent->LinearAssembleQFunctionUpdate; 1756bb229da9SJeremy L Thompson op_assemble = op_fallback_parent; 1757b05f7e9fSJeremy L Thompson } else if (op->LinearAssembleQFunctionUpdate) { 1758b05f7e9fSJeremy L Thompson // -- Backend version for op 1759b05f7e9fSJeremy L Thompson LinearAssembleQFunctionUpdate = op->LinearAssembleQFunctionUpdate; 1760b05f7e9fSJeremy L Thompson op_assemble = op; 1761b05f7e9fSJeremy L Thompson } 1762b05f7e9fSJeremy L Thompson 1763b05f7e9fSJeremy L Thompson // Assemble QFunction 1764b05f7e9fSJeremy L Thompson if (LinearAssembleQFunctionUpdate) { 1765b05f7e9fSJeremy L Thompson // Backend or fallback parent version 1766480fae85SJeremy L Thompson bool qf_assembled_is_setup; 17672efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 17682efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1769480fae85SJeremy L Thompson 17702b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1771480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1772d04bbc78SJeremy L Thompson bool update_needed; 1773d04bbc78SJeremy L Thompson 17742b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 17752b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 1776b05f7e9fSJeremy L Thompson if (update_needed) CeedCall(LinearAssembleQFunctionUpdate(op_assemble, assembled_vec, assembled_rstr, request)); 177770a7ffb3SJeremy L Thompson } else { 1778b05f7e9fSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunction(op_assemble, &assembled_vec, &assembled_rstr, request)); 17792b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 178070a7ffb3SJeremy L Thompson } 17812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 17822efa2d85SJeremy L Thompson 1783d04bbc78SJeremy L Thompson // Copy reference from internally held copy 17842b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 17852b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 1786c5f45aeaSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 17872b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 178870a7ffb3SJeremy L Thompson } else { 1789d04bbc78SJeremy L Thompson // Operator fallback 1790d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1791d04bbc78SJeremy L Thompson 17922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 17936574a04fSJeremy L Thompson if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 17946574a04fSJeremy L Thompson else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 179570a7ffb3SJeremy L Thompson } 179670a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1797eaf62fffSJeremy L Thompson } 1798eaf62fffSJeremy L Thompson 1799eaf62fffSJeremy L Thompson /** 1800eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1801eaf62fffSJeremy L Thompson 1802eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1803eaf62fffSJeremy L Thompson 1804ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1805eaf62fffSJeremy L Thompson 1806ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1807f04ea552SJeremy L Thompson 1808ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1809eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1810ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1811eaf62fffSJeremy L Thompson 1812eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1813eaf62fffSJeremy L Thompson 1814eaf62fffSJeremy L Thompson @ref User 1815eaf62fffSJeremy L Thompson **/ 18162b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1817f3d47e36SJeremy L Thompson bool is_composite; 18181c66c397SJeremy L Thompson CeedSize input_size = 0, output_size = 0; 18191c66c397SJeremy L Thompson 18202b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1821f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1822eaf62fffSJeremy L Thompson 18232b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 18246574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1825c9366a6bSJeremy L Thompson 1826f3d47e36SJeremy L Thompson // Early exit for empty operator 1827f3d47e36SJeremy L Thompson if (!is_composite) { 1828f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1829f3d47e36SJeremy L Thompson 1830f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1831f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1832f3d47e36SJeremy L Thompson } 1833f3d47e36SJeremy L Thompson 1834eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1835d04bbc78SJeremy L Thompson // Backend version 18362b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1837eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1838eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1839d04bbc78SJeremy L Thompson // Backend version with zeroing first 18402b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 18412b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1842eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1843eaf62fffSJeremy L Thompson } else { 1844d04bbc78SJeremy L Thompson // Operator fallback 1845d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1846d04bbc78SJeremy L Thompson 18472b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1848d04bbc78SJeremy L Thompson if (op_fallback) { 18492b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1850eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1851eaf62fffSJeremy L Thompson } 1852eaf62fffSJeremy L Thompson } 1853eaf62fffSJeremy L Thompson // Default interface implementation 18542b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 18552b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1856eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1857eaf62fffSJeremy L Thompson } 1858eaf62fffSJeremy L Thompson 1859eaf62fffSJeremy L Thompson /** 1860eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1861eaf62fffSJeremy L Thompson 1862eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1863eaf62fffSJeremy L Thompson 1864ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1865eaf62fffSJeremy L Thompson 1866ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1867f04ea552SJeremy L Thompson 1868ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1869eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1870ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1871eaf62fffSJeremy L Thompson 1872eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1873eaf62fffSJeremy L Thompson 1874eaf62fffSJeremy L Thompson @ref User 1875eaf62fffSJeremy L Thompson **/ 18762b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1877f3d47e36SJeremy L Thompson bool is_composite; 18781c66c397SJeremy L Thompson CeedSize input_size = 0, output_size = 0; 18791c66c397SJeremy L Thompson 18802b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1881f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1882eaf62fffSJeremy L Thompson 18832b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 18846574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1885c9366a6bSJeremy L Thompson 1886f3d47e36SJeremy L Thompson // Early exit for empty operator 1887f3d47e36SJeremy L Thompson if (!is_composite) { 1888f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1889f3d47e36SJeremy L Thompson 1890f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1891f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1892f3d47e36SJeremy L Thompson } 1893f3d47e36SJeremy L Thompson 1894eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1895d04bbc78SJeremy L Thompson // Backend version 18962b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1897eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1898eaf62fffSJeremy L Thompson } else { 1899d04bbc78SJeremy L Thompson // Operator fallback 1900d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1901d04bbc78SJeremy L Thompson 19022b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1903d04bbc78SJeremy L Thompson if (op_fallback) { 19042b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1905eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1906eaf62fffSJeremy L Thompson } 1907eaf62fffSJeremy L Thompson } 1908eaf62fffSJeremy L Thompson // Default interface implementation 1909eaf62fffSJeremy L Thompson if (is_composite) { 19102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1911eaf62fffSJeremy L Thompson } else { 19122b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1913eaf62fffSJeremy L Thompson } 1914d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1915eaf62fffSJeremy L Thompson } 1916eaf62fffSJeremy L Thompson 1917eaf62fffSJeremy L Thompson /** 191801f0e615SJames Wright @brief Fully assemble the point-block diagonal pattern of a linear operator. 191901f0e615SJames Wright 192001f0e615SJames Wright Expected to be used in conjunction with CeedOperatorLinearAssemblePointBlockDiagonal(). 192101f0e615SJames Wright 192201f0e615SJames Wright The assembly routines use coordinate format, with `num_entries` tuples of the form (i, j, value) which indicate that value should be added to the 192301f0e615SJames Wright matrix in entry (i, j). 192401f0e615SJames Wright Note that the (i, j) pairs are unique. 192501f0e615SJames Wright This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemblePointBlockDiagonal() provides the values in 192601f0e615SJames Wright the same ordering. 192701f0e615SJames Wright 192801f0e615SJames Wright This will generally be slow unless your operator is low-order. 192901f0e615SJames Wright 193001f0e615SJames Wright Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 193101f0e615SJames Wright 193201f0e615SJames Wright @param[in] op CeedOperator to assemble 193301f0e615SJames Wright @param[out] num_entries Number of entries in coordinate nonzero pattern 193401f0e615SJames Wright @param[out] rows Row number for each entry 193501f0e615SJames Wright @param[out] cols Column number for each entry 193601f0e615SJames Wright 193701f0e615SJames Wright @ref User 193801f0e615SJames Wright **/ 193901f0e615SJames Wright int CeedOperatorLinearAssemblePointBlockDiagonalSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 194001f0e615SJames Wright Ceed ceed; 194101f0e615SJames Wright bool is_composite; 194201f0e615SJames Wright CeedInt num_active_components, num_sub_operators; 194301f0e615SJames Wright CeedOperator *sub_operators; 194401f0e615SJames Wright 194501f0e615SJames Wright CeedCall(CeedOperatorGetCeed(op, &ceed)); 194601f0e615SJames Wright CeedCall(CeedOperatorIsComposite(op, &is_composite)); 194701f0e615SJames Wright 194801f0e615SJames Wright CeedSize input_size = 0, output_size = 0; 194901f0e615SJames Wright CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 195001f0e615SJames Wright CeedCheck(input_size == output_size, ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 195101f0e615SJames Wright 195201f0e615SJames Wright if (is_composite) { 195301f0e615SJames Wright CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub_operators)); 195401f0e615SJames Wright CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 195501f0e615SJames Wright } else { 195601f0e615SJames Wright sub_operators = &op; 195701f0e615SJames Wright num_sub_operators = 1; 195801f0e615SJames Wright } 195901f0e615SJames Wright 1960506b1a0cSSebastian Grimberg // Verify operator can be assembled correctly 1961506b1a0cSSebastian Grimberg { 196201f0e615SJames Wright CeedOperatorAssemblyData data; 1963506b1a0cSSebastian Grimberg CeedInt num_active_elem_rstrs, comp_stride; 196401f0e615SJames Wright CeedElemRestriction *active_elem_rstrs; 196501f0e615SJames Wright 196601f0e615SJames Wright // Get initial values to check against 196701f0e615SJames Wright CeedCall(CeedOperatorGetOperatorAssemblyData(sub_operators[0], &data)); 1968506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, &num_active_elem_rstrs, &active_elem_rstrs, NULL, NULL)); 196901f0e615SJames Wright CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstrs[0], &comp_stride)); 197001f0e615SJames Wright CeedCall(CeedElemRestrictionGetNumComponents(active_elem_rstrs[0], &num_active_components)); 197101f0e615SJames Wright 1972506b1a0cSSebastian Grimberg // Verify that all active element restrictions have same component stride and number of components 197301f0e615SJames Wright for (CeedInt k = 0; k < num_sub_operators; k++) { 197401f0e615SJames Wright CeedCall(CeedOperatorGetOperatorAssemblyData(sub_operators[k], &data)); 1975506b1a0cSSebastian Grimberg CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, &num_active_elem_rstrs, &active_elem_rstrs, NULL, NULL)); 197601f0e615SJames Wright for (CeedInt i = 0; i < num_active_elem_rstrs; i++) { 1977506b1a0cSSebastian Grimberg CeedInt comp_stride_sub, num_active_components_sub; 1978506b1a0cSSebastian Grimberg 197901f0e615SJames Wright CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstrs[i], &comp_stride_sub)); 198001f0e615SJames Wright CeedCheck(comp_stride == comp_stride_sub, ceed, CEED_ERROR_DIMENSION, 198101f0e615SJames Wright "Active element restrictions must have the same component stride: %d vs %d", comp_stride, comp_stride_sub); 198201f0e615SJames Wright CeedCall(CeedElemRestrictionGetNumComponents(active_elem_rstrs[i], &num_active_components_sub)); 198301f0e615SJames Wright CeedCheck(num_active_components == num_active_components_sub, ceed, CEED_ERROR_INCOMPATIBLE, 198401f0e615SJames Wright "All suboperators must have the same number of output components"); 198501f0e615SJames Wright } 198601f0e615SJames Wright } 198701f0e615SJames Wright } 198801f0e615SJames Wright *num_entries = input_size * num_active_components; 198901f0e615SJames Wright CeedCall(CeedCalloc(*num_entries, rows)); 199001f0e615SJames Wright CeedCall(CeedCalloc(*num_entries, cols)); 199101f0e615SJames Wright 199201f0e615SJames Wright for (CeedInt o = 0; o < num_sub_operators; o++) { 1993506b1a0cSSebastian Grimberg CeedElemRestriction active_elem_rstr, point_block_active_elem_rstr; 199401f0e615SJames Wright CeedInt comp_stride, num_elem, elem_size; 1995506b1a0cSSebastian Grimberg const CeedInt *offsets, *point_block_offsets; 199601f0e615SJames Wright 199701f0e615SJames Wright CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[o], &active_elem_rstr)); 199801f0e615SJames Wright CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstr, &comp_stride)); 199901f0e615SJames Wright CeedCall(CeedElemRestrictionGetNumElements(active_elem_rstr, &num_elem)); 200001f0e615SJames Wright CeedCall(CeedElemRestrictionGetElementSize(active_elem_rstr, &elem_size)); 200101f0e615SJames Wright CeedCall(CeedElemRestrictionGetOffsets(active_elem_rstr, CEED_MEM_HOST, &offsets)); 200201f0e615SJames Wright 2003506b1a0cSSebastian Grimberg CeedCall(CeedOperatorCreateActivePointBlockRestriction(active_elem_rstr, &point_block_active_elem_rstr)); 2004506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionGetOffsets(point_block_active_elem_rstr, CEED_MEM_HOST, &point_block_offsets)); 200501f0e615SJames Wright 200601f0e615SJames Wright for (CeedSize i = 0; i < num_elem * elem_size; i++) { 200701f0e615SJames Wright for (CeedInt c_out = 0; c_out < num_active_components; c_out++) { 200801f0e615SJames Wright for (CeedInt c_in = 0; c_in < num_active_components; c_in++) { 2009506b1a0cSSebastian Grimberg (*rows)[point_block_offsets[i] + c_out * num_active_components + c_in] = offsets[i] + c_out * comp_stride; 2010506b1a0cSSebastian Grimberg (*cols)[point_block_offsets[i] + c_out * num_active_components + c_in] = offsets[i] + c_in * comp_stride; 201101f0e615SJames Wright } 201201f0e615SJames Wright } 201301f0e615SJames Wright } 201401f0e615SJames Wright 201501f0e615SJames Wright CeedCall(CeedElemRestrictionRestoreOffsets(active_elem_rstr, &offsets)); 2016506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionRestoreOffsets(point_block_active_elem_rstr, &point_block_offsets)); 2017506b1a0cSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&point_block_active_elem_rstr)); 201801f0e615SJames Wright } 201901f0e615SJames Wright return CEED_ERROR_SUCCESS; 202001f0e615SJames Wright } 202101f0e615SJames Wright 202201f0e615SJames Wright /** 2023eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 2024eaf62fffSJeremy L Thompson 2025ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 2026eaf62fffSJeremy L Thompson 2027ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 2028eaf62fffSJeremy L Thompson 2029ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2030f04ea552SJeremy L Thompson 2031ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 2032ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 2033ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 2034ea61e9acSJeremy L Thompson component in]. 2035ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2036eaf62fffSJeremy L Thompson 2037eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2038eaf62fffSJeremy L Thompson 2039eaf62fffSJeremy L Thompson @ref User 2040eaf62fffSJeremy L Thompson **/ 20412b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 2042f3d47e36SJeremy L Thompson bool is_composite; 20431c66c397SJeremy L Thompson CeedSize input_size = 0, output_size = 0; 20441c66c397SJeremy L Thompson 20452b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2046f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 2047eaf62fffSJeremy L Thompson 20482b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 20496574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 2050c9366a6bSJeremy L Thompson 2051f3d47e36SJeremy L Thompson // Early exit for empty operator 2052f3d47e36SJeremy L Thompson if (!is_composite) { 2053f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 2054f3d47e36SJeremy L Thompson 2055f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 2056f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 2057f3d47e36SJeremy L Thompson } 2058f3d47e36SJeremy L Thompson 2059eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 2060d04bbc78SJeremy L Thompson // Backend version 20612b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 2062eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2063eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 2064d04bbc78SJeremy L Thompson // Backend version with zeroing first 20652b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 20662b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 2067eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2068eaf62fffSJeremy L Thompson } else { 2069d04bbc78SJeremy L Thompson // Operator fallback 2070d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2071d04bbc78SJeremy L Thompson 20722b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2073d04bbc78SJeremy L Thompson if (op_fallback) { 20742b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 2075eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2076eaf62fffSJeremy L Thompson } 2077eaf62fffSJeremy L Thompson } 2078eaf62fffSJeremy L Thompson // Default interface implementation 20792b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 20802b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 2081eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2082eaf62fffSJeremy L Thompson } 2083eaf62fffSJeremy L Thompson 2084eaf62fffSJeremy L Thompson /** 2085eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 2086eaf62fffSJeremy L Thompson 2087ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 2088eaf62fffSJeremy L Thompson 2089ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 2090eaf62fffSJeremy L Thompson 2091ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2092f04ea552SJeremy L Thompson 2093ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 2094ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 2095ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 2096ea61e9acSJeremy L Thompson component in]. 2097ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2098eaf62fffSJeremy L Thompson 2099eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2100eaf62fffSJeremy L Thompson 2101eaf62fffSJeremy L Thompson @ref User 2102eaf62fffSJeremy L Thompson **/ 21032b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 2104f3d47e36SJeremy L Thompson bool is_composite; 21051c66c397SJeremy L Thompson CeedSize input_size = 0, output_size = 0; 21061c66c397SJeremy L Thompson 21072b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2108f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 2109eaf62fffSJeremy L Thompson 21102b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 21116574a04fSJeremy L Thompson CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 2112c9366a6bSJeremy L Thompson 2113f3d47e36SJeremy L Thompson // Early exit for empty operator 2114f3d47e36SJeremy L Thompson if (!is_composite) { 2115f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 2116f3d47e36SJeremy L Thompson 2117f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 2118f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 2119f3d47e36SJeremy L Thompson } 2120f3d47e36SJeremy L Thompson 2121eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 2122d04bbc78SJeremy L Thompson // Backend version 21232b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 2124eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2125eaf62fffSJeremy L Thompson } else { 2126d04bbc78SJeremy L Thompson // Operator fallback 2127d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2128d04bbc78SJeremy L Thompson 21292b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2130d04bbc78SJeremy L Thompson if (op_fallback) { 21312b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 2132eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2133eaf62fffSJeremy L Thompson } 2134eaf62fffSJeremy L Thompson } 2135ea61e9acSJeremy L Thompson // Default interface implementation 2136eaf62fffSJeremy L Thompson if (is_composite) { 21372b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 2138eaf62fffSJeremy L Thompson } else { 21392b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 2140eaf62fffSJeremy L Thompson } 2141d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 2142eaf62fffSJeremy L Thompson } 2143eaf62fffSJeremy L Thompson 2144eaf62fffSJeremy L Thompson /** 2145eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 2146eaf62fffSJeremy L Thompson 2147ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 2148eaf62fffSJeremy L Thompson 2149ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 21509fd66db6SSebastian Grimberg matrix in entry (i, j). 21519fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 21529fd66db6SSebastian Grimberg This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 2153eaf62fffSJeremy L Thompson 2154eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 2155eaf62fffSJeremy L Thompson 2156ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2157f04ea552SJeremy L Thompson 2158eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 2159eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 2160eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 2161eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 2162eaf62fffSJeremy L Thompson 2163eaf62fffSJeremy L Thompson @ref User 2164eaf62fffSJeremy L Thompson **/ 21652b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 21661c66c397SJeremy L Thompson bool is_composite; 21671c66c397SJeremy L Thompson CeedInt num_suboperators, offset = 0; 2168b94338b9SJed Brown CeedSize single_entries; 2169eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 21701c66c397SJeremy L Thompson 21712b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2172f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 2173eaf62fffSJeremy L Thompson 2174eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 2175d04bbc78SJeremy L Thompson // Backend version 21762b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 2177eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2178eaf62fffSJeremy L Thompson } else { 2179d04bbc78SJeremy L Thompson // Operator fallback 2180d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2181d04bbc78SJeremy L Thompson 21822b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2183d04bbc78SJeremy L Thompson if (op_fallback) { 21842b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 2185eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2186eaf62fffSJeremy L Thompson } 2187eaf62fffSJeremy L Thompson } 2188eaf62fffSJeremy L Thompson 2189eaf62fffSJeremy L Thompson // Default interface implementation 2190eaf62fffSJeremy L Thompson 2191506b1a0cSSebastian Grimberg // Count entries and allocate rows, cols arrays 2192eaf62fffSJeremy L Thompson *num_entries = 0; 2193eaf62fffSJeremy L Thompson if (is_composite) { 2194c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2195c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 219692ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 21972b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 2198eaf62fffSJeremy L Thompson *num_entries += single_entries; 2199eaf62fffSJeremy L Thompson } 2200eaf62fffSJeremy L Thompson } else { 22012b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 2202eaf62fffSJeremy L Thompson *num_entries += single_entries; 2203eaf62fffSJeremy L Thompson } 22042b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 22052b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 2206eaf62fffSJeremy L Thompson 2207506b1a0cSSebastian Grimberg // Assemble nonzero locations 2208eaf62fffSJeremy L Thompson if (is_composite) { 2209c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2210c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 221192ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 22122b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 22132b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 2214eaf62fffSJeremy L Thompson offset += single_entries; 2215eaf62fffSJeremy L Thompson } 2216eaf62fffSJeremy L Thompson } else { 22172b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 2218eaf62fffSJeremy L Thompson } 2219eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2220eaf62fffSJeremy L Thompson } 2221eaf62fffSJeremy L Thompson 2222eaf62fffSJeremy L Thompson /** 2223eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 2224eaf62fffSJeremy L Thompson 2225ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 2226eaf62fffSJeremy L Thompson 2227ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 22289fd66db6SSebastian Grimberg matrix in entry (i, j). 22299fd66db6SSebastian Grimberg Note that the (i, j) pairs are not unique and may repeat. 22309fd66db6SSebastian Grimberg This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 2231eaf62fffSJeremy L Thompson 2232eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 2233eaf62fffSJeremy L Thompson 2234ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2235f04ea552SJeremy L Thompson 2236eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 2237eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 2238eaf62fffSJeremy L Thompson 2239eaf62fffSJeremy L Thompson @ref User 2240eaf62fffSJeremy L Thompson **/ 2241eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 22421c66c397SJeremy L Thompson bool is_composite; 22431c66c397SJeremy L Thompson CeedInt num_suboperators, offset = 0; 2244b94338b9SJed Brown CeedSize single_entries = 0; 2245eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 22461c66c397SJeremy L Thompson 22472b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2248f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 2249f3d47e36SJeremy L Thompson 2250f3d47e36SJeremy L Thompson // Early exit for empty operator 2251f3d47e36SJeremy L Thompson if (!is_composite) { 2252f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 2253f3d47e36SJeremy L Thompson 2254f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 2255f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 2256f3d47e36SJeremy L Thompson } 2257eaf62fffSJeremy L Thompson 2258eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 2259d04bbc78SJeremy L Thompson // Backend version 22602b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 2261eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2262eaf62fffSJeremy L Thompson } else { 2263d04bbc78SJeremy L Thompson // Operator fallback 2264d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2265d04bbc78SJeremy L Thompson 22662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2267d04bbc78SJeremy L Thompson if (op_fallback) { 22682b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 2269eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2270eaf62fffSJeremy L Thompson } 2271eaf62fffSJeremy L Thompson } 2272eaf62fffSJeremy L Thompson 2273eaf62fffSJeremy L Thompson // Default interface implementation 227428ec399dSJeremy L Thompson CeedCall(CeedVectorSetValue(values, 0.0)); 2275eaf62fffSJeremy L Thompson if (is_composite) { 2276c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2277c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 2278cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 22792b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 22802b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 2281eaf62fffSJeremy L Thompson offset += single_entries; 2282eaf62fffSJeremy L Thompson } 2283eaf62fffSJeremy L Thompson } else { 22842b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 2285eaf62fffSJeremy L Thompson } 2286eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2287eaf62fffSJeremy L Thompson } 2288eaf62fffSJeremy L Thompson 2289eaf62fffSJeremy L Thompson /** 229075f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 229175f0d5a4SJeremy L Thompson 229275f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 229375f0d5a4SJeremy L Thompson 229475f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 229575f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 229675f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 229775f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 229875f0d5a4SJeremy L Thompson 229975f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 230075f0d5a4SJeremy L Thompson 230175f0d5a4SJeremy L Thompson @ref User 230275f0d5a4SJeremy L Thompson **/ 230375f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 230475f0d5a4SJeremy L Thompson Ceed ceed; 2305b275c451SJeremy L Thompson CeedInt num_suboperators; 230675f0d5a4SJeremy L Thompson CeedSize l_vec_len; 230775f0d5a4SJeremy L Thompson CeedScalar *mult_array; 230875f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 23097c1dbaffSSebastian Grimberg CeedElemRestriction elem_rstr, mult_elem_rstr; 2310b275c451SJeremy L Thompson CeedOperator *sub_operators; 231175f0d5a4SJeremy L Thompson 23121c66c397SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 23131c66c397SJeremy L Thompson 231475f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 231575f0d5a4SJeremy L Thompson 231675f0d5a4SJeremy L Thompson // Zero mult vector 231775f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 231875f0d5a4SJeremy L Thompson 231975f0d5a4SJeremy L Thompson // Get suboperators 2320b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 2321b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 2322b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 232375f0d5a4SJeremy L Thompson 232475f0d5a4SJeremy L Thompson // Work vector 232575f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 232675f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 232775f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 232875f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 232975f0d5a4SJeremy L Thompson 233075f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 2331b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 233275f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 233375f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 233475f0d5a4SJeremy L Thompson 233575f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 233675f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 233775f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 233875f0d5a4SJeremy L Thompson } 233975f0d5a4SJeremy L Thompson 234075f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 2341437c7c90SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr)); 23427c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr, &mult_elem_rstr)); 23437c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionCreateVector(mult_elem_rstr, &sub_mult_l_vec, &ones_e_vec)); 234475f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 23457c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 23467c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 234775f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 234875f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 234975f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 235075f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 235175f0d5a4SJeremy L Thompson } 235275f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 235375f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 235475f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 23557c1dbaffSSebastian Grimberg CeedCall(CeedElemRestrictionDestroy(&mult_elem_rstr)); 235675f0d5a4SJeremy L Thompson } 235775f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 2358811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 235975f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 236075f0d5a4SJeremy L Thompson } 236175f0d5a4SJeremy L Thompson 236275f0d5a4SJeremy L Thompson /** 2363ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 2364ea61e9acSJeremy L Thompson grid interpolation 2365eaf62fffSJeremy L Thompson 236658e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2367f04ea552SJeremy L Thompson 2368eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 236985bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2370eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2371eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2372eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 237385bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 23747758292fSSebastian Grimberg @param[out] op_restrict Fine to coarse operator, or NULL 2375eaf62fffSJeremy L Thompson 2376eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2377eaf62fffSJeremy L Thompson 2378eaf62fffSJeremy L Thompson @ref User 2379eaf62fffSJeremy L Thompson **/ 23802b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 23817758292fSSebastian Grimberg CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 23821c66c397SJeremy L Thompson CeedBasis basis_c_to_f = NULL; 23831c66c397SJeremy L Thompson 23842b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2385eaf62fffSJeremy L Thompson 238683d6adf3SZach Atkins // Build prolongation matrix, if required 23877758292fSSebastian Grimberg if (op_prolong || op_restrict) { 238883d6adf3SZach Atkins CeedBasis basis_fine; 23891c66c397SJeremy L Thompson 23902b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 23912b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 239283d6adf3SZach Atkins } 2393eaf62fffSJeremy L Thompson 2394f113e5dcSJeremy L Thompson // Core code 23957758292fSSebastian Grimberg CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2396eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2397eaf62fffSJeremy L Thompson } 2398eaf62fffSJeremy L Thompson 2399eaf62fffSJeremy L Thompson /** 2400ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 2401eaf62fffSJeremy L Thompson 240258e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2403f04ea552SJeremy L Thompson 2404eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 240585bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2406eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2407eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 240885bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2409eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 241085bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 24117758292fSSebastian Grimberg @param[out] op_restrict Fine to coarse operator, or NULL 2412eaf62fffSJeremy L Thompson 2413eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2414eaf62fffSJeremy L Thompson 2415eaf62fffSJeremy L Thompson @ref User 2416eaf62fffSJeremy L Thompson **/ 24172b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 24182b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 24197758292fSSebastian Grimberg CeedOperator *op_restrict) { 2420eaf62fffSJeremy L Thompson Ceed ceed; 24211c66c397SJeremy L Thompson CeedInt Q_f, Q_c; 24221c66c397SJeremy L Thompson CeedBasis basis_fine, basis_c_to_f = NULL; 24231c66c397SJeremy L Thompson 24241c66c397SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 24252b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2426eaf62fffSJeremy L Thompson 2427eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 24282b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 24292b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 24302b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 24316574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2432eaf62fffSJeremy L Thompson 243383d6adf3SZach Atkins // Create coarse to fine basis, if required 24347758292fSSebastian Grimberg if (op_prolong || op_restrict) { 24351c66c397SJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 24361c66c397SJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 24371c66c397SJeremy L Thompson 243883d6adf3SZach Atkins // Check if interpolation matrix is provided 24396574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 24406574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 24412b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 24422b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 24432b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 24442b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 24452b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 24462b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 24472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 24482b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 24492b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 24502b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 24512b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 24522b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 245383d6adf3SZach Atkins } 2454eaf62fffSJeremy L Thompson 2455eaf62fffSJeremy L Thompson // Core code 24567758292fSSebastian Grimberg CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2457eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2458eaf62fffSJeremy L Thompson } 2459eaf62fffSJeremy L Thompson 2460eaf62fffSJeremy L Thompson /** 2461ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2462eaf62fffSJeremy L Thompson 246358e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2464f04ea552SJeremy L Thompson 2465eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 246685bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2467eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2468eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 246985bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2470eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 247185bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 24727758292fSSebastian Grimberg @param[out] op_restrict Fine to coarse operator, or NULL 2473eaf62fffSJeremy L Thompson 2474eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2475eaf62fffSJeremy L Thompson 2476eaf62fffSJeremy L Thompson @ref User 2477eaf62fffSJeremy L Thompson **/ 24782b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 24797758292fSSebastian Grimberg const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 24807758292fSSebastian Grimberg CeedOperator *op_restrict) { 2481eaf62fffSJeremy L Thompson Ceed ceed; 24821c66c397SJeremy L Thompson CeedInt Q_f, Q_c; 24831c66c397SJeremy L Thompson CeedBasis basis_fine, basis_c_to_f = NULL; 24841c66c397SJeremy L Thompson 24851c66c397SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 24862b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2487eaf62fffSJeremy L Thompson 2488eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 24892b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 24902b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 24912b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 24926574a04fSJeremy L Thompson CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2493eaf62fffSJeremy L Thompson 2494eaf62fffSJeremy L Thompson // Coarse to fine basis 24957758292fSSebastian Grimberg if (op_prolong || op_restrict) { 24961c66c397SJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 24971c66c397SJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 24981c66c397SJeremy L Thompson CeedElemTopology topo; 24991c66c397SJeremy L Thompson 250083d6adf3SZach Atkins // Check if interpolation matrix is provided 25016574a04fSJeremy L Thompson CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE, 25026574a04fSJeremy L Thompson "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 25032b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 25042b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 25052b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 25062b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 25072b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 25082b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 25092b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 25102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 25112b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 25122b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 25132b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 25142b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 251583d6adf3SZach Atkins } 2516eaf62fffSJeremy L Thompson 2517eaf62fffSJeremy L Thompson // Core code 25187758292fSSebastian Grimberg CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2519eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2520eaf62fffSJeremy L Thompson } 2521eaf62fffSJeremy L Thompson 2522eaf62fffSJeremy L Thompson /** 2523ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2524eaf62fffSJeremy L Thompson 2525ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2526859c15bbSJames Wright This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$. 2527859c15bbSJames Wright The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T 25289fd66db6SSebastian Grimberg \hat S V\f$. 25299fd66db6SSebastian Grimberg The CeedOperator must be linear and non-composite. 25309fd66db6SSebastian Grimberg The associated CeedQFunction must therefore also be linear. 2531eaf62fffSJeremy L Thompson 2532ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2533f04ea552SJeremy L Thompson 2534ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2535ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2536ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2537eaf62fffSJeremy L Thompson 2538eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2539eaf62fffSJeremy L Thompson 2540480fae85SJeremy L Thompson @ref User 2541eaf62fffSJeremy L Thompson **/ 25422b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 25431c66c397SJeremy L Thompson Ceed ceed, ceed_parent; 25441c66c397SJeremy L Thompson bool interp = false, grad = false, is_tensor_basis = true; 25451c66c397SJeremy L Thompson CeedInt num_input_fields, P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1; 25461c66c397SJeremy L Thompson CeedSize l_size = 1; 25471c66c397SJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda, *elem_avg; 25481c66c397SJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 25491c66c397SJeremy L Thompson CeedVector q_data; 25501c66c397SJeremy L Thompson CeedElemRestriction rstr = NULL, rstr_qd_i; 25511c66c397SJeremy L Thompson CeedBasis basis = NULL, fdm_basis; 25521c66c397SJeremy L Thompson CeedQFunctionContext ctx_fdm; 25531c66c397SJeremy L Thompson CeedQFunctionField *qf_fields; 25541c66c397SJeremy L Thompson CeedQFunction qf, qf_fdm; 25551c66c397SJeremy L Thompson CeedOperatorField *op_fields; 25561c66c397SJeremy L Thompson 25572b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2558eaf62fffSJeremy L Thompson 2559eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2560d04bbc78SJeremy L Thompson // Backend version 25612b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2562eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2563eaf62fffSJeremy L Thompson } else { 2564d04bbc78SJeremy L Thompson // Operator fallback 2565d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2566d04bbc78SJeremy L Thompson 25672b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2568d04bbc78SJeremy L Thompson if (op_fallback) { 25692b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2570eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2571eaf62fffSJeremy L Thompson } 2572eaf62fffSJeremy L Thompson } 2573eaf62fffSJeremy L Thompson 2574d04bbc78SJeremy L Thompson // Default interface implementation 25752b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 2576bb229da9SJeremy L Thompson CeedCall(CeedOperatorGetFallbackParentCeed(op, &ceed_parent)); 25772b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2578eaf62fffSJeremy L Thompson 2579eaf62fffSJeremy L Thompson // Determine active input basis 25802b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 25812b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2582eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2583eaf62fffSJeremy L Thompson CeedVector vec; 25841c66c397SJeremy L Thompson 25852b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2586eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2587eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 25881c66c397SJeremy L Thompson 25892b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2590eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2591eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 25922b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 25932b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2594eaf62fffSJeremy L Thompson } 2595eaf62fffSJeremy L Thompson } 25966574a04fSJeremy L Thompson CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set"); 25972b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 2598352a5e7cSSebastian Grimberg CeedCall(CeedBasisGetNumNodes(basis, &num_nodes)); 25992b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 26002b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 26012b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 26022b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 26032b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 26042b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2605eaf62fffSJeremy L Thompson 2606eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 26076574a04fSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis)); 26086574a04fSJeremy L Thompson CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 26092b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 26102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 26112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 26122b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 26132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2614eaf62fffSJeremy L Thompson // -- Build matrices 26152b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 26162b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 26172b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 26182b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2619eaf62fffSJeremy L Thompson 2620eaf62fffSJeremy L Thompson // -- Diagonalize 26212b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 26222b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 26232b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 26242b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 26252b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 26262b730f8bSJeremy L Thompson } 26272b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2628eaf62fffSJeremy L Thompson 26291c66c397SJeremy L Thompson { 26301c66c397SJeremy L Thompson CeedInt layout[3], num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 26311c66c397SJeremy L Thompson CeedScalar max_norm = 0; 26321c66c397SJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 26331c66c397SJeremy L Thompson CeedVector assembled = NULL, q_weight; 2634c5f45aeaSJeremy L Thompson CeedElemRestriction rstr_qf = NULL; 26351c66c397SJeremy L Thompson 26361c66c397SJeremy L Thompson // Assemble QFunction 26372b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 26382b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 26392b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 26402b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2641eaf62fffSJeremy L Thompson 2642eaf62fffSJeremy L Thompson // Calculate element averages 26432b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 26442b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 26452b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 26462b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 26472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2648eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 26491c66c397SJeremy L Thompson 2650eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2651eaf62fffSJeremy L Thompson CeedInt count = 0; 26521c66c397SJeremy L Thompson 26532b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 26542b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 26552b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 26562b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2657eaf62fffSJeremy L Thompson count++; 2658eaf62fffSJeremy L Thompson } 26592b730f8bSJeremy L Thompson } 26602b730f8bSJeremy L Thompson } 2661eaf62fffSJeremy L Thompson if (count) { 2662eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2663eaf62fffSJeremy L Thompson } else { 2664eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2665eaf62fffSJeremy L Thompson } 2666eaf62fffSJeremy L Thompson } 26672b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 26682b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 26692b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 26702b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 26711c66c397SJeremy L Thompson } 2672eaf62fffSJeremy L Thompson 2673eaf62fffSJeremy L Thompson // Build FDM diagonal 26741c66c397SJeremy L Thompson { 2675eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 26761c66c397SJeremy L Thompson 2677352a5e7cSSebastian Grimberg CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal)); 2678352a5e7cSSebastian Grimberg const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON; 26792b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2680352a5e7cSSebastian Grimberg for (CeedInt n = 0; n < num_nodes; n++) { 2681352a5e7cSSebastian Grimberg if (interp) fdm_diagonal[c * num_nodes + n] = 1.0; 26822b730f8bSJeremy L Thompson if (grad) { 2683eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2684eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2685352a5e7cSSebastian Grimberg fdm_diagonal[c * num_nodes + n] += lambda[i]; 2686eaf62fffSJeremy L Thompson } 2687eaf62fffSJeremy L Thompson } 2688352a5e7cSSebastian Grimberg if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound; 26892b730f8bSJeremy L Thompson } 26902b730f8bSJeremy L Thompson } 2691352a5e7cSSebastian Grimberg CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data)); 26922b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 26932b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 26942b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 26952b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 26961c66c397SJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) 26971c66c397SJeremy L Thompson q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]); 26982b730f8bSJeremy L Thompson } 26992b730f8bSJeremy L Thompson } 27002b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 27012b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 27022b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 27031c66c397SJeremy L Thompson } 2704eaf62fffSJeremy L Thompson 2705eaf62fffSJeremy L Thompson // Setup FDM operator 2706eaf62fffSJeremy L Thompson // -- Basis 27071c66c397SJeremy L Thompson { 2708eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 27091c66c397SJeremy L Thompson 27102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 27112b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 27122b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 27132b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 27142b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 27152b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 27162b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 27172b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 27182b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 27191c66c397SJeremy L Thompson } 2720eaf62fffSJeremy L Thompson 2721eaf62fffSJeremy L Thompson // -- Restriction 27221c66c397SJeremy L Thompson { 2723352a5e7cSSebastian Grimberg CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp}; 2724352a5e7cSSebastian Grimberg CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i)); 27251c66c397SJeremy L Thompson } 27261c66c397SJeremy L Thompson 2727eaf62fffSJeremy L Thompson // -- QFunction 27282b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 27292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 27302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 27312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 27322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 27331c66c397SJeremy L Thompson 2734eaf62fffSJeremy L Thompson // -- QFunction context 27351c66c397SJeremy L Thompson { 2736eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 27371c66c397SJeremy L Thompson 27382b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2739eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 27402b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 27412b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 27421c66c397SJeremy L Thompson } 27432b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 27442b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 27451c66c397SJeremy L Thompson 2746eaf62fffSJeremy L Thompson // -- Operator 27472b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 27482b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2749356036faSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_NONE, q_data)); 27502b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2751eaf62fffSJeremy L Thompson 2752eaf62fffSJeremy L Thompson // Cleanup 27532b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 27542b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 27552b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 27562b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2757eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2758eaf62fffSJeremy L Thompson } 2759eaf62fffSJeremy L Thompson 2760eaf62fffSJeremy L Thompson /// @} 2761