13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors. 23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3eaf62fffSJeremy L Thompson // 43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause 5eaf62fffSJeremy L Thompson // 63d8e8822SJeremy L Thompson // This file is part of CEED: http://github.com/ceed 7eaf62fffSJeremy L Thompson 8ed9e99e6SJeremy L Thompson #include <assert.h> 92b730f8bSJeremy L Thompson #include <ceed-impl.h> 102b730f8bSJeremy L Thompson #include <ceed/backend.h> 112b730f8bSJeremy L Thompson #include <ceed/ceed.h> 122b730f8bSJeremy L Thompson #include <math.h> 13eaf62fffSJeremy L Thompson #include <stdbool.h> 14eaf62fffSJeremy L Thompson #include <stdio.h> 15eaf62fffSJeremy L Thompson #include <string.h> 16eaf62fffSJeremy L Thompson 17eaf62fffSJeremy L Thompson /// @file 18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces 19eaf62fffSJeremy L Thompson 20eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions 22eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper 24eaf62fffSJeremy L Thompson /// @{ 25eaf62fffSJeremy L Thompson 26eaf62fffSJeremy L Thompson /** 27ea61e9acSJeremy L Thompson @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality 289e77b9c8SJeremy L Thompson 2901ea9c81SJed Brown @param[in] fallback_ceed Ceed on which to create fallback CeedQFunction 309e77b9c8SJeremy L Thompson @param[in] qf CeedQFunction to create fallback for 3101ea9c81SJed Brown @param[out] qf_fallback fallback CeedQFunction 329e77b9c8SJeremy L Thompson 339e77b9c8SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 349e77b9c8SJeremy L Thompson 359e77b9c8SJeremy L Thompson @ref Developer 369e77b9c8SJeremy L Thompson **/ 372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) { 389e77b9c8SJeremy L Thompson // Check if NULL qf passed in 399e77b9c8SJeremy L Thompson if (!qf) return CEED_ERROR_SUCCESS; 409e77b9c8SJeremy L Thompson 41d04bbc78SJeremy L Thompson CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 4213f886e9SJeremy L Thompson CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n"); 43d04bbc78SJeremy L Thompson 449e77b9c8SJeremy L Thompson char *source_path_with_name = ""; 459e77b9c8SJeremy L Thompson if (qf->source_path) { 462b730f8bSJeremy L Thompson size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name); 472b730f8bSJeremy L Thompson CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name)); 489e77b9c8SJeremy L Thompson memcpy(source_path_with_name, qf->source_path, path_len); 499e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len], ":", 1); 509e77b9c8SJeremy L Thompson memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len); 519e77b9c8SJeremy L Thompson } else { 522b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &source_path_with_name)); 539e77b9c8SJeremy L Thompson } 549e77b9c8SJeremy L Thompson 552b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback)); 569e77b9c8SJeremy L Thompson { 579e77b9c8SJeremy L Thompson CeedQFunctionContext ctx; 589e77b9c8SJeremy L Thompson 592b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetContext(qf, &ctx)); 602b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx)); 619e77b9c8SJeremy L Thompson } 629e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_input_fields; i++) { 632b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode)); 649e77b9c8SJeremy L Thompson } 659e77b9c8SJeremy L Thompson for (CeedInt i = 0; i < qf->num_output_fields; i++) { 662b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode)); 679e77b9c8SJeremy L Thompson } 682b730f8bSJeremy L Thompson CeedCall(CeedFree(&source_path_with_name)); 699e77b9c8SJeremy L Thompson 709e77b9c8SJeremy L Thompson return CEED_ERROR_SUCCESS; 719e77b9c8SJeremy L Thompson } 729e77b9c8SJeremy L Thompson 739e77b9c8SJeremy L Thompson /** 74ea61e9acSJeremy L Thompson @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality 75eaf62fffSJeremy L Thompson 76ea61e9acSJeremy L Thompson @param[in,out] op CeedOperator to create fallback for 77eaf62fffSJeremy L Thompson 78eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 79eaf62fffSJeremy L Thompson 80eaf62fffSJeremy L Thompson @ref Developer 81eaf62fffSJeremy L Thompson **/ 82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) { 83b275c451SJeremy L Thompson bool is_composite; 849e77b9c8SJeremy L Thompson Ceed ceed_fallback; 85eaf62fffSJeremy L Thompson 86805fe78eSJeremy L Thompson // Check not already created 87805fe78eSJeremy L Thompson if (op->op_fallback) return CEED_ERROR_SUCCESS; 88805fe78eSJeremy L Thompson 89eaf62fffSJeremy L Thompson // Fallback Ceed 902b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback)); 91d04bbc78SJeremy L Thompson if (!ceed_fallback) return CEED_ERROR_SUCCESS; 92d04bbc78SJeremy L Thompson 93d04bbc78SJeremy L Thompson CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n"); 9413f886e9SJeremy L Thompson CeedDebug(op->ceed, "Creating fallback CeedOperator\n"); 95eaf62fffSJeremy L Thompson 96eaf62fffSJeremy L Thompson // Clone Op 97805fe78eSJeremy L Thompson CeedOperator op_fallback; 98b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 99b275c451SJeremy L Thompson if (is_composite) { 100b275c451SJeremy L Thompson CeedInt num_suboperators; 101b275c451SJeremy L Thompson CeedOperator *sub_operators; 102b275c451SJeremy L Thompson 1032b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback)); 104b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 105b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 106b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 107d04bbc78SJeremy L Thompson CeedOperator op_sub_fallback; 108d04bbc78SJeremy L Thompson 109b275c451SJeremy L Thompson CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback)); 1102b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback)); 111805fe78eSJeremy L Thompson } 112805fe78eSJeremy L Thompson } else { 1139e77b9c8SJeremy L Thompson CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL; 1142b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback)); 1152b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback)); 1162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback)); 1172b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback)); 118805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_input_fields; i++) { 1192b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_restr, op->input_fields[i]->basis, 1202b730f8bSJeremy L Thompson op->input_fields[i]->vec)); 121805fe78eSJeremy L Thompson } 122805fe78eSJeremy L Thompson for (CeedInt i = 0; i < op->qf->num_output_fields; i++) { 1232b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_restr, op->output_fields[i]->basis, 1242b730f8bSJeremy L Thompson op->output_fields[i]->vec)); 125805fe78eSJeremy L Thompson } 1262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled)); 127805fe78eSJeremy L Thompson if (op_fallback->num_qpts == 0) { 1282b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts)); 129805fe78eSJeremy L Thompson } 1309e77b9c8SJeremy L Thompson // Cleanup 1312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fallback)); 1322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqf_fallback)); 1332b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&dqfT_fallback)); 134805fe78eSJeremy L Thompson } 1352b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(op_fallback, op->name)); 1362b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fallback)); 137805fe78eSJeremy L Thompson op->op_fallback = op_fallback; 138eaf62fffSJeremy L Thompson 139eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 140eaf62fffSJeremy L Thompson } 141eaf62fffSJeremy L Thompson 142eaf62fffSJeremy L Thompson /** 143ea61e9acSJeremy L Thompson @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality 144d04bbc78SJeremy L Thompson 145d04bbc78SJeremy L Thompson @param[in] op CeedOperator to retrieve fallback for 146d04bbc78SJeremy L Thompson @param[out] op_fallback Fallback CeedOperator 147d04bbc78SJeremy L Thompson 148d04bbc78SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 149d04bbc78SJeremy L Thompson 150d04bbc78SJeremy L Thompson @ref Developer 151d04bbc78SJeremy L Thompson **/ 152d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) { 153d04bbc78SJeremy L Thompson // Create if needed 154d04bbc78SJeremy L Thompson if (!op->op_fallback) { 1552b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFallback(op)); 156d04bbc78SJeremy L Thompson } 157d04bbc78SJeremy L Thompson if (op->op_fallback) { 158d04bbc78SJeremy L Thompson bool is_debug; 159d04bbc78SJeremy L Thompson 1602b730f8bSJeremy L Thompson CeedCall(CeedIsDebug(op->ceed, &is_debug)); 161d04bbc78SJeremy L Thompson if (is_debug) { 162b275c451SJeremy L Thompson Ceed ceed, ceed_fallback; 163d04bbc78SJeremy L Thompson const char *resource, *resource_fallback; 164d04bbc78SJeremy L Thompson 165b275c451SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 166b275c451SJeremy L Thompson CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback)); 167b275c451SJeremy L Thompson CeedCall(CeedGetResource(ceed, &resource)); 1682b730f8bSJeremy L Thompson CeedCall(CeedGetResource(ceed_fallback, &resource_fallback)); 169d04bbc78SJeremy L Thompson 170b275c451SJeremy L Thompson CeedDebug256(ceed, 1, "---------- CeedOperator Fallback ----------\n"); 171b275c451SJeremy L Thompson CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback, 1722b730f8bSJeremy L Thompson op->op_fallback); 173d04bbc78SJeremy L Thompson } 174d04bbc78SJeremy L Thompson } 175d04bbc78SJeremy L Thompson *op_fallback = op->op_fallback; 176d04bbc78SJeremy L Thompson 177d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 178d04bbc78SJeremy L Thompson } 179d04bbc78SJeremy L Thompson 180d04bbc78SJeremy L Thompson /** 181eaf62fffSJeremy L Thompson @brief Select correct basis matrix pointer based on CeedEvalMode 182eaf62fffSJeremy L Thompson 183eaf62fffSJeremy L Thompson @param[in] eval_mode Current basis evaluation mode 184eaf62fffSJeremy L Thompson @param[in] identity Pointer to identity matrix 185eaf62fffSJeremy L Thompson @param[in] interp Pointer to interpolation matrix 186eaf62fffSJeremy L Thompson @param[in] grad Pointer to gradient matrix 187eaf62fffSJeremy L Thompson @param[out] basis_ptr Basis pointer to set 188eaf62fffSJeremy L Thompson 189eaf62fffSJeremy L Thompson @ref Developer 190eaf62fffSJeremy L Thompson **/ 1912b730f8bSJeremy L Thompson static inline void CeedOperatorGetBasisPointer(CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar *interp, const CeedScalar *grad, 1922b730f8bSJeremy L Thompson const CeedScalar **basis_ptr) { 193eaf62fffSJeremy L Thompson switch (eval_mode) { 194eaf62fffSJeremy L Thompson case CEED_EVAL_NONE: 195eaf62fffSJeremy L Thompson *basis_ptr = identity; 196eaf62fffSJeremy L Thompson break; 197eaf62fffSJeremy L Thompson case CEED_EVAL_INTERP: 198eaf62fffSJeremy L Thompson *basis_ptr = interp; 199eaf62fffSJeremy L Thompson break; 200eaf62fffSJeremy L Thompson case CEED_EVAL_GRAD: 201eaf62fffSJeremy L Thompson *basis_ptr = grad; 202eaf62fffSJeremy L Thompson break; 203eaf62fffSJeremy L Thompson case CEED_EVAL_WEIGHT: 204eaf62fffSJeremy L Thompson case CEED_EVAL_DIV: 205eaf62fffSJeremy L Thompson case CEED_EVAL_CURL: 206eaf62fffSJeremy L Thompson break; // Caught by QF Assembly 207eaf62fffSJeremy L Thompson } 208ed9e99e6SJeremy L Thompson assert(*basis_ptr != NULL); 209eaf62fffSJeremy L Thompson } 210eaf62fffSJeremy L Thompson 211eaf62fffSJeremy L Thompson /** 212eaf62fffSJeremy L Thompson @brief Create point block restriction for active operator field 213eaf62fffSJeremy L Thompson 214eaf62fffSJeremy L Thompson @param[in] rstr Original CeedElemRestriction for active field 215ea61e9acSJeremy L Thompson @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored 216eaf62fffSJeremy L Thompson 217eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 218eaf62fffSJeremy L Thompson 219eaf62fffSJeremy L Thompson @ref Developer 220eaf62fffSJeremy L Thompson **/ 2212b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) { 222eaf62fffSJeremy L Thompson Ceed ceed; 2232b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed)); 224eaf62fffSJeremy L Thompson const CeedInt *offsets; 2252b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets)); 226eaf62fffSJeremy L Thompson 227eaf62fffSJeremy L Thompson // Expand offsets 2287b63f5c6SJed Brown CeedInt num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets; 2297b63f5c6SJed Brown CeedSize l_size; 2302b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 2312b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 2322b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 2332b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride)); 2342b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 235eaf62fffSJeremy L Thompson CeedInt shift = num_comp; 2362b730f8bSJeremy L Thompson if (comp_stride != 1) shift *= num_comp; 2372b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets)); 238eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_elem * elem_size; i++) { 239eaf62fffSJeremy L Thompson pointblock_offsets[i] = offsets[i] * shift; 240eaf62fffSJeremy L Thompson } 241eaf62fffSJeremy L Thompson 242eaf62fffSJeremy L Thompson // Create new restriction 2432b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER, 2442b730f8bSJeremy L Thompson pointblock_offsets, pointblock_rstr)); 245eaf62fffSJeremy L Thompson 246eaf62fffSJeremy L Thompson // Cleanup 2472b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets)); 248eaf62fffSJeremy L Thompson 249eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 250eaf62fffSJeremy L Thompson } 251eaf62fffSJeremy L Thompson 252eaf62fffSJeremy L Thompson /** 253eaf62fffSJeremy L Thompson @brief Core logic for assembling operator diagonal or point block diagonal 254eaf62fffSJeremy L Thompson 255eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 256ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 257eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 258eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 259eaf62fffSJeremy L Thompson 260eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 261eaf62fffSJeremy L Thompson 262eaf62fffSJeremy L Thompson @ref Developer 263eaf62fffSJeremy L Thompson **/ 2642b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) { 265eaf62fffSJeremy L Thompson Ceed ceed; 2662b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 267eaf62fffSJeremy L Thompson 268eaf62fffSJeremy L Thompson // Assemble QFunction 269eaf62fffSJeremy L Thompson CeedQFunction qf; 2702b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 271eaf62fffSJeremy L Thompson CeedInt num_input_fields, num_output_fields; 2722b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields)); 273eaf62fffSJeremy L Thompson CeedVector assembled_qf; 274eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 2752b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr, request)); 276eaf62fffSJeremy L Thompson CeedInt layout[3]; 2772b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr, &layout)); 2782b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr)); 279eaf62fffSJeremy L Thompson 280ed9e99e6SJeremy L Thompson // Get assembly data 281ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 2822b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 283ed9e99e6SJeremy L Thompson const CeedEvalMode *eval_mode_in, *eval_mode_out; 284ed9e99e6SJeremy L Thompson CeedInt num_eval_mode_in, num_eval_mode_out; 2852b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out)); 286ed9e99e6SJeremy L Thompson CeedBasis basis_in, basis_out; 2872b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL)); 288ed9e99e6SJeremy L Thompson CeedInt num_comp; 2892b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp)); 290eaf62fffSJeremy L Thompson 291eaf62fffSJeremy L Thompson // Assemble point block diagonal restriction, if needed 292ed9e99e6SJeremy L Thompson CeedElemRestriction diag_rstr; 2932b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &diag_rstr)); 294eaf62fffSJeremy L Thompson if (is_pointblock) { 295ed9e99e6SJeremy L Thompson CeedElemRestriction point_block_rstr; 2962b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_rstr, &point_block_rstr)); 297ed9e99e6SJeremy L Thompson diag_rstr = point_block_rstr; 298eaf62fffSJeremy L Thompson } 299eaf62fffSJeremy L Thompson 300eaf62fffSJeremy L Thompson // Create diagonal vector 301eaf62fffSJeremy L Thompson CeedVector elem_diag; 3022b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(diag_rstr, NULL, &elem_diag)); 303eaf62fffSJeremy L Thompson 304eaf62fffSJeremy L Thompson // Assemble element operator diagonals 3059c774eddSJeremy L Thompson CeedScalar *elem_diag_array; 3069c774eddSJeremy L Thompson const CeedScalar *assembled_qf_array; 3072b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_diag, 0.0)); 3082b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array)); 3092b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 310eaf62fffSJeremy L Thompson CeedInt num_elem, num_nodes, num_qpts; 3112b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(diag_rstr, &num_elem)); 3122b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_in, &num_nodes)); 3132b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 314ed9e99e6SJeremy L Thompson 315eaf62fffSJeremy L Thompson // Basis matrices 316eaf62fffSJeremy L Thompson const CeedScalar *interp_in, *interp_out, *grad_in, *grad_out; 317eaf62fffSJeremy L Thompson CeedScalar *identity = NULL; 318ed9e99e6SJeremy L Thompson bool has_eval_none = false; 319ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_eval_mode_in; i++) { 320ed9e99e6SJeremy L Thompson has_eval_none = has_eval_none || (eval_mode_in[i] == CEED_EVAL_NONE); 321ed9e99e6SJeremy L Thompson } 322ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_eval_mode_out; i++) { 323ed9e99e6SJeremy L Thompson has_eval_none = has_eval_none || (eval_mode_out[i] == CEED_EVAL_NONE); 324ed9e99e6SJeremy L Thompson } 325ed9e99e6SJeremy L Thompson if (has_eval_none) { 3262b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * num_nodes, &identity)); 3272b730f8bSJeremy L Thompson for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0; 328eaf62fffSJeremy L Thompson } 3292b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(basis_in, &interp_in)); 3302b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(basis_out, &interp_out)); 3312b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(basis_in, &grad_in)); 3322b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(basis_out, &grad_out)); 333eaf62fffSJeremy L Thompson // Compute the diagonal of B^T D B 334eaf62fffSJeremy L Thompson // Each element 335eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 336eaf62fffSJeremy L Thompson CeedInt d_out = -1; 337eaf62fffSJeremy L Thompson // Each basis eval mode pair 338eaf62fffSJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) { 339eaf62fffSJeremy L Thompson const CeedScalar *bt = NULL; 3402b730f8bSJeremy L Thompson if (eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out += 1; 3412b730f8bSJeremy L Thompson CeedOperatorGetBasisPointer(eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * num_nodes], &bt); 342eaf62fffSJeremy L Thompson CeedInt d_in = -1; 343eaf62fffSJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) { 344eaf62fffSJeremy L Thompson const CeedScalar *b = NULL; 3452b730f8bSJeremy L Thompson if (eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in += 1; 3462b730f8bSJeremy L Thompson CeedOperatorGetBasisPointer(eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * num_nodes], &b); 347eaf62fffSJeremy L Thompson // Each component 3482b730f8bSJeremy L Thompson for (CeedInt c_out = 0; c_out < num_comp; c_out++) { 349eaf62fffSJeremy L Thompson // Each qpoint/node pair 3502b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 351eaf62fffSJeremy L Thompson if (is_pointblock) { 352eaf62fffSJeremy L Thompson // Point Block Diagonal 353eaf62fffSJeremy L Thompson for (CeedInt c_in = 0; c_in < num_comp; c_in++) { 354eaf62fffSJeremy L Thompson const CeedScalar qf_value = 3552b730f8bSJeremy L Thompson assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_in) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] + 3562b730f8bSJeremy L Thompson e * layout[2]]; 3572b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 358eaf62fffSJeremy L Thompson elem_diag_array[((e * num_comp + c_out) * num_comp + c_in) * num_nodes + n] += 359eaf62fffSJeremy L Thompson bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n]; 360eaf62fffSJeremy L Thompson } 3612b730f8bSJeremy L Thompson } 362eaf62fffSJeremy L Thompson } else { 363eaf62fffSJeremy L Thompson // Diagonal Only 364eaf62fffSJeremy L Thompson const CeedScalar qf_value = 3652b730f8bSJeremy L Thompson assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_out) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] + 3662b730f8bSJeremy L Thompson e * layout[2]]; 3672b730f8bSJeremy L Thompson for (CeedInt n = 0; n < num_nodes; n++) { 3682b730f8bSJeremy L Thompson elem_diag_array[(e * num_comp + c_out) * num_nodes + n] += bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n]; 369eaf62fffSJeremy L Thompson } 370eaf62fffSJeremy L Thompson } 371eaf62fffSJeremy L Thompson } 372eaf62fffSJeremy L Thompson } 3732b730f8bSJeremy L Thompson } 3742b730f8bSJeremy L Thompson } 3752b730f8bSJeremy L Thompson } 3762b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array)); 3772b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 378eaf62fffSJeremy L Thompson 379eaf62fffSJeremy L Thompson // Assemble local operator diagonal 3802b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(diag_rstr, CEED_TRANSPOSE, elem_diag, assembled, request)); 381eaf62fffSJeremy L Thompson 382eaf62fffSJeremy L Thompson // Cleanup 383eaf62fffSJeremy L Thompson if (is_pointblock) { 3842b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&diag_rstr)); 385eaf62fffSJeremy L Thompson } 3862b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 3872b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_diag)); 3882b730f8bSJeremy L Thompson CeedCall(CeedFree(&identity)); 389eaf62fffSJeremy L Thompson 390eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 391eaf62fffSJeremy L Thompson } 392eaf62fffSJeremy L Thompson 393eaf62fffSJeremy L Thompson /** 394eaf62fffSJeremy L Thompson @brief Core logic for assembling composite operator diagonal 395eaf62fffSJeremy L Thompson 396eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble point block diagonal 397ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE 398eaf62fffSJeremy L Thompson @param[in] is_pointblock Boolean flag to assemble diagonal or point block diagonal 399eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled diagonal 400eaf62fffSJeremy L Thompson 401eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 402eaf62fffSJeremy L Thompson 403eaf62fffSJeremy L Thompson @ref Developer 404eaf62fffSJeremy L Thompson **/ 4052b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock, 406eaf62fffSJeremy L Thompson CeedVector assembled) { 407eaf62fffSJeremy L Thompson CeedInt num_sub; 408eaf62fffSJeremy L Thompson CeedOperator *suboperators; 409c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub)); 410c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators)); 411eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_sub; i++) { 4126aa95790SJeremy L Thompson if (is_pointblock) { 4132b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request)); 4146aa95790SJeremy L Thompson } else { 4152b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request)); 4166aa95790SJeremy L Thompson } 417eaf62fffSJeremy L Thompson } 418eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 419eaf62fffSJeremy L Thompson } 420eaf62fffSJeremy L Thompson 421eaf62fffSJeremy L Thompson /** 422eaf62fffSJeremy L Thompson @brief Build nonzero pattern for non-composite operator 423eaf62fffSJeremy L Thompson 424eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssembleSymbolic() 425eaf62fffSJeremy L Thompson 426eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble nonzero pattern 427eaf62fffSJeremy L Thompson @param[in] offset Offset for number of entries 428eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 429eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 430eaf62fffSJeremy L Thompson 431eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 432eaf62fffSJeremy L Thompson 433eaf62fffSJeremy L Thompson @ref Developer 434eaf62fffSJeremy L Thompson **/ 4352b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) { 436f3d47e36SJeremy L Thompson Ceed ceed; 437f3d47e36SJeremy L Thompson bool is_composite; 438f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 439f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 440f3d47e36SJeremy L Thompson 441b275c451SJeremy L Thompson if (is_composite) { 442eaf62fffSJeremy L Thompson // LCOV_EXCL_START 4432b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 444eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 4452b730f8bSJeremy L Thompson } 446eaf62fffSJeremy L Thompson 447c9366a6bSJeremy L Thompson CeedSize num_nodes; 4482b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL)); 449eaf62fffSJeremy L Thompson CeedElemRestriction rstr_in; 4502b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in)); 451e79b91d9SJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 4522b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem)); 4532b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size)); 4542b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp)); 455eaf62fffSJeremy L Thompson CeedInt layout_er[3]; 4562b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er)); 457eaf62fffSJeremy L Thompson 458eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 459eaf62fffSJeremy L Thompson 460eaf62fffSJeremy L Thompson // Determine elem_dof relation 461eaf62fffSJeremy L Thompson CeedVector index_vec; 4622b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec)); 463eaf62fffSJeremy L Thompson CeedScalar *array; 4642b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array)); 465ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_nodes; i++) array[i] = i; 4662b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(index_vec, &array)); 467eaf62fffSJeremy L Thompson CeedVector elem_dof; 4682b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof)); 4692b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(elem_dof, 0.0)); 4702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE)); 471eaf62fffSJeremy L Thompson const CeedScalar *elem_dof_a; 4722b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a)); 4732b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&index_vec)); 474eaf62fffSJeremy L Thompson 475eaf62fffSJeremy L Thompson // Determine i, j locations for element matrices 476eaf62fffSJeremy L Thompson CeedInt count = 0; 477ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 478ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 479ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 480ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 481ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 4822b730f8bSJeremy L Thompson const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2]; 4832b730f8bSJeremy L Thompson const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2]; 484eaf62fffSJeremy L Thompson 485eaf62fffSJeremy L Thompson const CeedInt row = elem_dof_a[elem_dof_index_row]; 486eaf62fffSJeremy L Thompson const CeedInt col = elem_dof_a[elem_dof_index_col]; 487eaf62fffSJeremy L Thompson 488eaf62fffSJeremy L Thompson rows[offset + count] = row; 489eaf62fffSJeremy L Thompson cols[offset + count] = col; 490eaf62fffSJeremy L Thompson count++; 491eaf62fffSJeremy L Thompson } 492eaf62fffSJeremy L Thompson } 493eaf62fffSJeremy L Thompson } 494eaf62fffSJeremy L Thompson } 495eaf62fffSJeremy L Thompson } 4962b730f8bSJeremy L Thompson if (count != local_num_entries) { 497eaf62fffSJeremy L Thompson // LCOV_EXCL_START 498eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing assembled entries"); 499eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5002b730f8bSJeremy L Thompson } 5012b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a)); 5022b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&elem_dof)); 503eaf62fffSJeremy L Thompson 504eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 505eaf62fffSJeremy L Thompson } 506eaf62fffSJeremy L Thompson 507eaf62fffSJeremy L Thompson /** 508eaf62fffSJeremy L Thompson @brief Assemble nonzero entries for non-composite operator 509eaf62fffSJeremy L Thompson 510eaf62fffSJeremy L Thompson Users should generally use CeedOperatorLinearAssemble() 511eaf62fffSJeremy L Thompson 512eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 513ea61e9acSJeremy L Thompson @param[in] offset Offset for number of entries 514eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 515eaf62fffSJeremy L Thompson 516eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 517eaf62fffSJeremy L Thompson 518eaf62fffSJeremy L Thompson @ref Developer 519eaf62fffSJeremy L Thompson **/ 5202b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) { 521f3d47e36SJeremy L Thompson Ceed ceed; 522f3d47e36SJeremy L Thompson bool is_composite; 523f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 524f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 525f3d47e36SJeremy L Thompson 526f3d47e36SJeremy L Thompson if (is_composite) { 527eaf62fffSJeremy L Thompson // LCOV_EXCL_START 5282b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 529eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5302b730f8bSJeremy L Thompson } 531f3d47e36SJeremy L Thompson 532f3d47e36SJeremy L Thompson // Early exit for empty operator 533f3d47e36SJeremy L Thompson { 534f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 535f3d47e36SJeremy L Thompson 536f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 537f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 538f3d47e36SJeremy L Thompson } 539eaf62fffSJeremy L Thompson 540cefa2673SJeremy L Thompson if (op->LinearAssembleSingle) { 541cefa2673SJeremy L Thompson // Backend version 5422b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSingle(op, offset, values)); 543cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 544cefa2673SJeremy L Thompson } else { 545cefa2673SJeremy L Thompson // Operator fallback 546cefa2673SJeremy L Thompson CeedOperator op_fallback; 547cefa2673SJeremy L Thompson 5482b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 549cefa2673SJeremy L Thompson if (op_fallback) { 5502b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values)); 551cefa2673SJeremy L Thompson return CEED_ERROR_SUCCESS; 552cefa2673SJeremy L Thompson } 553cefa2673SJeremy L Thompson } 554cefa2673SJeremy L Thompson 555eaf62fffSJeremy L Thompson // Assemble QFunction 556eaf62fffSJeremy L Thompson CeedQFunction qf; 5572b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 558eaf62fffSJeremy L Thompson CeedVector assembled_qf; 559eaf62fffSJeremy L Thompson CeedElemRestriction rstr_q; 5602b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE)); 5611f9221feSJeremy L Thompson CeedSize qf_length; 5622b730f8bSJeremy L Thompson CeedCall(CeedVectorGetLength(assembled_qf, &qf_length)); 563eaf62fffSJeremy L Thompson 5647e7773b5SJeremy L Thompson CeedInt num_input_fields, num_output_fields; 565eaf62fffSJeremy L Thompson CeedOperatorField *input_fields; 566eaf62fffSJeremy L Thompson CeedOperatorField *output_fields; 5672b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields)); 568eaf62fffSJeremy L Thompson 569ed9e99e6SJeremy L Thompson // Get assembly data 570ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 5712b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data)); 572ed9e99e6SJeremy L Thompson const CeedEvalMode *eval_mode_in, *eval_mode_out; 573ed9e99e6SJeremy L Thompson CeedInt num_eval_mode_in, num_eval_mode_out; 5742b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out)); 575ed9e99e6SJeremy L Thompson CeedBasis basis_in, basis_out; 5762b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL)); 577eaf62fffSJeremy L Thompson 5782b730f8bSJeremy L Thompson if (num_eval_mode_in == 0 || num_eval_mode_out == 0) { 579eaf62fffSJeremy L Thompson // LCOV_EXCL_START 5802b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs"); 581eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 5822b730f8bSJeremy L Thompson } 583eaf62fffSJeremy L Thompson 584ed9e99e6SJeremy L Thompson CeedElemRestriction active_rstr; 585eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_qpts, num_comp; 5862b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr)); 5872b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem)); 5882b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size)); 5892b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp)); 5902b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts)); 591eaf62fffSJeremy L Thompson 592eaf62fffSJeremy L Thompson CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 593eaf62fffSJeremy L Thompson 594eaf62fffSJeremy L Thompson // loop over elements and put in data structure 595eaf62fffSJeremy L Thompson const CeedScalar *interp_in, *grad_in; 5962b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(basis_in, &interp_in)); 5972b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(basis_in, &grad_in)); 598eaf62fffSJeremy L Thompson 599eaf62fffSJeremy L Thompson const CeedScalar *assembled_qf_array; 6002b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array)); 601eaf62fffSJeremy L Thompson 602eaf62fffSJeremy L Thompson CeedInt layout_qf[3]; 6032b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf)); 6042b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_q)); 605eaf62fffSJeremy L Thompson 606eaf62fffSJeremy L Thompson // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order 607ed9e99e6SJeremy L Thompson const CeedScalar *B_mat_in, *B_mat_out; 6082b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &B_mat_in, NULL, &B_mat_out)); 609ed9e99e6SJeremy L Thompson CeedScalar BTD_mat[elem_size * num_qpts * num_eval_mode_in]; 610eaf62fffSJeremy L Thompson CeedScalar elem_mat[elem_size * elem_size]; 61192ae7e47SJeremy L Thompson CeedInt count = 0; 612eaf62fffSJeremy L Thompson CeedScalar *vals; 6132b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(values, CEED_MEM_HOST, &vals)); 614ed9e99e6SJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 615ed9e99e6SJeremy L Thompson for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) { 616ed9e99e6SJeremy L Thompson for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) { 617ed9e99e6SJeremy L Thompson // Compute B^T*D 618ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 619ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 620ed9e99e6SJeremy L Thompson for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) { 6212b730f8bSJeremy L Thompson const CeedInt btd_index = n * (num_qpts * num_eval_mode_in) + (num_eval_mode_in * q + e_in); 622067fd99fSJeremy L Thompson CeedScalar sum = 0.0; 623067fd99fSJeremy L Thompson for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) { 624ed9e99e6SJeremy L Thompson const CeedInt b_out_index = (num_eval_mode_out * q + e_out) * elem_size + n; 6252b730f8bSJeremy L Thompson const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_mode_out + e_out) * num_comp + comp_out; 6262b730f8bSJeremy L Thompson const CeedInt qf_index = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2]; 627067fd99fSJeremy L Thompson sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index]; 628eaf62fffSJeremy L Thompson } 629067fd99fSJeremy L Thompson BTD_mat[btd_index] = sum; 630ed9e99e6SJeremy L Thompson } 631ed9e99e6SJeremy L Thompson } 632eaf62fffSJeremy L Thompson } 633eaf62fffSJeremy L Thompson // form element matrix itself (for each block component) 6342b730f8bSJeremy L Thompson CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_mode_in)); 635eaf62fffSJeremy L Thompson 636eaf62fffSJeremy L Thompson // put element matrix in coordinate data structure 637ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < elem_size; i++) { 638ed9e99e6SJeremy L Thompson for (CeedInt j = 0; j < elem_size; j++) { 639eaf62fffSJeremy L Thompson vals[offset + count] = elem_mat[i * elem_size + j]; 640eaf62fffSJeremy L Thompson count++; 641eaf62fffSJeremy L Thompson } 642eaf62fffSJeremy L Thompson } 643eaf62fffSJeremy L Thompson } 644eaf62fffSJeremy L Thompson } 645eaf62fffSJeremy L Thompson } 6462b730f8bSJeremy L Thompson if (count != local_num_entries) { 647eaf62fffSJeremy L Thompson // LCOV_EXCL_START 648eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing entries"); 649eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 6502b730f8bSJeremy L Thompson } 6512b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(values, &vals)); 652eaf62fffSJeremy L Thompson 6532b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array)); 6542b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_qf)); 655eaf62fffSJeremy L Thompson 656eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 657eaf62fffSJeremy L Thompson } 658eaf62fffSJeremy L Thompson 659eaf62fffSJeremy L Thompson /** 660eaf62fffSJeremy L Thompson @brief Count number of entries for assembled CeedOperator 661eaf62fffSJeremy L Thompson 662eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 663eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in assembled representation 664eaf62fffSJeremy L Thompson 665eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 666eaf62fffSJeremy L Thompson 667eaf62fffSJeremy L Thompson @ref Utility 668eaf62fffSJeremy L Thompson **/ 6692b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) { 670b275c451SJeremy L Thompson bool is_composite; 671eaf62fffSJeremy L Thompson CeedElemRestriction rstr; 672eaf62fffSJeremy L Thompson CeedInt num_elem, elem_size, num_comp; 673eaf62fffSJeremy L Thompson 674b275c451SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 675b275c451SJeremy L Thompson if (is_composite) { 676eaf62fffSJeremy L Thompson // LCOV_EXCL_START 6772b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported"); 678eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 6792b730f8bSJeremy L Thompson } 6802b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr)); 6812b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 6822b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size)); 6832b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp)); 684eaf62fffSJeremy L Thompson *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem; 685eaf62fffSJeremy L Thompson 686eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 687eaf62fffSJeremy L Thompson } 688eaf62fffSJeremy L Thompson 689eaf62fffSJeremy L Thompson /** 690ea61e9acSJeremy L Thompson @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator 691eaf62fffSJeremy L Thompson 692eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 693*85bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 694eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 695eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 696*85bb9dcfSJeremy L Thompson @param[in] basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 697eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 698*85bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 699*85bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 700eaf62fffSJeremy L Thompson 701eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 702eaf62fffSJeremy L Thompson 703eaf62fffSJeremy L Thompson @ref Developer 704eaf62fffSJeremy L Thompson **/ 7052b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 7062b730f8bSJeremy L Thompson CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 707eaf62fffSJeremy L Thompson Ceed ceed; 708*85bb9dcfSJeremy L Thompson CeedVector mult_vec = NULL; 7092b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 710eaf62fffSJeremy L Thompson 711eaf62fffSJeremy L Thompson // Check for composite operator 712eaf62fffSJeremy L Thompson bool is_composite; 7132b730f8bSJeremy L Thompson CeedCall(CeedOperatorIsComposite(op_fine, &is_composite)); 7142b730f8bSJeremy L Thompson if (is_composite) { 715eaf62fffSJeremy L Thompson // LCOV_EXCL_START 7162b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported"); 717eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 7182b730f8bSJeremy L Thompson } 719eaf62fffSJeremy L Thompson 720eaf62fffSJeremy L Thompson // Coarse Grid 7212b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse)); 722eaf62fffSJeremy L Thompson CeedElemRestriction rstr_fine = NULL; 723eaf62fffSJeremy L Thompson // -- Clone input fields 72492ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) { 725eaf62fffSJeremy L Thompson if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) { 726eaf62fffSJeremy L Thompson rstr_fine = op_fine->input_fields[i]->elem_restr; 7272b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 728eaf62fffSJeremy L Thompson } else { 7292b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_restr, 7302b730f8bSJeremy L Thompson op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec)); 731eaf62fffSJeremy L Thompson } 732eaf62fffSJeremy L Thompson } 733eaf62fffSJeremy L Thompson // -- Clone output fields 73492ae7e47SJeremy L Thompson for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) { 735eaf62fffSJeremy L Thompson if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) { 7362b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE)); 737eaf62fffSJeremy L Thompson } else { 7382b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_restr, 7392b730f8bSJeremy L Thompson op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec)); 740eaf62fffSJeremy L Thompson } 741eaf62fffSJeremy L Thompson } 742af99e877SJeremy L Thompson // -- Clone QFunctionAssemblyData 7432b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled)); 744eaf62fffSJeremy L Thompson 745eaf62fffSJeremy L Thompson // Multiplicity vector 746*85bb9dcfSJeremy L Thompson if (op_restrict || op_prolong) { 747*85bb9dcfSJeremy L Thompson CeedVector mult_e_vec; 748*85bb9dcfSJeremy L Thompson 749*85bb9dcfSJeremy L Thompson if (!p_mult_fine) { 750*85bb9dcfSJeremy L Thompson // LCOV_EXCL_START 751*85bb9dcfSJeremy L Thompson return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector"); 752*85bb9dcfSJeremy L Thompson // LCOV_EXCL_STOP 753*85bb9dcfSJeremy L Thompson } 7542b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec)); 7552b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_e_vec, 0.0)); 7562b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE)); 7572b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(mult_vec, 0.0)); 7582b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE)); 7592b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_e_vec)); 7602b730f8bSJeremy L Thompson CeedCall(CeedVectorReciprocal(mult_vec)); 761*85bb9dcfSJeremy L Thompson } 762eaf62fffSJeremy L Thompson 763addd79feSZach Atkins // Clone name 764addd79feSZach Atkins bool has_name = op_fine->name; 765addd79feSZach Atkins size_t name_len = op_fine->name ? strlen(op_fine->name) : 0; 766addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name)); 767addd79feSZach Atkins 76883d6adf3SZach Atkins // Check that coarse to fine basis is provided if prolong/restrict operators are requested 76983d6adf3SZach Atkins if ((op_restrict || op_prolong) && !basis_c_to_f) { 77083d6adf3SZach Atkins // LCOV_EXCL_START 77183d6adf3SZach Atkins return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine basis"); 77283d6adf3SZach Atkins // LCOV_EXCL_STOP 77383d6adf3SZach Atkins } 77483d6adf3SZach Atkins 775*85bb9dcfSJeremy L Thompson // Restriction/Prolongation Operators 776eaf62fffSJeremy L Thompson CeedInt num_comp; 7772b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp)); 778addd79feSZach Atkins 779addd79feSZach Atkins // Restriction 780addd79feSZach Atkins if (op_restrict) { 781eaf62fffSJeremy L Thompson CeedInt *num_comp_r_data; 782*85bb9dcfSJeremy L Thompson CeedQFunction qf_restrict; 783*85bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_r; 784*85bb9dcfSJeremy L Thompson 785*85bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict)); 7862b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_r_data)); 787eaf62fffSJeremy L Thompson num_comp_r_data[0] = num_comp; 7882b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r)); 7892b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data)); 7902b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r)); 7912b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_r)); 7922b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE)); 7932b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE)); 7942b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP)); 7952b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp)); 796eaf62fffSJeremy L Thompson 7972b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict)); 7982b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 7992b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8002b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 801eaf62fffSJeremy L Thompson 802addd79feSZach Atkins // Set name 803addd79feSZach Atkins char *restriction_name; 804addd79feSZach Atkins CeedCall(CeedCalloc(17 + name_len, &restriction_name)); 805addd79feSZach Atkins sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 806addd79feSZach Atkins CeedCall(CeedOperatorSetName(*op_restrict, restriction_name)); 807addd79feSZach Atkins CeedCall(CeedFree(&restriction_name)); 808addd79feSZach Atkins 809addd79feSZach Atkins // Check 810addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_restrict)); 811addd79feSZach Atkins 812addd79feSZach Atkins // Cleanup 813addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_restrict)); 814addd79feSZach Atkins } 815addd79feSZach Atkins 816eaf62fffSJeremy L Thompson // Prolongation 817addd79feSZach Atkins if (op_prolong) { 818eaf62fffSJeremy L Thompson CeedInt *num_comp_p_data; 819*85bb9dcfSJeremy L Thompson CeedQFunction qf_prolong; 820*85bb9dcfSJeremy L Thompson CeedQFunctionContext ctx_p; 821*85bb9dcfSJeremy L Thompson 822*85bb9dcfSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong)); 8232b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_p_data)); 824eaf62fffSJeremy L Thompson num_comp_p_data[0] = num_comp; 8252b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p)); 8262b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data)); 8272b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p)); 8282b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_p)); 8292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP)); 8302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE)); 8312b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE)); 8322b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp)); 833eaf62fffSJeremy L Thompson 8342b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong)); 8352b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE)); 8362b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec)); 8372b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE)); 838eaf62fffSJeremy L Thompson 839addd79feSZach Atkins // Set name 840ea6b5821SJeremy L Thompson char *prolongation_name; 8412b730f8bSJeremy L Thompson CeedCall(CeedCalloc(18 + name_len, &prolongation_name)); 8422b730f8bSJeremy L Thompson sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : ""); 8432b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name)); 8442b730f8bSJeremy L Thompson CeedCall(CeedFree(&prolongation_name)); 845addd79feSZach Atkins 846addd79feSZach Atkins // Check 847addd79feSZach Atkins CeedCall(CeedOperatorCheckReady(*op_prolong)); 848addd79feSZach Atkins 849addd79feSZach Atkins // Cleanup 850addd79feSZach Atkins CeedCall(CeedQFunctionDestroy(&qf_prolong)); 851ea6b5821SJeremy L Thompson } 852ea6b5821SJeremy L Thompson 85358e4b056SJeremy L Thompson // Check 85458e4b056SJeremy L Thompson CeedCall(CeedOperatorCheckReady(*op_coarse)); 85558e4b056SJeremy L Thompson 856eaf62fffSJeremy L Thompson // Cleanup 8572b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&mult_vec)); 8582b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&basis_c_to_f)); 859805fe78eSJeremy L Thompson 860eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 861eaf62fffSJeremy L Thompson } 862eaf62fffSJeremy L Thompson 863eaf62fffSJeremy L Thompson /** 864eaf62fffSJeremy L Thompson @brief Build 1D mass matrix and Laplacian with perturbation 865eaf62fffSJeremy L Thompson 866eaf62fffSJeremy L Thompson @param[in] interp_1d Interpolation matrix in one dimension 867eaf62fffSJeremy L Thompson @param[in] grad_1d Gradient matrix in one dimension 868eaf62fffSJeremy L Thompson @param[in] q_weight_1d Quadrature weights in one dimension 869eaf62fffSJeremy L Thompson @param[in] P_1d Number of basis nodes in one dimension 870eaf62fffSJeremy L Thompson @param[in] Q_1d Number of quadrature points in one dimension 871eaf62fffSJeremy L Thompson @param[in] dim Dimension of basis 872eaf62fffSJeremy L Thompson @param[out] mass Assembled mass matrix in one dimension 873eaf62fffSJeremy L Thompson @param[out] laplace Assembled perturbed Laplacian in one dimension 874eaf62fffSJeremy L Thompson 875eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 876eaf62fffSJeremy L Thompson 877eaf62fffSJeremy L Thompson @ref Developer 878eaf62fffSJeremy L Thompson **/ 8792b730f8bSJeremy L Thompson CeedPragmaOptimizeOff static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, 8802b730f8bSJeremy L Thompson CeedInt P_1d, CeedInt Q_1d, CeedInt dim, CeedScalar *mass, CeedScalar *laplace) { 8812b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 882eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 883eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8842b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j]; 885eaf62fffSJeremy L Thompson mass[i + j * P_1d] = sum; 886eaf62fffSJeremy L Thompson } 8872b730f8bSJeremy L Thompson } 888eaf62fffSJeremy L Thompson // -- Laplacian 8892b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 890eaf62fffSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) { 891eaf62fffSJeremy L Thompson CeedScalar sum = 0.0; 8922b730f8bSJeremy L Thompson for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j]; 893eaf62fffSJeremy L Thompson laplace[i + j * P_1d] = sum; 894eaf62fffSJeremy L Thompson } 8952b730f8bSJeremy L Thompson } 896eaf62fffSJeremy L Thompson CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4; 8972b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation; 898eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 899eaf62fffSJeremy L Thompson } 900ea61e9acSJeremy L Thompson CeedPragmaOptimizeOn; 901eaf62fffSJeremy L Thompson 902eaf62fffSJeremy L Thompson /// @} 903eaf62fffSJeremy L Thompson 904eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 905480fae85SJeremy L Thompson /// CeedOperator Backend API 906480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 907480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend 908480fae85SJeremy L Thompson /// @{ 909480fae85SJeremy L Thompson 910480fae85SJeremy L Thompson /** 911480fae85SJeremy L Thompson @brief Create object holding CeedQFunction assembly data for CeedOperator 912480fae85SJeremy L Thompson 913480fae85SJeremy L Thompson @param[in] ceed A Ceed object where the CeedQFunctionAssemblyData will be created 914ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored 915480fae85SJeremy L Thompson 916480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 917480fae85SJeremy L Thompson 918480fae85SJeremy L Thompson @ref Backend 919480fae85SJeremy L Thompson **/ 920ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) { 9212b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 922480fae85SJeremy L Thompson (*data)->ref_count = 1; 923480fae85SJeremy L Thompson (*data)->ceed = ceed; 9242b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 925480fae85SJeremy L Thompson 926480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 927480fae85SJeremy L Thompson } 928480fae85SJeremy L Thompson 929480fae85SJeremy L Thompson /** 930480fae85SJeremy L Thompson @brief Increment the reference counter for a CeedQFunctionAssemblyData 931480fae85SJeremy L Thompson 932ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter 933480fae85SJeremy L Thompson 934480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 935480fae85SJeremy L Thompson 936480fae85SJeremy L Thompson @ref Backend 937480fae85SJeremy L Thompson **/ 938480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) { 939480fae85SJeremy L Thompson data->ref_count++; 940480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 941480fae85SJeremy L Thompson } 942480fae85SJeremy L Thompson 943480fae85SJeremy L Thompson /** 944beecbf24SJeremy L Thompson @brief Set re-use of CeedQFunctionAssemblyData 9458b919e6bSJeremy L Thompson 946ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark for reuse 947ea61e9acSJeremy L Thompson @param[in] reuse_data Boolean flag indicating data re-use 9488b919e6bSJeremy L Thompson 9498b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9508b919e6bSJeremy L Thompson 9518b919e6bSJeremy L Thompson @ref Backend 9528b919e6bSJeremy L Thompson **/ 9532b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) { 954beecbf24SJeremy L Thompson data->reuse_data = reuse_data; 955beecbf24SJeremy L Thompson data->needs_data_update = true; 956beecbf24SJeremy L Thompson return CEED_ERROR_SUCCESS; 957beecbf24SJeremy L Thompson } 958beecbf24SJeremy L Thompson 959beecbf24SJeremy L Thompson /** 960beecbf24SJeremy L Thompson @brief Mark QFunctionAssemblyData as stale 961beecbf24SJeremy L Thompson 962ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to mark as stale 963ea61e9acSJeremy L Thompson @param[in] needs_data_update Boolean flag indicating if update is needed or completed 964beecbf24SJeremy L Thompson 965beecbf24SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 966beecbf24SJeremy L Thompson 967beecbf24SJeremy L Thompson @ref Backend 968beecbf24SJeremy L Thompson **/ 9692b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) { 970beecbf24SJeremy L Thompson data->needs_data_update = needs_data_update; 9718b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9728b919e6bSJeremy L Thompson } 9738b919e6bSJeremy L Thompson 9748b919e6bSJeremy L Thompson /** 9758b919e6bSJeremy L Thompson @brief Determine if QFunctionAssemblyData needs update 9768b919e6bSJeremy L Thompson 9778b919e6bSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to mark as stale 9788b919e6bSJeremy L Thompson @param[out] is_update_needed Boolean flag indicating if re-assembly is required 9798b919e6bSJeremy L Thompson 9808b919e6bSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 9818b919e6bSJeremy L Thompson 9828b919e6bSJeremy L Thompson @ref Backend 9838b919e6bSJeremy L Thompson **/ 9842b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) { 985beecbf24SJeremy L Thompson *is_update_needed = !data->reuse_data || data->needs_data_update; 9868b919e6bSJeremy L Thompson return CEED_ERROR_SUCCESS; 9878b919e6bSJeremy L Thompson } 9888b919e6bSJeremy L Thompson 9898b919e6bSJeremy L Thompson /** 990ea61e9acSJeremy L Thompson @brief Copy the pointer to a CeedQFunctionAssemblyData. 991ea61e9acSJeremy L Thompson Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`. 992ea61e9acSJeremy L Thompson Note: If `*data_copy` is non-NULL, then it is assumed that `*data_copy` is a pointer to a CeedQFunctionAssemblyData. 993ea61e9acSJeremy L Thompson This CeedQFunctionAssemblyData will be destroyed if `*data_copy` is the only reference to this CeedQFunctionAssemblyData. 994480fae85SJeremy L Thompson 995ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to copy reference to 996ea61e9acSJeremy L Thompson @param[in,out] data_copy Variable to store copied reference 997480fae85SJeremy L Thompson 998480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 999480fae85SJeremy L Thompson 1000480fae85SJeremy L Thompson @ref Backend 1001480fae85SJeremy L Thompson **/ 10022b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) { 10032b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataReference(data)); 10042b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy)); 1005480fae85SJeremy L Thompson *data_copy = data; 1006480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1007480fae85SJeremy L Thompson } 1008480fae85SJeremy L Thompson 1009480fae85SJeremy L Thompson /** 1010480fae85SJeremy L Thompson @brief Get setup status for internal objects for CeedQFunctionAssemblyData 1011480fae85SJeremy L Thompson 1012ea61e9acSJeremy L Thompson @param[in] data CeedQFunctionAssemblyData to retrieve status 1013480fae85SJeremy L Thompson @param[out] is_setup Boolean flag for setup status 1014480fae85SJeremy L Thompson 1015480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1016480fae85SJeremy L Thompson 1017480fae85SJeremy L Thompson @ref Backend 1018480fae85SJeremy L Thompson **/ 10192b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) { 1020480fae85SJeremy L Thompson *is_setup = data->is_setup; 1021480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1022480fae85SJeremy L Thompson } 1023480fae85SJeremy L Thompson 1024480fae85SJeremy L Thompson /** 1025480fae85SJeremy L Thompson @brief Set internal objects for CeedQFunctionAssemblyData 1026480fae85SJeremy L Thompson 1027ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to set objects 1028480fae85SJeremy L Thompson @param[in] vec CeedVector to store assembled CeedQFunction at quadrature points 1029480fae85SJeremy L Thompson @param[in] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1030480fae85SJeremy L Thompson 1031480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1032480fae85SJeremy L Thompson 1033480fae85SJeremy L Thompson @ref Backend 1034480fae85SJeremy L Thompson **/ 10352b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) { 10362b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(vec, &data->vec)); 10372b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr)); 1038480fae85SJeremy L Thompson 1039480fae85SJeremy L Thompson data->is_setup = true; 1040480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1041480fae85SJeremy L Thompson } 1042480fae85SJeremy L Thompson 10432b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) { 10442b730f8bSJeremy L Thompson if (!data->is_setup) { 1045480fae85SJeremy L Thompson // LCOV_EXCL_START 10462b730f8bSJeremy L Thompson return CeedError(data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first."); 1047480fae85SJeremy L Thompson // LCOV_EXCL_STOP 10482b730f8bSJeremy L Thompson } 1049480fae85SJeremy L Thompson 10502b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(data->vec, vec)); 10512b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr)); 1052480fae85SJeremy L Thompson 1053480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1054480fae85SJeremy L Thompson } 1055480fae85SJeremy L Thompson 1056480fae85SJeremy L Thompson /** 1057480fae85SJeremy L Thompson @brief Destroy CeedQFunctionAssemblyData 1058480fae85SJeremy L Thompson 1059ea61e9acSJeremy L Thompson @param[in,out] data CeedQFunctionAssemblyData to destroy 1060480fae85SJeremy L Thompson 1061480fae85SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1062480fae85SJeremy L Thompson 1063480fae85SJeremy L Thompson @ref Backend 1064480fae85SJeremy L Thompson **/ 1065480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) { 1066480fae85SJeremy L Thompson if (!*data || --(*data)->ref_count > 0) return CEED_ERROR_SUCCESS; 1067480fae85SJeremy L Thompson 10682b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 10692b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&(*data)->vec)); 10702b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr)); 1071480fae85SJeremy L Thompson 10722b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1073480fae85SJeremy L Thompson return CEED_ERROR_SUCCESS; 1074480fae85SJeremy L Thompson } 1075480fae85SJeremy L Thompson 1076ed9e99e6SJeremy L Thompson /** 1077ed9e99e6SJeremy L Thompson @brief Get CeedOperatorAssemblyData 1078ed9e99e6SJeremy L Thompson 1079ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to assemble 1080ed9e99e6SJeremy L Thompson @param[out] data CeedQFunctionAssemblyData 1081ed9e99e6SJeremy L Thompson 1082ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1083ed9e99e6SJeremy L Thompson 1084ed9e99e6SJeremy L Thompson @ref Backend 1085ed9e99e6SJeremy L Thompson **/ 10862b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) { 1087ed9e99e6SJeremy L Thompson if (!op->op_assembled) { 1088ed9e99e6SJeremy L Thompson CeedOperatorAssemblyData data; 1089ed9e99e6SJeremy L Thompson 10902b730f8bSJeremy L Thompson CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data)); 1091ed9e99e6SJeremy L Thompson op->op_assembled = data; 1092ed9e99e6SJeremy L Thompson } 1093ed9e99e6SJeremy L Thompson *data = op->op_assembled; 1094ed9e99e6SJeremy L Thompson 1095ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1096ed9e99e6SJeremy L Thompson } 1097ed9e99e6SJeremy L Thompson 1098ed9e99e6SJeremy L Thompson /** 1099ed9e99e6SJeremy L Thompson @brief Create object holding CeedOperator assembly data 1100ed9e99e6SJeremy L Thompson 1101ea61e9acSJeremy L Thompson @param[in] ceed Ceed object where the CeedOperatorAssemblyData will be created 1102ed9e99e6SJeremy L Thompson @param[in] op CeedOperator to be assembled 1103ea61e9acSJeremy L Thompson @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored 1104ed9e99e6SJeremy L Thompson 1105ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1106ed9e99e6SJeremy L Thompson 1107ed9e99e6SJeremy L Thompson @ref Backend 1108ed9e99e6SJeremy L Thompson **/ 11092b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) { 11102b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, data)); 1111ed9e99e6SJeremy L Thompson (*data)->ceed = ceed; 11122b730f8bSJeremy L Thompson CeedCall(CeedReference(ceed)); 1113ed9e99e6SJeremy L Thompson 1114ed9e99e6SJeremy L Thompson // Build OperatorAssembly data 1115ed9e99e6SJeremy L Thompson CeedQFunction qf; 1116ed9e99e6SJeremy L Thompson CeedQFunctionField *qf_fields; 1117ed9e99e6SJeremy L Thompson CeedOperatorField *op_fields; 1118ed9e99e6SJeremy L Thompson CeedInt num_input_fields; 11192b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 11202b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL)); 11212b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL)); 1122ed9e99e6SJeremy L Thompson 1123ed9e99e6SJeremy L Thompson // Determine active input basis 1124ed9e99e6SJeremy L Thompson CeedInt num_eval_mode_in = 0, dim = 1; 1125ed9e99e6SJeremy L Thompson CeedEvalMode *eval_mode_in = NULL; 1126ed9e99e6SJeremy L Thompson CeedBasis basis_in = NULL; 1127ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 1128ed9e99e6SJeremy L Thompson CeedVector vec; 11292b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1130ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 11312b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in)); 11322b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_in, &dim)); 1133ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 11342b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1135ed9e99e6SJeremy L Thompson switch (eval_mode) { 1136ed9e99e6SJeremy L Thompson case CEED_EVAL_NONE: 1137ed9e99e6SJeremy L Thompson case CEED_EVAL_INTERP: 11382b730f8bSJeremy L Thompson CeedCall(CeedRealloc(num_eval_mode_in + 1, &eval_mode_in)); 1139ed9e99e6SJeremy L Thompson eval_mode_in[num_eval_mode_in] = eval_mode; 1140ed9e99e6SJeremy L Thompson num_eval_mode_in += 1; 1141ed9e99e6SJeremy L Thompson break; 1142ed9e99e6SJeremy L Thompson case CEED_EVAL_GRAD: 11432b730f8bSJeremy L Thompson CeedCall(CeedRealloc(num_eval_mode_in + dim, &eval_mode_in)); 1144ed9e99e6SJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 1145ed9e99e6SJeremy L Thompson eval_mode_in[num_eval_mode_in + d] = eval_mode; 1146ed9e99e6SJeremy L Thompson } 1147ed9e99e6SJeremy L Thompson num_eval_mode_in += dim; 1148ed9e99e6SJeremy L Thompson break; 1149ed9e99e6SJeremy L Thompson case CEED_EVAL_WEIGHT: 1150ed9e99e6SJeremy L Thompson case CEED_EVAL_DIV: 1151ed9e99e6SJeremy L Thompson case CEED_EVAL_CURL: 1152ed9e99e6SJeremy L Thompson break; // Caught by QF Assembly 1153ed9e99e6SJeremy L Thompson } 1154ed9e99e6SJeremy L Thompson } 1155ed9e99e6SJeremy L Thompson } 1156ed9e99e6SJeremy L Thompson (*data)->num_eval_mode_in = num_eval_mode_in; 1157ed9e99e6SJeremy L Thompson (*data)->eval_mode_in = eval_mode_in; 11582b730f8bSJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->basis_in)); 1159ed9e99e6SJeremy L Thompson 1160ed9e99e6SJeremy L Thompson // Determine active output basis 1161ed9e99e6SJeremy L Thompson CeedInt num_output_fields; 11622b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields)); 11632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields)); 1164ed9e99e6SJeremy L Thompson CeedInt num_eval_mode_out = 0; 1165ed9e99e6SJeremy L Thompson CeedEvalMode *eval_mode_out = NULL; 1166ed9e99e6SJeremy L Thompson CeedBasis basis_out = NULL; 1167ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < num_output_fields; i++) { 1168ed9e99e6SJeremy L Thompson CeedVector vec; 11692b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 1170ed9e99e6SJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 11712b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out)); 1172ed9e99e6SJeremy L Thompson CeedEvalMode eval_mode; 11732b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 1174ed9e99e6SJeremy L Thompson switch (eval_mode) { 1175ed9e99e6SJeremy L Thompson case CEED_EVAL_NONE: 1176ed9e99e6SJeremy L Thompson case CEED_EVAL_INTERP: 11772b730f8bSJeremy L Thompson CeedCall(CeedRealloc(num_eval_mode_out + 1, &eval_mode_out)); 1178ed9e99e6SJeremy L Thompson eval_mode_out[num_eval_mode_out] = eval_mode; 1179ed9e99e6SJeremy L Thompson num_eval_mode_out += 1; 1180ed9e99e6SJeremy L Thompson break; 1181ed9e99e6SJeremy L Thompson case CEED_EVAL_GRAD: 11822b730f8bSJeremy L Thompson CeedCall(CeedRealloc(num_eval_mode_out + dim, &eval_mode_out)); 1183ed9e99e6SJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 1184ed9e99e6SJeremy L Thompson eval_mode_out[num_eval_mode_out + d] = eval_mode; 1185ed9e99e6SJeremy L Thompson } 1186ed9e99e6SJeremy L Thompson num_eval_mode_out += dim; 1187ed9e99e6SJeremy L Thompson break; 1188ed9e99e6SJeremy L Thompson case CEED_EVAL_WEIGHT: 1189ed9e99e6SJeremy L Thompson case CEED_EVAL_DIV: 1190ed9e99e6SJeremy L Thompson case CEED_EVAL_CURL: 1191ed9e99e6SJeremy L Thompson break; // Caught by QF Assembly 1192ed9e99e6SJeremy L Thompson } 1193ed9e99e6SJeremy L Thompson } 1194ed9e99e6SJeremy L Thompson } 1195ed9e99e6SJeremy L Thompson (*data)->num_eval_mode_out = num_eval_mode_out; 1196ed9e99e6SJeremy L Thompson (*data)->eval_mode_out = eval_mode_out; 11972b730f8bSJeremy L Thompson CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->basis_out)); 1198ed9e99e6SJeremy L Thompson 1199ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1200ed9e99e6SJeremy L Thompson } 1201ed9e99e6SJeremy L Thompson 1202ed9e99e6SJeremy L Thompson /** 1203ed9e99e6SJeremy L Thompson @brief Get CeedOperator CeedEvalModes for assembly 1204ed9e99e6SJeremy L Thompson 1205ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1206ed9e99e6SJeremy L Thompson @param[out] num_eval_mode_in Pointer to hold number of input CeedEvalModes, or NULL 1207ed9e99e6SJeremy L Thompson @param[out] eval_mode_in Pointer to hold input CeedEvalModes, or NULL 1208ed9e99e6SJeremy L Thompson @param[out] num_eval_mode_out Pointer to hold number of output CeedEvalModes, or NULL 1209ed9e99e6SJeremy L Thompson @param[out] eval_mode_out Pointer to hold output CeedEvalModes, or NULL 1210ed9e99e6SJeremy L Thompson 1211ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1212ed9e99e6SJeremy L Thompson 1213ed9e99e6SJeremy L Thompson @ref Backend 1214ed9e99e6SJeremy L Thompson **/ 12152b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_eval_mode_in, const CeedEvalMode **eval_mode_in, 1216ed9e99e6SJeremy L Thompson CeedInt *num_eval_mode_out, const CeedEvalMode **eval_mode_out) { 1217ed9e99e6SJeremy L Thompson if (num_eval_mode_in) *num_eval_mode_in = data->num_eval_mode_in; 1218ed9e99e6SJeremy L Thompson if (eval_mode_in) *eval_mode_in = data->eval_mode_in; 1219ed9e99e6SJeremy L Thompson if (num_eval_mode_out) *num_eval_mode_out = data->num_eval_mode_out; 1220ed9e99e6SJeremy L Thompson if (eval_mode_out) *eval_mode_out = data->eval_mode_out; 1221ed9e99e6SJeremy L Thompson 1222ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1223ed9e99e6SJeremy L Thompson } 1224ed9e99e6SJeremy L Thompson 1225ed9e99e6SJeremy L Thompson /** 1226ed9e99e6SJeremy L Thompson @brief Get CeedOperator CeedBasis data for assembly 1227ed9e99e6SJeremy L Thompson 1228ed9e99e6SJeremy L Thompson @param[in] data CeedOperatorAssemblyData 1229ed9e99e6SJeremy L Thompson @param[out] basis_in Pointer to hold active input CeedBasis, or NULL 1230ed9e99e6SJeremy L Thompson @param[out] B_in Pointer to hold assembled active input B, or NULL 1231ed9e99e6SJeremy L Thompson @param[out] basis_out Pointer to hold active output CeedBasis, or NULL 1232ed9e99e6SJeremy L Thompson @param[out] B_out Pointer to hold assembled active output B, or NULL 1233ed9e99e6SJeremy L Thompson 1234ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1235ed9e99e6SJeremy L Thompson 1236ed9e99e6SJeremy L Thompson @ref Backend 1237ed9e99e6SJeremy L Thompson **/ 12382b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedBasis *basis_in, const CeedScalar **B_in, CeedBasis *basis_out, 1239ed9e99e6SJeremy L Thompson const CeedScalar **B_out) { 1240ed9e99e6SJeremy L Thompson // Assemble B_in, B_out if needed 1241ed9e99e6SJeremy L Thompson if (B_in && !data->B_in) { 1242ed9e99e6SJeremy L Thompson CeedInt num_qpts, elem_size; 1243ed9e99e6SJeremy L Thompson CeedScalar *B_in, *identity = NULL; 1244ed9e99e6SJeremy L Thompson const CeedScalar *interp_in, *grad_in; 1245ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1246ed9e99e6SJeremy L Thompson 12472b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_in, &num_qpts)); 12482b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(data->basis_in, &elem_size)); 12492b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_in, &B_in)); 1250ed9e99e6SJeremy L Thompson 1251ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_mode_in; i++) { 1252ed9e99e6SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_mode_in[i] == CEED_EVAL_NONE); 1253ed9e99e6SJeremy L Thompson } 1254ed9e99e6SJeremy L Thompson if (has_eval_none) { 12552b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size, &identity)); 1256ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) { 1257ed9e99e6SJeremy L Thompson identity[i * elem_size + i] = 1.0; 1258ed9e99e6SJeremy L Thompson } 1259ed9e99e6SJeremy L Thompson } 12602b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(data->basis_in, &interp_in)); 12612b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(data->basis_in, &grad_in)); 1262ed9e99e6SJeremy L Thompson 1263ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1264ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 1265ed9e99e6SJeremy L Thompson CeedInt d_in = -1; 1266ed9e99e6SJeremy L Thompson for (CeedInt e_in = 0; e_in < data->num_eval_mode_in; e_in++) { 1267ed9e99e6SJeremy L Thompson const CeedInt qq = data->num_eval_mode_in * q; 1268ed9e99e6SJeremy L Thompson const CeedScalar *b = NULL; 1269ed9e99e6SJeremy L Thompson 1270ed9e99e6SJeremy L Thompson if (data->eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in++; 12712b730f8bSJeremy L Thompson CeedOperatorGetBasisPointer(data->eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * elem_size], &b); 1272ed9e99e6SJeremy L Thompson B_in[(qq + e_in) * elem_size + n] = b[q * elem_size + n]; 1273ed9e99e6SJeremy L Thompson } 1274ed9e99e6SJeremy L Thompson } 1275ed9e99e6SJeremy L Thompson } 1276ed9e99e6SJeremy L Thompson data->B_in = B_in; 1277ed9e99e6SJeremy L Thompson } 1278ed9e99e6SJeremy L Thompson 1279ed9e99e6SJeremy L Thompson if (B_out && !data->B_out) { 1280ed9e99e6SJeremy L Thompson CeedInt num_qpts, elem_size; 1281ed9e99e6SJeremy L Thompson CeedScalar *B_out, *identity = NULL; 1282ed9e99e6SJeremy L Thompson const CeedScalar *interp_out, *grad_out; 1283ed9e99e6SJeremy L Thompson bool has_eval_none = false; 1284ed9e99e6SJeremy L Thompson 12852b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_out, &num_qpts)); 12862b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(data->basis_out, &elem_size)); 12872b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_out, &B_out)); 1288ed9e99e6SJeremy L Thompson 1289ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < data->num_eval_mode_out; i++) { 1290ed9e99e6SJeremy L Thompson has_eval_none = has_eval_none || (data->eval_mode_out[i] == CEED_EVAL_NONE); 1291ed9e99e6SJeremy L Thompson } 1292ed9e99e6SJeremy L Thompson if (has_eval_none) { 12932b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_qpts * elem_size, &identity)); 1294ed9e99e6SJeremy L Thompson for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) { 1295ed9e99e6SJeremy L Thompson identity[i * elem_size + i] = 1.0; 1296ed9e99e6SJeremy L Thompson } 1297ed9e99e6SJeremy L Thompson } 12982b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp(data->basis_out, &interp_out)); 12992b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad(data->basis_out, &grad_out)); 1300ed9e99e6SJeremy L Thompson 1301ed9e99e6SJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 1302ed9e99e6SJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 1303ed9e99e6SJeremy L Thompson CeedInt d_out = -1; 1304ed9e99e6SJeremy L Thompson for (CeedInt e_out = 0; e_out < data->num_eval_mode_out; e_out++) { 1305ed9e99e6SJeremy L Thompson const CeedInt qq = data->num_eval_mode_out * q; 1306ed9e99e6SJeremy L Thompson const CeedScalar *b = NULL; 1307ed9e99e6SJeremy L Thompson 1308ed9e99e6SJeremy L Thompson if (data->eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out++; 13092b730f8bSJeremy L Thompson CeedOperatorGetBasisPointer(data->eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * elem_size], &b); 1310ed9e99e6SJeremy L Thompson B_out[(qq + e_out) * elem_size + n] = b[q * elem_size + n]; 1311ed9e99e6SJeremy L Thompson } 1312ed9e99e6SJeremy L Thompson } 1313ed9e99e6SJeremy L Thompson } 1314ed9e99e6SJeremy L Thompson data->B_out = B_out; 1315ed9e99e6SJeremy L Thompson } 1316ed9e99e6SJeremy L Thompson 1317ed9e99e6SJeremy L Thompson if (basis_in) *basis_in = data->basis_in; 1318ed9e99e6SJeremy L Thompson if (B_in) *B_in = data->B_in; 1319ed9e99e6SJeremy L Thompson if (basis_out) *basis_out = data->basis_out; 1320ed9e99e6SJeremy L Thompson if (B_out) *B_out = data->B_out; 1321ed9e99e6SJeremy L Thompson 1322ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1323ed9e99e6SJeremy L Thompson } 1324ed9e99e6SJeremy L Thompson 1325ed9e99e6SJeremy L Thompson /** 1326ed9e99e6SJeremy L Thompson @brief Destroy CeedOperatorAssemblyData 1327ed9e99e6SJeremy L Thompson 1328ea61e9acSJeremy L Thompson @param[in,out] data CeedOperatorAssemblyData to destroy 1329ed9e99e6SJeremy L Thompson 1330ed9e99e6SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1331ed9e99e6SJeremy L Thompson 1332ed9e99e6SJeremy L Thompson @ref Backend 1333ed9e99e6SJeremy L Thompson **/ 1334ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) { 1335ed9e99e6SJeremy L Thompson if (!*data) return CEED_ERROR_SUCCESS; 1336ed9e99e6SJeremy L Thompson 13372b730f8bSJeremy L Thompson CeedCall(CeedDestroy(&(*data)->ceed)); 13382b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->basis_in)); 13392b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&(*data)->basis_out)); 13402b730f8bSJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_in)); 13412b730f8bSJeremy L Thompson CeedCall(CeedFree(&(*data)->eval_mode_out)); 13422b730f8bSJeremy L Thompson CeedCall(CeedFree(&(*data)->B_in)); 13432b730f8bSJeremy L Thompson CeedCall(CeedFree(&(*data)->B_out)); 1344ed9e99e6SJeremy L Thompson 13452b730f8bSJeremy L Thompson CeedCall(CeedFree(data)); 1346ed9e99e6SJeremy L Thompson return CEED_ERROR_SUCCESS; 1347ed9e99e6SJeremy L Thompson } 1348ed9e99e6SJeremy L Thompson 1349480fae85SJeremy L Thompson /// @} 1350480fae85SJeremy L Thompson 1351480fae85SJeremy L Thompson /// ---------------------------------------------------------------------------- 1352eaf62fffSJeremy L Thompson /// CeedOperator Public API 1353eaf62fffSJeremy L Thompson /// ---------------------------------------------------------------------------- 1354eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser 1355eaf62fffSJeremy L Thompson /// @{ 1356eaf62fffSJeremy L Thompson 1357eaf62fffSJeremy L Thompson /** 1358eaf62fffSJeremy L Thompson @brief Assemble a linear CeedQFunction associated with a CeedOperator 1359eaf62fffSJeremy L Thompson 1360ea61e9acSJeremy L Thompson This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator. 1361ea61e9acSJeremy L Thompson The vector 'assembled' is of shape [num_elements, num_input_fields, num_output_fields, num_quad_points] and contains column-major matrices 1362ea61e9acSJeremy L Thompson representing the action of the CeedQFunction for a corresponding quadrature point on an element. Inputs and outputs are in the order provided by the 1363ea61e9acSJeremy L Thompson user when adding CeedOperator fields. For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, 1364ea61e9acSJeremy L Thompson would result in an assembled QFunction that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] 1365ea61e9acSJeremy L Thompson and producing the output [dv_0, dv_1, v]. 1366eaf62fffSJeremy L Thompson 1367ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1368f04ea552SJeremy L Thompson 1369ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1370ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1371ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction 1372ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1373eaf62fffSJeremy L Thompson 1374eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1375eaf62fffSJeremy L Thompson 1376eaf62fffSJeremy L Thompson @ref User 1377eaf62fffSJeremy L Thompson **/ 13782b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 13792b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1380eaf62fffSJeremy L Thompson 1381eaf62fffSJeremy L Thompson if (op->LinearAssembleQFunction) { 1382d04bbc78SJeremy L Thompson // Backend version 13832b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request)); 1384eaf62fffSJeremy L Thompson } else { 1385d04bbc78SJeremy L Thompson // Operator fallback 1386d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1387d04bbc78SJeremy L Thompson 13882b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1389d04bbc78SJeremy L Thompson if (op_fallback) { 13902b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request)); 1391d04bbc78SJeremy L Thompson } else { 1392d04bbc78SJeremy L Thompson // LCOV_EXCL_START 13932b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction"); 1394d04bbc78SJeremy L Thompson // LCOV_EXCL_STOP 1395d04bbc78SJeremy L Thompson } 139670a7ffb3SJeremy L Thompson } 1397eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1398eaf62fffSJeremy L Thompson } 139970a7ffb3SJeremy L Thompson 140070a7ffb3SJeremy L Thompson /** 1401ea61e9acSJeremy L Thompson @brief Assemble CeedQFunction and store result internally. 1402ea61e9acSJeremy L Thompson Return copied references of stored data to the caller. 1403ea61e9acSJeremy L Thompson Caller is responsible for ownership and destruction of the copied references. 1404ea61e9acSJeremy L Thompson See also @ref CeedOperatorLinearAssembleQFunction 140570a7ffb3SJeremy L Thompson 1406ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1407ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points 1408ea61e9acSJeremy L Thompson @param[out] rstr CeedElemRestriction for CeedVector containing assembledCeedQFunction 1409ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 141070a7ffb3SJeremy L Thompson 141170a7ffb3SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 141270a7ffb3SJeremy L Thompson 141370a7ffb3SJeremy L Thompson @ref User 141470a7ffb3SJeremy L Thompson **/ 14152b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) { 14162b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 141770a7ffb3SJeremy L Thompson 141870a7ffb3SJeremy L Thompson if (op->LinearAssembleQFunctionUpdate) { 1419d04bbc78SJeremy L Thompson // Backend version 1420480fae85SJeremy L Thompson bool qf_assembled_is_setup; 14212efa2d85SJeremy L Thompson CeedVector assembled_vec = NULL; 14222efa2d85SJeremy L Thompson CeedElemRestriction assembled_rstr = NULL; 1423480fae85SJeremy L Thompson 14242b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup)); 1425480fae85SJeremy L Thompson if (qf_assembled_is_setup) { 1426d04bbc78SJeremy L Thompson bool update_needed; 1427d04bbc78SJeremy L Thompson 14282b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr)); 14292b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed)); 14308b919e6bSJeremy L Thompson if (update_needed) { 14312b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request)); 14328b919e6bSJeremy L Thompson } 143370a7ffb3SJeremy L Thompson } else { 14342b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request)); 14352b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr)); 143670a7ffb3SJeremy L Thompson } 14372b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false)); 14382efa2d85SJeremy L Thompson 1439d04bbc78SJeremy L Thompson // Copy reference from internally held copy 144070a7ffb3SJeremy L Thompson *assembled = NULL; 144170a7ffb3SJeremy L Thompson *rstr = NULL; 14422b730f8bSJeremy L Thompson CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled)); 14432b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled_vec)); 14442b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr)); 14452b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&assembled_rstr)); 144670a7ffb3SJeremy L Thompson } else { 1447d04bbc78SJeremy L Thompson // Operator fallback 1448d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1449d04bbc78SJeremy L Thompson 14502b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1451d04bbc78SJeremy L Thompson if (op_fallback) { 14522b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request)); 1453d04bbc78SJeremy L Thompson } else { 1454d04bbc78SJeremy L Thompson // LCOV_EXCL_START 14552b730f8bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate"); 1456d04bbc78SJeremy L Thompson // LCOV_EXCL_STOP 145770a7ffb3SJeremy L Thompson } 145870a7ffb3SJeremy L Thompson } 145970a7ffb3SJeremy L Thompson 146070a7ffb3SJeremy L Thompson return CEED_ERROR_SUCCESS; 1461eaf62fffSJeremy L Thompson } 1462eaf62fffSJeremy L Thompson 1463eaf62fffSJeremy L Thompson /** 1464eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1465eaf62fffSJeremy L Thompson 1466eaf62fffSJeremy L Thompson This overwrites a CeedVector with the diagonal of a linear CeedOperator. 1467eaf62fffSJeremy L Thompson 1468ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1469eaf62fffSJeremy L Thompson 1470ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1471f04ea552SJeremy L Thompson 1472ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1473eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1474ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1475eaf62fffSJeremy L Thompson 1476eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1477eaf62fffSJeremy L Thompson 1478eaf62fffSJeremy L Thompson @ref User 1479eaf62fffSJeremy L Thompson **/ 14802b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1481f3d47e36SJeremy L Thompson bool is_composite; 14822b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1483f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1484eaf62fffSJeremy L Thompson 1485c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 14862b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 14872b730f8bSJeremy L Thompson if (input_size != output_size) { 1488c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1489c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1490c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 14912b730f8bSJeremy L Thompson } 1492c9366a6bSJeremy L Thompson 1493f3d47e36SJeremy L Thompson // Early exit for empty operator 1494f3d47e36SJeremy L Thompson if (!is_composite) { 1495f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1496f3d47e36SJeremy L Thompson 1497f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1498f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1499f3d47e36SJeremy L Thompson } 1500f3d47e36SJeremy L Thompson 1501eaf62fffSJeremy L Thompson if (op->LinearAssembleDiagonal) { 1502d04bbc78SJeremy L Thompson // Backend version 15032b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleDiagonal(op, assembled, request)); 1504eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1505eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddDiagonal) { 1506d04bbc78SJeremy L Thompson // Backend version with zeroing first 15072b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 15082b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1509eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1510eaf62fffSJeremy L Thompson } else { 1511d04bbc78SJeremy L Thompson // Operator fallback 1512d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1513d04bbc78SJeremy L Thompson 15142b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1515d04bbc78SJeremy L Thompson if (op_fallback) { 15162b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request)); 1517eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1518eaf62fffSJeremy L Thompson } 1519eaf62fffSJeremy L Thompson } 1520eaf62fffSJeremy L Thompson // Default interface implementation 15212b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 15222b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request)); 1523d04bbc78SJeremy L Thompson 1524eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1525eaf62fffSJeremy L Thompson } 1526eaf62fffSJeremy L Thompson 1527eaf62fffSJeremy L Thompson /** 1528eaf62fffSJeremy L Thompson @brief Assemble the diagonal of a square linear CeedOperator 1529eaf62fffSJeremy L Thompson 1530eaf62fffSJeremy L Thompson This sums into a CeedVector the diagonal of a linear CeedOperator. 1531eaf62fffSJeremy L Thompson 1532ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1533eaf62fffSJeremy L Thompson 1534ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1535f04ea552SJeremy L Thompson 1536ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1537eaf62fffSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator diagonal 1538ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1539eaf62fffSJeremy L Thompson 1540eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1541eaf62fffSJeremy L Thompson 1542eaf62fffSJeremy L Thompson @ref User 1543eaf62fffSJeremy L Thompson **/ 15442b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1545f3d47e36SJeremy L Thompson bool is_composite; 15462b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1547f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1548eaf62fffSJeremy L Thompson 1549c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 15502b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 15512b730f8bSJeremy L Thompson if (input_size != output_size) { 1552c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1553c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1554c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 15552b730f8bSJeremy L Thompson } 1556c9366a6bSJeremy L Thompson 1557f3d47e36SJeremy L Thompson // Early exit for empty operator 1558f3d47e36SJeremy L Thompson if (!is_composite) { 1559f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1560f3d47e36SJeremy L Thompson 1561f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1562f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1563f3d47e36SJeremy L Thompson } 1564f3d47e36SJeremy L Thompson 1565eaf62fffSJeremy L Thompson if (op->LinearAssembleAddDiagonal) { 1566d04bbc78SJeremy L Thompson // Backend version 15672b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request)); 1568eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1569eaf62fffSJeremy L Thompson } else { 1570d04bbc78SJeremy L Thompson // Operator fallback 1571d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1572d04bbc78SJeremy L Thompson 15732b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1574d04bbc78SJeremy L Thompson if (op_fallback) { 15752b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request)); 1576eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1577eaf62fffSJeremy L Thompson } 1578eaf62fffSJeremy L Thompson } 1579eaf62fffSJeremy L Thompson // Default interface implementation 1580eaf62fffSJeremy L Thompson if (is_composite) { 15812b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled)); 1582eaf62fffSJeremy L Thompson } else { 15832b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled)); 1584eaf62fffSJeremy L Thompson } 1585d04bbc78SJeremy L Thompson 1586d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1587eaf62fffSJeremy L Thompson } 1588eaf62fffSJeremy L Thompson 1589eaf62fffSJeremy L Thompson /** 1590eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1591eaf62fffSJeremy L Thompson 1592ea61e9acSJeremy L Thompson This overwrites a CeedVector with the point block diagonal of a linear CeedOperator. 1593eaf62fffSJeremy L Thompson 1594ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1595eaf62fffSJeremy L Thompson 1596ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1597f04ea552SJeremy L Thompson 1598ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1599ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1600ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1601ea61e9acSJeremy L Thompson component in]. 1602ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1603eaf62fffSJeremy L Thompson 1604eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1605eaf62fffSJeremy L Thompson 1606eaf62fffSJeremy L Thompson @ref User 1607eaf62fffSJeremy L Thompson **/ 16082b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1609f3d47e36SJeremy L Thompson bool is_composite; 16102b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1611f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1612eaf62fffSJeremy L Thompson 1613c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16142b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16152b730f8bSJeremy L Thompson if (input_size != output_size) { 1616c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1617c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1618c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 16192b730f8bSJeremy L Thompson } 1620c9366a6bSJeremy L Thompson 1621f3d47e36SJeremy L Thompson // Early exit for empty operator 1622f3d47e36SJeremy L Thompson if (!is_composite) { 1623f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1624f3d47e36SJeremy L Thompson 1625f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1626f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1627f3d47e36SJeremy L Thompson } 1628f3d47e36SJeremy L Thompson 1629eaf62fffSJeremy L Thompson if (op->LinearAssemblePointBlockDiagonal) { 1630d04bbc78SJeremy L Thompson // Backend version 16312b730f8bSJeremy L Thompson CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request)); 1632eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1633eaf62fffSJeremy L Thompson } else if (op->LinearAssembleAddPointBlockDiagonal) { 1634d04bbc78SJeremy L Thompson // Backend version with zeroing first 16352b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16362b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1637eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1638eaf62fffSJeremy L Thompson } else { 1639d04bbc78SJeremy L Thompson // Operator fallback 1640d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1641d04bbc78SJeremy L Thompson 16422b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1643d04bbc78SJeremy L Thompson if (op_fallback) { 16442b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request)); 1645eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1646eaf62fffSJeremy L Thompson } 1647eaf62fffSJeremy L Thompson } 1648eaf62fffSJeremy L Thompson // Default interface implementation 16492b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(assembled, 0.0)); 16502b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1651d04bbc78SJeremy L Thompson 1652eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1653eaf62fffSJeremy L Thompson } 1654eaf62fffSJeremy L Thompson 1655eaf62fffSJeremy L Thompson /** 1656eaf62fffSJeremy L Thompson @brief Assemble the point block diagonal of a square linear CeedOperator 1657eaf62fffSJeremy L Thompson 1658ea61e9acSJeremy L Thompson This sums into a CeedVector with the point block diagonal of a linear CeedOperator. 1659eaf62fffSJeremy L Thompson 1660ea61e9acSJeremy L Thompson Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported. 1661eaf62fffSJeremy L Thompson 1662ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1663f04ea552SJeremy L Thompson 1664ea61e9acSJeremy L Thompson @param[in] op CeedOperator to assemble CeedQFunction 1665ea61e9acSJeremy L Thompson @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp 1666ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out, 1667ea61e9acSJeremy L Thompson component in]. 1668ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 1669eaf62fffSJeremy L Thompson 1670eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1671eaf62fffSJeremy L Thompson 1672eaf62fffSJeremy L Thompson @ref User 1673eaf62fffSJeremy L Thompson **/ 16742b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) { 1675f3d47e36SJeremy L Thompson bool is_composite; 16762b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1677f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1678eaf62fffSJeremy L Thompson 1679c9366a6bSJeremy L Thompson CeedSize input_size = 0, output_size = 0; 16802b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size)); 16812b730f8bSJeremy L Thompson if (input_size != output_size) { 1682c9366a6bSJeremy L Thompson // LCOV_EXCL_START 1683c9366a6bSJeremy L Thompson return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square"); 1684c9366a6bSJeremy L Thompson // LCOV_EXCL_STOP 16852b730f8bSJeremy L Thompson } 1686c9366a6bSJeremy L Thompson 1687f3d47e36SJeremy L Thompson // Early exit for empty operator 1688f3d47e36SJeremy L Thompson if (!is_composite) { 1689f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1690f3d47e36SJeremy L Thompson 1691f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1692f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1693f3d47e36SJeremy L Thompson } 1694f3d47e36SJeremy L Thompson 1695eaf62fffSJeremy L Thompson if (op->LinearAssembleAddPointBlockDiagonal) { 1696d04bbc78SJeremy L Thompson // Backend version 16972b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request)); 1698eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1699eaf62fffSJeremy L Thompson } else { 1700d04bbc78SJeremy L Thompson // Operator fallback 1701d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1702d04bbc78SJeremy L Thompson 17032b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1704d04bbc78SJeremy L Thompson if (op_fallback) { 17052b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request)); 1706eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1707eaf62fffSJeremy L Thompson } 1708eaf62fffSJeremy L Thompson } 1709ea61e9acSJeremy L Thompson // Default interface implementation 1710eaf62fffSJeremy L Thompson if (is_composite) { 17112b730f8bSJeremy L Thompson CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled)); 1712eaf62fffSJeremy L Thompson } else { 17132b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled)); 1714eaf62fffSJeremy L Thompson } 1715d04bbc78SJeremy L Thompson 1716d04bbc78SJeremy L Thompson return CEED_ERROR_SUCCESS; 1717eaf62fffSJeremy L Thompson } 1718eaf62fffSJeremy L Thompson 1719eaf62fffSJeremy L Thompson /** 1720eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero pattern of a linear operator. 1721eaf62fffSJeremy L Thompson 1722ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssemble(). 1723eaf62fffSJeremy L Thompson 1724ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1725ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the number of entries and their (i, j) 1726ea61e9acSJeremy L Thompson locations, while CeedOperatorLinearAssemble() provides the values in the same ordering. 1727eaf62fffSJeremy L Thompson 1728eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1729eaf62fffSJeremy L Thompson 1730ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1731f04ea552SJeremy L Thompson 1732eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1733eaf62fffSJeremy L Thompson @param[out] num_entries Number of entries in coordinate nonzero pattern 1734eaf62fffSJeremy L Thompson @param[out] rows Row number for each entry 1735eaf62fffSJeremy L Thompson @param[out] cols Column number for each entry 1736eaf62fffSJeremy L Thompson 1737eaf62fffSJeremy L Thompson @ref User 1738eaf62fffSJeremy L Thompson **/ 17392b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) { 1740eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries; 1741eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1742eaf62fffSJeremy L Thompson bool is_composite; 17432b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1744f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1745eaf62fffSJeremy L Thompson 1746eaf62fffSJeremy L Thompson if (op->LinearAssembleSymbolic) { 1747d04bbc78SJeremy L Thompson // Backend version 17482b730f8bSJeremy L Thompson CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols)); 1749eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1750eaf62fffSJeremy L Thompson } else { 1751d04bbc78SJeremy L Thompson // Operator fallback 1752d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1753d04bbc78SJeremy L Thompson 17542b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1755d04bbc78SJeremy L Thompson if (op_fallback) { 17562b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols)); 1757eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1758eaf62fffSJeremy L Thompson } 1759eaf62fffSJeremy L Thompson } 1760eaf62fffSJeremy L Thompson 1761eaf62fffSJeremy L Thompson // Default interface implementation 1762eaf62fffSJeremy L Thompson 1763eaf62fffSJeremy L Thompson // count entries and allocate rows, cols arrays 1764eaf62fffSJeremy L Thompson *num_entries = 0; 1765eaf62fffSJeremy L Thompson if (is_composite) { 1766c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1767c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 176892ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 17692b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1770eaf62fffSJeremy L Thompson *num_entries += single_entries; 1771eaf62fffSJeremy L Thompson } 1772eaf62fffSJeremy L Thompson } else { 17732b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries)); 1774eaf62fffSJeremy L Thompson *num_entries += single_entries; 1775eaf62fffSJeremy L Thompson } 17762b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, rows)); 17772b730f8bSJeremy L Thompson CeedCall(CeedCalloc(*num_entries, cols)); 1778eaf62fffSJeremy L Thompson 1779eaf62fffSJeremy L Thompson // assemble nonzero locations 1780eaf62fffSJeremy L Thompson CeedInt offset = 0; 1781eaf62fffSJeremy L Thompson if (is_composite) { 1782c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1783c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 178492ae7e47SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; ++k) { 17852b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols)); 17862b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1787eaf62fffSJeremy L Thompson offset += single_entries; 1788eaf62fffSJeremy L Thompson } 1789eaf62fffSJeremy L Thompson } else { 17902b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols)); 1791eaf62fffSJeremy L Thompson } 1792eaf62fffSJeremy L Thompson 1793eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1794eaf62fffSJeremy L Thompson } 1795eaf62fffSJeremy L Thompson 1796eaf62fffSJeremy L Thompson /** 1797eaf62fffSJeremy L Thompson @brief Fully assemble the nonzero entries of a linear operator. 1798eaf62fffSJeremy L Thompson 1799ea61e9acSJeremy L Thompson Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic(). 1800eaf62fffSJeremy L Thompson 1801ea61e9acSJeremy L Thompson The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the 1802ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the values of the nonzero entries to be added, 1803ea61e9acSJeremy L Thompson their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic() 1804eaf62fffSJeremy L Thompson 1805eaf62fffSJeremy L Thompson This will generally be slow unless your operator is low-order. 1806eaf62fffSJeremy L Thompson 1807ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 1808f04ea552SJeremy L Thompson 1809eaf62fffSJeremy L Thompson @param[in] op CeedOperator to assemble 1810eaf62fffSJeremy L Thompson @param[out] values Values to assemble into matrix 1811eaf62fffSJeremy L Thompson 1812eaf62fffSJeremy L Thompson @ref User 1813eaf62fffSJeremy L Thompson **/ 1814eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) { 1815eaf62fffSJeremy L Thompson CeedInt num_suboperators, single_entries = 0; 1816eaf62fffSJeremy L Thompson CeedOperator *sub_operators; 1817f3d47e36SJeremy L Thompson bool is_composite; 18182b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 1819f3d47e36SJeremy L Thompson CeedCall(CeedOperatorIsComposite(op, &is_composite)); 1820f3d47e36SJeremy L Thompson 1821f3d47e36SJeremy L Thompson // Early exit for empty operator 1822f3d47e36SJeremy L Thompson if (!is_composite) { 1823f3d47e36SJeremy L Thompson CeedInt num_elem = 0; 1824f3d47e36SJeremy L Thompson 1825f3d47e36SJeremy L Thompson CeedCall(CeedOperatorGetNumElements(op, &num_elem)); 1826f3d47e36SJeremy L Thompson if (num_elem == 0) return CEED_ERROR_SUCCESS; 1827f3d47e36SJeremy L Thompson } 1828eaf62fffSJeremy L Thompson 1829eaf62fffSJeremy L Thompson if (op->LinearAssemble) { 1830d04bbc78SJeremy L Thompson // Backend version 18312b730f8bSJeremy L Thompson CeedCall(op->LinearAssemble(op, values)); 1832eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1833eaf62fffSJeremy L Thompson } else { 1834d04bbc78SJeremy L Thompson // Operator fallback 1835d04bbc78SJeremy L Thompson CeedOperator op_fallback; 1836d04bbc78SJeremy L Thompson 18372b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 1838d04bbc78SJeremy L Thompson if (op_fallback) { 18392b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssemble(op_fallback, values)); 1840eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1841eaf62fffSJeremy L Thompson } 1842eaf62fffSJeremy L Thompson } 1843eaf62fffSJeremy L Thompson 1844eaf62fffSJeremy L Thompson // Default interface implementation 1845eaf62fffSJeremy L Thompson CeedInt offset = 0; 1846eaf62fffSJeremy L Thompson if (is_composite) { 1847c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1848c6ebc35dSJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1849cefa2673SJeremy L Thompson for (CeedInt k = 0; k < num_suboperators; k++) { 18502b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values)); 18512b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries)); 1852eaf62fffSJeremy L Thompson offset += single_entries; 1853eaf62fffSJeremy L Thompson } 1854eaf62fffSJeremy L Thompson } else { 18552b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorAssemble(op, offset, values)); 1856eaf62fffSJeremy L Thompson } 1857eaf62fffSJeremy L Thompson 1858eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1859eaf62fffSJeremy L Thompson } 1860eaf62fffSJeremy L Thompson 1861eaf62fffSJeremy L Thompson /** 186275f0d5a4SJeremy L Thompson @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator 186375f0d5a4SJeremy L Thompson 186475f0d5a4SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 186575f0d5a4SJeremy L Thompson 186675f0d5a4SJeremy L Thompson @param[in] op Composite CeedOperator 186775f0d5a4SJeremy L Thompson @param[in] num_skip_indices Number of suboperators to skip 186875f0d5a4SJeremy L Thompson @param[in] skip_indices Array of indices of suboperators to skip 186975f0d5a4SJeremy L Thompson @param[out] mult Vector to store multiplicity (of size l_size) 187075f0d5a4SJeremy L Thompson 187175f0d5a4SJeremy L Thompson @return An error code: 0 - success, otherwise - failure 187275f0d5a4SJeremy L Thompson 187375f0d5a4SJeremy L Thompson @ref User 187475f0d5a4SJeremy L Thompson **/ 187575f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) { 187675f0d5a4SJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 187775f0d5a4SJeremy L Thompson 187875f0d5a4SJeremy L Thompson Ceed ceed; 1879b275c451SJeremy L Thompson CeedInt num_suboperators; 188075f0d5a4SJeremy L Thompson CeedSize l_vec_len; 188175f0d5a4SJeremy L Thompson CeedScalar *mult_array; 188275f0d5a4SJeremy L Thompson CeedVector ones_l_vec; 188375f0d5a4SJeremy L Thompson CeedElemRestriction elem_restr; 1884b275c451SJeremy L Thompson CeedOperator *sub_operators; 188575f0d5a4SJeremy L Thompson 188675f0d5a4SJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 188775f0d5a4SJeremy L Thompson 188875f0d5a4SJeremy L Thompson // Zero mult vector 188975f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(mult, 0.0)); 189075f0d5a4SJeremy L Thompson 189175f0d5a4SJeremy L Thompson // Get suboperators 1892b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators)); 1893b275c451SJeremy L Thompson CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators)); 1894b275c451SJeremy L Thompson if (num_suboperators == 0) return CEED_ERROR_SUCCESS; 189575f0d5a4SJeremy L Thompson 189675f0d5a4SJeremy L Thompson // Work vector 189775f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetLength(mult, &l_vec_len)); 189875f0d5a4SJeremy L Thompson CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec)); 189975f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(ones_l_vec, 1.0)); 190075f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array)); 190175f0d5a4SJeremy L Thompson 190275f0d5a4SJeremy L Thompson // Compute multiplicity across suboperators 1903b275c451SJeremy L Thompson for (CeedInt i = 0; i < num_suboperators; i++) { 190475f0d5a4SJeremy L Thompson const CeedScalar *sub_mult_array; 190575f0d5a4SJeremy L Thompson CeedVector sub_mult_l_vec, ones_e_vec; 190675f0d5a4SJeremy L Thompson 190775f0d5a4SJeremy L Thompson // -- Check for suboperator to skip 190875f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < num_skip_indices; j++) { 190975f0d5a4SJeremy L Thompson if (skip_indices[j] == i) continue; 191075f0d5a4SJeremy L Thompson } 191175f0d5a4SJeremy L Thompson 191275f0d5a4SJeremy L Thompson // -- Sub operator multiplicity 1913b275c451SJeremy L Thompson CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_restr)); 191475f0d5a4SJeremy L Thompson CeedCall(CeedElemRestrictionCreateVector(elem_restr, &sub_mult_l_vec, &ones_e_vec)); 191575f0d5a4SJeremy L Thompson CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0)); 191675f0d5a4SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_restr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE)); 191775f0d5a4SJeremy L Thompson CeedCall(CeedElemRestrictionApply(elem_restr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE)); 191875f0d5a4SJeremy L Thompson CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array)); 191975f0d5a4SJeremy L Thompson // ---- Flag every node present in the current suboperator 192075f0d5a4SJeremy L Thompson for (CeedInt j = 0; j < l_vec_len; j++) { 192175f0d5a4SJeremy L Thompson if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0; 192275f0d5a4SJeremy L Thompson } 192375f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array)); 192475f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&sub_mult_l_vec)); 192575f0d5a4SJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_e_vec)); 192675f0d5a4SJeremy L Thompson } 192775f0d5a4SJeremy L Thompson CeedCall(CeedVectorRestoreArray(mult, &mult_array)); 1928811d0ccfSJeremy L Thompson CeedCall(CeedVectorDestroy(&ones_l_vec)); 192975f0d5a4SJeremy L Thompson 193075f0d5a4SJeremy L Thompson return CEED_ERROR_SUCCESS; 193175f0d5a4SJeremy L Thompson } 193275f0d5a4SJeremy L Thompson 193375f0d5a4SJeremy L Thompson /** 1934ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse 1935ea61e9acSJeremy L Thompson grid interpolation 1936eaf62fffSJeremy L Thompson 193758e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 1938f04ea552SJeremy L Thompson 1939eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 1940*85bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 1941eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 1942eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 1943eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 1944*85bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 1945*85bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 1946eaf62fffSJeremy L Thompson 1947eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1948eaf62fffSJeremy L Thompson 1949eaf62fffSJeremy L Thompson @ref User 1950eaf62fffSJeremy L Thompson **/ 19512b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 19522b730f8bSJeremy L Thompson CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) { 19532b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 1954eaf62fffSJeremy L Thompson 195583d6adf3SZach Atkins // Build prolongation matrix, if required 195683d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 195783d6adf3SZach Atkins if (op_prolong || op_restrict) { 195883d6adf3SZach Atkins CeedBasis basis_fine; 19592b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 19602b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f)); 196183d6adf3SZach Atkins } 1962eaf62fffSJeremy L Thompson 1963f113e5dcSJeremy L Thompson // Core code 19642b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 1965f113e5dcSJeremy L Thompson 1966eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 1967eaf62fffSJeremy L Thompson } 1968eaf62fffSJeremy L Thompson 1969eaf62fffSJeremy L Thompson /** 1970ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis 1971eaf62fffSJeremy L Thompson 197258e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 1973f04ea552SJeremy L Thompson 1974eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 1975*85bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 1976eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 1977eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 1978*85bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 1979eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 1980*85bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 1981*85bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 1982eaf62fffSJeremy L Thompson 1983eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 1984eaf62fffSJeremy L Thompson 1985eaf62fffSJeremy L Thompson @ref User 1986eaf62fffSJeremy L Thompson **/ 19872b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 19882b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 19892b730f8bSJeremy L Thompson CeedOperator *op_restrict) { 19902b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 1991eaf62fffSJeremy L Thompson Ceed ceed; 19922b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 1993eaf62fffSJeremy L Thompson 1994eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 1995eaf62fffSJeremy L Thompson CeedBasis basis_fine; 19962b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 1997eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 19982b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 19992b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 20002b730f8bSJeremy L Thompson if (Q_f != Q_c) { 2001eaf62fffSJeremy L Thompson // LCOV_EXCL_START 20022b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2003eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 20042b730f8bSJeremy L Thompson } 2005eaf62fffSJeremy L Thompson 200683d6adf3SZach Atkins // Create coarse to fine basis, if required 200783d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 200883d6adf3SZach Atkins if (op_prolong || op_restrict) { 200983d6adf3SZach Atkins // Check if interpolation matrix is provided 201083d6adf3SZach Atkins if (!interp_c_to_f) { 201183d6adf3SZach Atkins // LCOV_EXCL_START 201283d6adf3SZach Atkins return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 201383d6adf3SZach Atkins // LCOV_EXCL_STOP 201483d6adf3SZach Atkins } 2015eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c; 20162b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 20172b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 20182b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f)); 20192b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 20202b730f8bSJeremy L Thompson P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c); 2021eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 20222b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_ref)); 20232b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f, &q_weight)); 20242b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad)); 20252b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 20262b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 20272b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 20282b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 202983d6adf3SZach Atkins } 2030eaf62fffSJeremy L Thompson 2031eaf62fffSJeremy L Thompson // Core code 20322b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2033eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2034eaf62fffSJeremy L Thompson } 2035eaf62fffSJeremy L Thompson 2036eaf62fffSJeremy L Thompson /** 2037ea61e9acSJeremy L Thompson @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector 2038eaf62fffSJeremy L Thompson 203958e4b056SJeremy L Thompson Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable. 2040f04ea552SJeremy L Thompson 2041eaf62fffSJeremy L Thompson @param[in] op_fine Fine grid operator 2042*85bb9dcfSJeremy L Thompson @param[in] p_mult_fine L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators 2043eaf62fffSJeremy L Thompson @param[in] rstr_coarse Coarse grid restriction 2044eaf62fffSJeremy L Thompson @param[in] basis_coarse Coarse grid active vector basis 2045*85bb9dcfSJeremy L Thompson @param[in] interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators 2046eaf62fffSJeremy L Thompson @param[out] op_coarse Coarse grid operator 2047*85bb9dcfSJeremy L Thompson @param[out] op_prolong Coarse to fine operator, or NULL 2048*85bb9dcfSJeremy L Thompson @param[out] op_restrict Fine to coarse operator, or NULL 2049eaf62fffSJeremy L Thompson 2050eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2051eaf62fffSJeremy L Thompson 2052eaf62fffSJeremy L Thompson @ref User 2053eaf62fffSJeremy L Thompson **/ 20542b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse, 20552b730f8bSJeremy L Thompson const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, 2056eaf62fffSJeremy L Thompson CeedOperator *op_restrict) { 20572b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op_fine)); 2058eaf62fffSJeremy L Thompson Ceed ceed; 20592b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op_fine, &ceed)); 2060eaf62fffSJeremy L Thompson 2061eaf62fffSJeremy L Thompson // Check for compatible quadrature spaces 2062eaf62fffSJeremy L Thompson CeedBasis basis_fine; 20632b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine)); 2064eaf62fffSJeremy L Thompson CeedInt Q_f, Q_c; 20652b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f)); 20662b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c)); 20672b730f8bSJeremy L Thompson if (Q_f != Q_c) { 2068eaf62fffSJeremy L Thompson // LCOV_EXCL_START 20692b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces"); 2070eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 20712b730f8bSJeremy L Thompson } 2072eaf62fffSJeremy L Thompson 2073eaf62fffSJeremy L Thompson // Coarse to fine basis 207483d6adf3SZach Atkins CeedBasis basis_c_to_f = NULL; 207583d6adf3SZach Atkins if (op_prolong || op_restrict) { 207683d6adf3SZach Atkins // Check if interpolation matrix is provided 207783d6adf3SZach Atkins if (!interp_c_to_f) { 207883d6adf3SZach Atkins // LCOV_EXCL_START 207983d6adf3SZach Atkins return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix"); 208083d6adf3SZach Atkins // LCOV_EXCL_STOP 208183d6adf3SZach Atkins } 2082eaf62fffSJeremy L Thompson CeedElemTopology topo; 20832b730f8bSJeremy L Thompson CeedCall(CeedBasisGetTopology(basis_fine, &topo)); 2084eaf62fffSJeremy L Thompson CeedInt dim, num_comp, num_nodes_c, num_nodes_f; 20852b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis_fine, &dim)); 20862b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp)); 20872b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f)); 20882b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c)); 2089eaf62fffSJeremy L Thompson CeedScalar *q_ref, *q_weight, *grad; 20902b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref)); 20912b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f, &q_weight)); 20922b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad)); 20932b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f)); 20942b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref)); 20952b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight)); 20962b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad)); 209783d6adf3SZach Atkins } 2098eaf62fffSJeremy L Thompson 2099eaf62fffSJeremy L Thompson // Core code 21002b730f8bSJeremy L Thompson CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict)); 2101eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2102eaf62fffSJeremy L Thompson } 2103eaf62fffSJeremy L Thompson 2104eaf62fffSJeremy L Thompson /** 2105ea61e9acSJeremy L Thompson @brief Build a FDM based approximate inverse for each element for a CeedOperator 2106eaf62fffSJeremy L Thompson 2107ea61e9acSJeremy L Thompson This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse. 2108ea61e9acSJeremy L Thompson This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, M = V^T V, K = V^T S V. 2109ea61e9acSJeremy L Thompson The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form V^T 2110ea61e9acSJeremy L Thompson S^hat V. The CeedOperator must be linear and non-composite. The associated CeedQFunction must therefore also be linear. 2111eaf62fffSJeremy L Thompson 2112ea61e9acSJeremy L Thompson Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable. 2113f04ea552SJeremy L Thompson 2114ea61e9acSJeremy L Thompson @param[in] op CeedOperator to create element inverses 2115ea61e9acSJeremy L Thompson @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element 2116ea61e9acSJeremy L Thompson @param[in] request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE 2117eaf62fffSJeremy L Thompson 2118eaf62fffSJeremy L Thompson @return An error code: 0 - success, otherwise - failure 2119eaf62fffSJeremy L Thompson 2120480fae85SJeremy L Thompson @ref User 2121eaf62fffSJeremy L Thompson **/ 21222b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) { 21232b730f8bSJeremy L Thompson CeedCall(CeedOperatorCheckReady(op)); 2124eaf62fffSJeremy L Thompson 2125eaf62fffSJeremy L Thompson if (op->CreateFDMElementInverse) { 2126d04bbc78SJeremy L Thompson // Backend version 21272b730f8bSJeremy L Thompson CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request)); 2128eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2129eaf62fffSJeremy L Thompson } else { 2130d04bbc78SJeremy L Thompson // Operator fallback 2131d04bbc78SJeremy L Thompson CeedOperator op_fallback; 2132d04bbc78SJeremy L Thompson 21332b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFallback(op, &op_fallback)); 2134d04bbc78SJeremy L Thompson if (op_fallback) { 21352b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request)); 2136eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2137eaf62fffSJeremy L Thompson } 2138eaf62fffSJeremy L Thompson } 2139eaf62fffSJeremy L Thompson 2140d04bbc78SJeremy L Thompson // Default interface implementation 2141eaf62fffSJeremy L Thompson Ceed ceed, ceed_parent; 21422b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetCeed(op, &ceed)); 21432b730f8bSJeremy L Thompson CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent)); 2144eaf62fffSJeremy L Thompson ceed_parent = ceed_parent ? ceed_parent : ceed; 2145eaf62fffSJeremy L Thompson CeedQFunction qf; 21462b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetQFunction(op, &qf)); 2147eaf62fffSJeremy L Thompson 2148eaf62fffSJeremy L Thompson // Determine active input basis 2149eaf62fffSJeremy L Thompson bool interp = false, grad = false; 2150eaf62fffSJeremy L Thompson CeedBasis basis = NULL; 2151eaf62fffSJeremy L Thompson CeedElemRestriction rstr = NULL; 2152eaf62fffSJeremy L Thompson CeedOperatorField *op_fields; 2153eaf62fffSJeremy L Thompson CeedQFunctionField *qf_fields; 2154eaf62fffSJeremy L Thompson CeedInt num_input_fields; 21552b730f8bSJeremy L Thompson CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL)); 21562b730f8bSJeremy L Thompson CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL)); 2157eaf62fffSJeremy L Thompson for (CeedInt i = 0; i < num_input_fields; i++) { 2158eaf62fffSJeremy L Thompson CeedVector vec; 21592b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec)); 2160eaf62fffSJeremy L Thompson if (vec == CEED_VECTOR_ACTIVE) { 2161eaf62fffSJeremy L Thompson CeedEvalMode eval_mode; 21622b730f8bSJeremy L Thompson CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode)); 2163eaf62fffSJeremy L Thompson interp = interp || eval_mode == CEED_EVAL_INTERP; 2164eaf62fffSJeremy L Thompson grad = grad || eval_mode == CEED_EVAL_GRAD; 21652b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis)); 21662b730f8bSJeremy L Thompson CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr)); 2167eaf62fffSJeremy L Thompson } 2168eaf62fffSJeremy L Thompson } 21692b730f8bSJeremy L Thompson if (!basis) { 2170eaf62fffSJeremy L Thompson // LCOV_EXCL_START 2171eaf62fffSJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "No active field set"); 2172eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 21732b730f8bSJeremy L Thompson } 2174e79b91d9SJeremy L Thompson CeedSize l_size = 1; 2175e79b91d9SJeremy L Thompson CeedInt P_1d, Q_1d, elem_size, num_qpts, dim, num_comp = 1, num_elem = 1; 21762b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d)); 21772b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumNodes(basis, &elem_size)); 21782b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d)); 21792b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts)); 21802b730f8bSJeremy L Thompson CeedCall(CeedBasisGetDimension(basis, &dim)); 21812b730f8bSJeremy L Thompson CeedCall(CeedBasisGetNumComponents(basis, &num_comp)); 21822b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem)); 21832b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size)); 2184eaf62fffSJeremy L Thompson 2185eaf62fffSJeremy L Thompson // Build and diagonalize 1D Mass and Laplacian 2186eaf62fffSJeremy L Thompson bool tensor_basis; 21872b730f8bSJeremy L Thompson CeedCall(CeedBasisIsTensor(basis, &tensor_basis)); 21882b730f8bSJeremy L Thompson if (!tensor_basis) { 2189eaf62fffSJeremy L Thompson // LCOV_EXCL_START 21902b730f8bSJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases"); 2191eaf62fffSJeremy L Thompson // LCOV_EXCL_STOP 21922b730f8bSJeremy L Thompson } 2193eaf62fffSJeremy L Thompson CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda; 21942b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &mass)); 21952b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &laplace)); 21962b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &x)); 21972b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp)); 21982b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &lambda)); 2199eaf62fffSJeremy L Thompson // -- Build matrices 2200eaf62fffSJeremy L Thompson const CeedScalar *interp_1d, *grad_1d, *q_weight_1d; 22012b730f8bSJeremy L Thompson CeedCall(CeedBasisGetInterp1D(basis, &interp_1d)); 22022b730f8bSJeremy L Thompson CeedCall(CeedBasisGetGrad1D(basis, &grad_1d)); 22032b730f8bSJeremy L Thompson CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d)); 22042b730f8bSJeremy L Thompson CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace)); 2205eaf62fffSJeremy L Thompson 2206eaf62fffSJeremy L Thompson // -- Diagonalize 22072b730f8bSJeremy L Thompson CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d)); 22082b730f8bSJeremy L Thompson CeedCall(CeedFree(&mass)); 22092b730f8bSJeremy L Thompson CeedCall(CeedFree(&laplace)); 22102b730f8bSJeremy L Thompson for (CeedInt i = 0; i < P_1d; i++) { 22112b730f8bSJeremy L Thompson for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d]; 22122b730f8bSJeremy L Thompson } 22132b730f8bSJeremy L Thompson CeedCall(CeedFree(&x)); 2214eaf62fffSJeremy L Thompson 2215eaf62fffSJeremy L Thompson // Assemble QFunction 2216eaf62fffSJeremy L Thompson CeedVector assembled; 2217eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qf; 22182b730f8bSJeremy L Thompson CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request)); 2219eaf62fffSJeremy L Thompson CeedInt layout[3]; 22202b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout)); 22212b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qf)); 2222eaf62fffSJeremy L Thompson CeedScalar max_norm = 0; 22232b730f8bSJeremy L Thompson CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm)); 2224eaf62fffSJeremy L Thompson 2225eaf62fffSJeremy L Thompson // Calculate element averages 2226eaf62fffSJeremy L Thompson CeedInt num_modes = (interp ? 1 : 0) + (grad ? dim : 0); 2227eaf62fffSJeremy L Thompson CeedScalar *elem_avg; 2228eaf62fffSJeremy L Thompson const CeedScalar *assembled_array, *q_weight_array; 2229eaf62fffSJeremy L Thompson CeedVector q_weight; 22302b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight)); 22312b730f8bSJeremy L Thompson CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight)); 22322b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array)); 22332b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array)); 22342b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_elem, &elem_avg)); 2235eaf62fffSJeremy L Thompson const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON; 2236eaf62fffSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 2237eaf62fffSJeremy L Thompson CeedInt count = 0; 22382b730f8bSJeremy L Thompson for (CeedInt q = 0; q < num_qpts; q++) { 22392b730f8bSJeremy L Thompson for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) { 22402b730f8bSJeremy L Thompson if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) { 22412b730f8bSJeremy L Thompson elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q]; 2242eaf62fffSJeremy L Thompson count++; 2243eaf62fffSJeremy L Thompson } 22442b730f8bSJeremy L Thompson } 22452b730f8bSJeremy L Thompson } 2246eaf62fffSJeremy L Thompson if (count) { 2247eaf62fffSJeremy L Thompson elem_avg[e] /= count; 2248eaf62fffSJeremy L Thompson } else { 2249eaf62fffSJeremy L Thompson elem_avg[e] = 1.0; 2250eaf62fffSJeremy L Thompson } 2251eaf62fffSJeremy L Thompson } 22522b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array)); 22532b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&assembled)); 22542b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array)); 22552b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_weight)); 2256eaf62fffSJeremy L Thompson 2257eaf62fffSJeremy L Thompson // Build FDM diagonal 2258eaf62fffSJeremy L Thompson CeedVector q_data; 2259eaf62fffSJeremy L Thompson CeedScalar *q_data_array, *fdm_diagonal; 22602b730f8bSJeremy L Thompson CeedCall(CeedCalloc(num_comp * elem_size, &fdm_diagonal)); 2261eaf62fffSJeremy L Thompson const CeedScalar fdm_diagonal_bound = elem_size * CEED_EPSILON; 22622b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 2263eaf62fffSJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) { 22642b730f8bSJeremy L Thompson if (interp) fdm_diagonal[c * elem_size + n] = 1.0; 22652b730f8bSJeremy L Thompson if (grad) { 2266eaf62fffSJeremy L Thompson for (CeedInt d = 0; d < dim; d++) { 2267eaf62fffSJeremy L Thompson CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d; 2268eaf62fffSJeremy L Thompson fdm_diagonal[c * elem_size + n] += lambda[i]; 2269eaf62fffSJeremy L Thompson } 2270eaf62fffSJeremy L Thompson } 22712b730f8bSJeremy L Thompson if (fabs(fdm_diagonal[c * elem_size + n]) < fdm_diagonal_bound) fdm_diagonal[c * elem_size + n] = fdm_diagonal_bound; 22722b730f8bSJeremy L Thompson } 22732b730f8bSJeremy L Thompson } 22742b730f8bSJeremy L Thompson CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * elem_size, &q_data)); 22752b730f8bSJeremy L Thompson CeedCall(CeedVectorSetValue(q_data, 0.0)); 22762b730f8bSJeremy L Thompson CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array)); 22772b730f8bSJeremy L Thompson for (CeedInt e = 0; e < num_elem; e++) { 22782b730f8bSJeremy L Thompson for (CeedInt c = 0; c < num_comp; c++) { 22792b730f8bSJeremy L Thompson for (CeedInt n = 0; n < elem_size; n++) q_data_array[(e * num_comp + c) * elem_size + n] = 1. / (elem_avg[e] * fdm_diagonal[c * elem_size + n]); 22802b730f8bSJeremy L Thompson } 22812b730f8bSJeremy L Thompson } 22822b730f8bSJeremy L Thompson CeedCall(CeedFree(&elem_avg)); 22832b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_diagonal)); 22842b730f8bSJeremy L Thompson CeedCall(CeedVectorRestoreArray(q_data, &q_data_array)); 2285eaf62fffSJeremy L Thompson 2286eaf62fffSJeremy L Thompson // Setup FDM operator 2287eaf62fffSJeremy L Thompson // -- Basis 2288eaf62fffSJeremy L Thompson CeedBasis fdm_basis; 2289eaf62fffSJeremy L Thompson CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy; 22902b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy)); 22912b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_ref_dummy)); 22922b730f8bSJeremy L Thompson CeedCall(CeedCalloc(P_1d, &q_weight_dummy)); 22932b730f8bSJeremy L Thompson CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis)); 22942b730f8bSJeremy L Thompson CeedCall(CeedFree(&fdm_interp)); 22952b730f8bSJeremy L Thompson CeedCall(CeedFree(&grad_dummy)); 22962b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_ref_dummy)); 22972b730f8bSJeremy L Thompson CeedCall(CeedFree(&q_weight_dummy)); 22982b730f8bSJeremy L Thompson CeedCall(CeedFree(&lambda)); 2299eaf62fffSJeremy L Thompson 2300eaf62fffSJeremy L Thompson // -- Restriction 2301eaf62fffSJeremy L Thompson CeedElemRestriction rstr_qd_i; 2302eaf62fffSJeremy L Thompson CeedInt strides[3] = {1, elem_size, elem_size * num_comp}; 23032b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, elem_size, num_comp, num_elem * num_comp * elem_size, strides, &rstr_qd_i)); 2304eaf62fffSJeremy L Thompson // -- QFunction 2305eaf62fffSJeremy L Thompson CeedQFunction qf_fdm; 23062b730f8bSJeremy L Thompson CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm)); 23072b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP)); 23082b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE)); 23092b730f8bSJeremy L Thompson CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP)); 23102b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp)); 2311eaf62fffSJeremy L Thompson // -- QFunction context 2312eaf62fffSJeremy L Thompson CeedInt *num_comp_data; 23132b730f8bSJeremy L Thompson CeedCall(CeedCalloc(1, &num_comp_data)); 2314eaf62fffSJeremy L Thompson num_comp_data[0] = num_comp; 2315eaf62fffSJeremy L Thompson CeedQFunctionContext ctx_fdm; 23162b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm)); 23172b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data)); 23182b730f8bSJeremy L Thompson CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm)); 23192b730f8bSJeremy L Thompson CeedCall(CeedQFunctionContextDestroy(&ctx_fdm)); 2320eaf62fffSJeremy L Thompson // -- Operator 23212b730f8bSJeremy L Thompson CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv)); 23222b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 23232b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data)); 23242b730f8bSJeremy L Thompson CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE)); 2325eaf62fffSJeremy L Thompson 2326eaf62fffSJeremy L Thompson // Cleanup 23272b730f8bSJeremy L Thompson CeedCall(CeedVectorDestroy(&q_data)); 23282b730f8bSJeremy L Thompson CeedCall(CeedBasisDestroy(&fdm_basis)); 23292b730f8bSJeremy L Thompson CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i)); 23302b730f8bSJeremy L Thompson CeedCall(CeedQFunctionDestroy(&qf_fdm)); 2331eaf62fffSJeremy L Thompson 2332eaf62fffSJeremy L Thompson return CEED_ERROR_SUCCESS; 2333eaf62fffSJeremy L Thompson } 2334eaf62fffSJeremy L Thompson 2335eaf62fffSJeremy L Thompson /// @} 2336