xref: /libCEED/rust/libceed-sys/c-src/interface/ceed-preconditioning.c (revision e984cf9ab7e61f88276fc03d915be3267ae350fc)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3eaf62fffSJeremy L Thompson //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5eaf62fffSJeremy L Thompson //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7eaf62fffSJeremy L Thompson 
82b730f8bSJeremy L Thompson #include <ceed-impl.h>
949aac155SJeremy L Thompson #include <ceed.h>
102b730f8bSJeremy L Thompson #include <ceed/backend.h>
11c85e8640SSebastian Grimberg #include <assert.h>
122b730f8bSJeremy L Thompson #include <math.h>
13eaf62fffSJeremy L Thompson #include <stdbool.h>
14eaf62fffSJeremy L Thompson #include <stdio.h>
15eaf62fffSJeremy L Thompson #include <string.h>
16eaf62fffSJeremy L Thompson 
17eaf62fffSJeremy L Thompson /// @file
18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces
19eaf62fffSJeremy L Thompson 
20eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions
22eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper
24eaf62fffSJeremy L Thompson /// @{
25eaf62fffSJeremy L Thompson 
26eaf62fffSJeremy L Thompson /**
27ea61e9acSJeremy L Thompson   @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality
289e77b9c8SJeremy L Thompson 
2901ea9c81SJed Brown   @param[in]  fallback_ceed Ceed on which to create fallback CeedQFunction
309e77b9c8SJeremy L Thompson   @param[in]  qf            CeedQFunction to create fallback for
3101ea9c81SJed Brown   @param[out] qf_fallback   fallback CeedQFunction
329e77b9c8SJeremy L Thompson 
339e77b9c8SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
349e77b9c8SJeremy L Thompson 
359e77b9c8SJeremy L Thompson   @ref Developer
369e77b9c8SJeremy L Thompson **/
372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) {
381c66c397SJeremy L Thompson   char *source_path_with_name = NULL;
391c66c397SJeremy L Thompson 
409e77b9c8SJeremy L Thompson   // Check if NULL qf passed in
419e77b9c8SJeremy L Thompson   if (!qf) return CEED_ERROR_SUCCESS;
429e77b9c8SJeremy L Thompson 
43d04bbc78SJeremy L Thompson   CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n");
4413f886e9SJeremy L Thompson   CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n");
45d04bbc78SJeremy L Thompson 
469e77b9c8SJeremy L Thompson   if (qf->source_path) {
472b730f8bSJeremy L Thompson     size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name);
482b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name));
499e77b9c8SJeremy L Thompson     memcpy(source_path_with_name, qf->source_path, path_len);
509e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len], ":", 1);
519e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len);
529e77b9c8SJeremy L Thompson   } else {
532b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &source_path_with_name));
549e77b9c8SJeremy L Thompson   }
559e77b9c8SJeremy L Thompson 
562b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback));
579e77b9c8SJeremy L Thompson   {
589e77b9c8SJeremy L Thompson     CeedQFunctionContext ctx;
599e77b9c8SJeremy L Thompson 
602b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionGetContext(qf, &ctx));
612b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx));
629e77b9c8SJeremy L Thompson   }
639e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_input_fields; i++) {
642b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode));
659e77b9c8SJeremy L Thompson   }
669e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_output_fields; i++) {
672b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode));
689e77b9c8SJeremy L Thompson   }
692b730f8bSJeremy L Thompson   CeedCall(CeedFree(&source_path_with_name));
709e77b9c8SJeremy L Thompson   return CEED_ERROR_SUCCESS;
719e77b9c8SJeremy L Thompson }
729e77b9c8SJeremy L Thompson 
739e77b9c8SJeremy L Thompson /**
74ea61e9acSJeremy L Thompson   @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality
75eaf62fffSJeremy L Thompson 
76ea61e9acSJeremy L Thompson   @param[in,out] op CeedOperator to create fallback for
77eaf62fffSJeremy L Thompson 
78eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
79eaf62fffSJeremy L Thompson 
80eaf62fffSJeremy L Thompson   @ref Developer
81eaf62fffSJeremy L Thompson **/
82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) {
839e77b9c8SJeremy L Thompson   Ceed         ceed_fallback;
841c66c397SJeremy L Thompson   bool         is_composite;
851c66c397SJeremy L Thompson   CeedOperator op_fallback;
86eaf62fffSJeremy L Thompson 
87805fe78eSJeremy L Thompson   // Check not already created
88805fe78eSJeremy L Thompson   if (op->op_fallback) return CEED_ERROR_SUCCESS;
89805fe78eSJeremy L Thompson 
90eaf62fffSJeremy L Thompson   // Fallback Ceed
912b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
92d04bbc78SJeremy L Thompson   if (!ceed_fallback) return CEED_ERROR_SUCCESS;
93d04bbc78SJeremy L Thompson 
94d04bbc78SJeremy L Thompson   CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
9513f886e9SJeremy L Thompson   CeedDebug(op->ceed, "Creating fallback CeedOperator\n");
96eaf62fffSJeremy L Thompson 
97eaf62fffSJeremy L Thompson   // Clone Op
98b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
99b275c451SJeremy L Thompson   if (is_composite) {
100b275c451SJeremy L Thompson     CeedInt       num_suboperators;
101b275c451SJeremy L Thompson     CeedOperator *sub_operators;
102b275c451SJeremy L Thompson 
1032b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback));
104b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
105b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
106b275c451SJeremy L Thompson     for (CeedInt i = 0; i < num_suboperators; i++) {
107d04bbc78SJeremy L Thompson       CeedOperator op_sub_fallback;
108d04bbc78SJeremy L Thompson 
109b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback));
1102b730f8bSJeremy L Thompson       CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback));
111805fe78eSJeremy L Thompson     }
112805fe78eSJeremy L Thompson   } else {
1139e77b9c8SJeremy L Thompson     CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL;
1141c66c397SJeremy L Thompson 
1152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback));
1162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback));
1172b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback));
1182b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback));
119805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_input_fields; i++) {
120437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis,
1212b730f8bSJeremy L Thompson                                     op->input_fields[i]->vec));
122805fe78eSJeremy L Thompson     }
123805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_output_fields; i++) {
124437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis,
1252b730f8bSJeremy L Thompson                                     op->output_fields[i]->vec));
126805fe78eSJeremy L Thompson     }
1272b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled));
128febe2972SJeremy L Thompson     if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts));
1299e77b9c8SJeremy L Thompson     // Cleanup
1302b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&qf_fallback));
1312b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqf_fallback));
1322b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqfT_fallback));
133805fe78eSJeremy L Thompson   }
1342b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(op_fallback, op->name));
1352b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fallback));
136b05f7e9fSJeremy L Thompson   // Note: No ref-counting here so we don't get caught in a reference loop.
137b05f7e9fSJeremy L Thompson   //       The op holds the only reference to op_fallback and is responsible for deleting itself and op_fallback.
138805fe78eSJeremy L Thompson   op->op_fallback                 = op_fallback;
139b05f7e9fSJeremy L Thompson   op_fallback->op_fallback_parent = op;
140eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
141eaf62fffSJeremy L Thompson }
142eaf62fffSJeremy L Thompson 
143eaf62fffSJeremy L Thompson /**
144ea61e9acSJeremy L Thompson   @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality
145d04bbc78SJeremy L Thompson 
146d04bbc78SJeremy L Thompson   @param[in]  op          CeedOperator to retrieve fallback for
147d04bbc78SJeremy L Thompson   @param[out] op_fallback Fallback CeedOperator
148d04bbc78SJeremy L Thompson 
149d04bbc78SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
150d04bbc78SJeremy L Thompson 
151d04bbc78SJeremy L Thompson   @ref Developer
152d04bbc78SJeremy L Thompson **/
153d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) {
154d04bbc78SJeremy L Thompson   // Create if needed
1551c66c397SJeremy L Thompson   if (!op->op_fallback) CeedCall(CeedOperatorCreateFallback(op));
156d04bbc78SJeremy L Thompson   if (op->op_fallback) {
157d04bbc78SJeremy L Thompson     bool is_debug;
158d04bbc78SJeremy L Thompson 
1592b730f8bSJeremy L Thompson     CeedCall(CeedIsDebug(op->ceed, &is_debug));
160d04bbc78SJeremy L Thompson     if (is_debug) {
161b275c451SJeremy L Thompson       Ceed        ceed, ceed_fallback;
162d04bbc78SJeremy L Thompson       const char *resource, *resource_fallback;
163d04bbc78SJeremy L Thompson 
164b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetCeed(op, &ceed));
165b275c451SJeremy L Thompson       CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback));
166b275c451SJeremy L Thompson       CeedCall(CeedGetResource(ceed, &resource));
1672b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(ceed_fallback, &resource_fallback));
168d04bbc78SJeremy L Thompson 
16923d4529eSJeremy L Thompson       CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n");
170b275c451SJeremy L Thompson       CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback,
1712b730f8bSJeremy L Thompson                 op->op_fallback);
172d04bbc78SJeremy L Thompson     }
173d04bbc78SJeremy L Thompson   }
174d04bbc78SJeremy L Thompson   *op_fallback = op->op_fallback;
175d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
176d04bbc78SJeremy L Thompson }
177d04bbc78SJeremy L Thompson 
178d04bbc78SJeremy L Thompson /**
179bb229da9SJeremy L Thompson   @brief Get the parent Ceed context associated with a fallback Ceed context for a CeedOperator
180bb229da9SJeremy L Thompson 
181bb229da9SJeremy L Thompson   @param[in]  op     CeedOperator context
182bb229da9SJeremy L Thompson   @param[out] parent Variable to store parent CeedOperator context
183bb229da9SJeremy L Thompson 
184bb229da9SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
185bb229da9SJeremy L Thompson 
186bb229da9SJeremy L Thompson   @ref Developer
187bb229da9SJeremy L Thompson **/
188bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParent(CeedOperator op, CeedOperator *parent) {
189bb229da9SJeremy L Thompson   *parent = op->op_fallback_parent ? op->op_fallback_parent : NULL;
190bb229da9SJeremy L Thompson   return CEED_ERROR_SUCCESS;
191bb229da9SJeremy L Thompson }
192bb229da9SJeremy L Thompson 
193bb229da9SJeremy L Thompson /**
194bb229da9SJeremy L Thompson   @brief Get the parent Ceed context associated with a fallback Ceed context for a CeedOperator
195bb229da9SJeremy L Thompson 
196bb229da9SJeremy L Thompson   @param[in]  op     CeedOperator context
197bb229da9SJeremy L Thompson   @param[out] parent Variable to store parent Ceed context
198bb229da9SJeremy L Thompson 
199bb229da9SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
200bb229da9SJeremy L Thompson 
201bb229da9SJeremy L Thompson   @ref Developer
202bb229da9SJeremy L Thompson **/
203bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParentCeed(CeedOperator op, Ceed *parent) {
204*e984cf9aSJeremy L Thompson   *parent = op->op_fallback_parent ? op->op_fallback_parent->ceed : op->ceed;
205bb229da9SJeremy L Thompson   return CEED_ERROR_SUCCESS;
206bb229da9SJeremy L Thompson }
207bb229da9SJeremy L Thompson 
208bb229da9SJeremy L Thompson /**
209eaf62fffSJeremy L Thompson   @brief Select correct basis matrix pointer based on CeedEvalMode
210eaf62fffSJeremy L Thompson 
211352a5e7cSSebastian Grimberg   @param[in]  basis     CeedBasis from which to get the basis matrix
212eaf62fffSJeremy L Thompson   @param[in]  eval_mode Current basis evaluation mode
213eaf62fffSJeremy L Thompson   @param[in]  identity  Pointer to identity matrix
214eaf62fffSJeremy L Thompson   @param[out] basis_ptr Basis pointer to set
215eaf62fffSJeremy L Thompson 
216eaf62fffSJeremy L Thompson   @ref Developer
217eaf62fffSJeremy L Thompson **/
218352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) {
219eaf62fffSJeremy L Thompson   switch (eval_mode) {
220eaf62fffSJeremy L Thompson     case CEED_EVAL_NONE:
221eaf62fffSJeremy L Thompson       *basis_ptr = identity;
222eaf62fffSJeremy L Thompson       break;
223eaf62fffSJeremy L Thompson     case CEED_EVAL_INTERP:
224352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetInterp(basis, basis_ptr));
225eaf62fffSJeremy L Thompson       break;
226eaf62fffSJeremy L Thompson     case CEED_EVAL_GRAD:
227352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetGrad(basis, basis_ptr));
228352a5e7cSSebastian Grimberg       break;
229352a5e7cSSebastian Grimberg     case CEED_EVAL_DIV:
230352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetDiv(basis, basis_ptr));
231352a5e7cSSebastian Grimberg       break;
232352a5e7cSSebastian Grimberg     case CEED_EVAL_CURL:
233352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetCurl(basis, basis_ptr));
234eaf62fffSJeremy L Thompson       break;
235eaf62fffSJeremy L Thompson     case CEED_EVAL_WEIGHT:
236eaf62fffSJeremy L Thompson       break;  // Caught by QF Assembly
237eaf62fffSJeremy L Thompson   }
238ed9e99e6SJeremy L Thompson   assert(*basis_ptr != NULL);
239352a5e7cSSebastian Grimberg   return CEED_ERROR_SUCCESS;
240eaf62fffSJeremy L Thompson }
241eaf62fffSJeremy L Thompson 
242eaf62fffSJeremy L Thompson /**
243eaf62fffSJeremy L Thompson   @brief Create point block restriction for active operator field
244eaf62fffSJeremy L Thompson 
245eaf62fffSJeremy L Thompson   @param[in]  rstr            Original CeedElemRestriction for active field
246ea61e9acSJeremy L Thompson   @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored
247eaf62fffSJeremy L Thompson 
248eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
249eaf62fffSJeremy L Thompson 
250eaf62fffSJeremy L Thompson   @ref Developer
251eaf62fffSJeremy L Thompson **/
2522b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) {
253eaf62fffSJeremy L Thompson   Ceed           ceed;
2541c66c397SJeremy L Thompson   CeedInt        num_elem, num_comp, shift, elem_size, comp_stride, *pointblock_offsets;
2551c66c397SJeremy L Thompson   CeedSize       l_size;
256eaf62fffSJeremy L Thompson   const CeedInt *offsets;
2571c66c397SJeremy L Thompson 
2581c66c397SJeremy L Thompson   CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed));
2592b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets));
260eaf62fffSJeremy L Thompson 
261eaf62fffSJeremy L Thompson   // Expand offsets
2622b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
2632b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
2642b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
2652b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride));
2662b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2671c66c397SJeremy L Thompson   shift = num_comp;
2682b730f8bSJeremy L Thompson   if (comp_stride != 1) shift *= num_comp;
2692b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets));
270eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_elem * elem_size; i++) {
271eaf62fffSJeremy L Thompson     pointblock_offsets[i] = offsets[i] * shift;
272eaf62fffSJeremy L Thompson   }
273eaf62fffSJeremy L Thompson 
274eaf62fffSJeremy L Thompson   // Create new restriction
2752b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER,
2762b730f8bSJeremy L Thompson                                      pointblock_offsets, pointblock_rstr));
277eaf62fffSJeremy L Thompson 
278eaf62fffSJeremy L Thompson   // Cleanup
2792b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets));
280eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
281eaf62fffSJeremy L Thompson }
282eaf62fffSJeremy L Thompson 
283eaf62fffSJeremy L Thompson /**
284eaf62fffSJeremy L Thompson   @brief Core logic for assembling operator diagonal or point block diagonal
285eaf62fffSJeremy L Thompson 
286eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
287ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
288eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
289eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
290eaf62fffSJeremy L Thompson 
291eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
292eaf62fffSJeremy L Thompson 
293eaf62fffSJeremy L Thompson   @ref Developer
294eaf62fffSJeremy L Thompson **/
2952b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) {
296eaf62fffSJeremy L Thompson   Ceed                ceed;
2971c66c397SJeremy L Thompson   CeedInt             num_input_fields, num_output_fields;
2981c66c397SJeremy L Thompson   CeedInt             layout[3];
299437c7c90SJeremy L Thompson   const CeedScalar   *assembled_qf_array;
300c5f45aeaSJeremy L Thompson   CeedVector          assembled_qf        = NULL;
301c5f45aeaSJeremy L Thompson   CeedElemRestriction assembled_elem_rstr = NULL;
3021c66c397SJeremy L Thompson   CeedQFunction       qf;
303437c7c90SJeremy L Thompson 
3041c66c397SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
3051c66c397SJeremy L Thompson 
3061c66c397SJeremy L Thompson   // Assemble QFunction
307437c7c90SJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
308437c7c90SJeremy L Thompson   CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
309437c7c90SJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request));
310437c7c90SJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout));
311437c7c90SJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr));
312437c7c90SJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
313eaf62fffSJeremy L Thompson 
314ed9e99e6SJeremy L Thompson   // Get assembly data
315437c7c90SJeremy L Thompson   const CeedEvalMode     **eval_modes_in, **eval_modes_out;
316437c7c90SJeremy L Thompson   CeedInt                 *num_eval_modes_in, *num_eval_modes_out, num_active_bases;
317437c7c90SJeremy L Thompson   CeedSize               **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components;
318437c7c90SJeremy L Thompson   CeedElemRestriction     *active_elem_rstrs;
3191c66c397SJeremy L Thompson   CeedBasis               *active_bases;
3201c66c397SJeremy L Thompson   CeedOperatorAssemblyData data;
3211c66c397SJeremy L Thompson 
322437c7c90SJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
323437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in,
324437c7c90SJeremy L Thompson                                                 &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components));
325437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL));
326437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs));
327437c7c90SJeremy L Thompson 
328437c7c90SJeremy L Thompson   // Loop over all active bases
329437c7c90SJeremy L Thompson   for (CeedInt b = 0; b < num_active_bases; b++) {
3301c66c397SJeremy L Thompson     bool                has_eval_none = false;
3311c66c397SJeremy L Thompson     CeedInt             num_elem, num_nodes, num_qpts, num_components;
3321c66c397SJeremy L Thompson     CeedScalar         *elem_diag_array, *identity = NULL;
3331c66c397SJeremy L Thompson     CeedVector          elem_diag;
3347c1dbaffSSebastian Grimberg     CeedElemRestriction diag_elem_rstr;
3351c66c397SJeremy L Thompson 
3361c66c397SJeremy L Thompson     // Assemble point block diagonal restriction, if needed
337eaf62fffSJeremy L Thompson     if (is_pointblock) {
3387c1dbaffSSebastian Grimberg       CeedCall(CeedOperatorCreateActivePointBlockRestriction(active_elem_rstrs[b], &diag_elem_rstr));
3397c1dbaffSSebastian Grimberg     } else {
3407c1dbaffSSebastian Grimberg       CeedCall(CeedElemRestrictionCreateUnsignedCopy(active_elem_rstrs[b], &diag_elem_rstr));
341eaf62fffSJeremy L Thompson     }
342eaf62fffSJeremy L Thompson 
343eaf62fffSJeremy L Thompson     // Create diagonal vector
344437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag));
345eaf62fffSJeremy L Thompson 
346eaf62fffSJeremy L Thompson     // Assemble element operator diagonals
3472b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(elem_diag, 0.0));
3482b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array));
349437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem));
350437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes));
351437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components));
352437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts));
353ed9e99e6SJeremy L Thompson 
354352a5e7cSSebastian Grimberg     // Construct identity matrix for basis if required
355437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) {
356437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE);
357ed9e99e6SJeremy L Thompson     }
358437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) {
359437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE);
360ed9e99e6SJeremy L Thompson     }
361ed9e99e6SJeremy L Thompson     if (has_eval_none) {
3622b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
3632b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0;
364eaf62fffSJeremy L Thompson     }
365352a5e7cSSebastian Grimberg 
366eaf62fffSJeremy L Thompson     // Compute the diagonal of B^T D B
367eaf62fffSJeremy L Thompson     // Each element
368b94338b9SJed Brown     for (CeedSize e = 0; e < num_elem; e++) {
369eaf62fffSJeremy L Thompson       // Each basis eval mode pair
370352a5e7cSSebastian Grimberg       CeedInt      d_out              = 0, q_comp_out;
371352a5e7cSSebastian Grimberg       CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
3721c66c397SJeremy L Thompson 
373437c7c90SJeremy L Thompson       for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) {
3741c66c397SJeremy L Thompson         CeedInt           d_in              = 0, q_comp_in;
375437c7c90SJeremy L Thompson         const CeedScalar *B_t               = NULL;
3761c66c397SJeremy L Thompson         CeedEvalMode      eval_mode_in_prev = CEED_EVAL_NONE;
3771c66c397SJeremy L Thompson 
378352a5e7cSSebastian Grimberg         CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t);
379352a5e7cSSebastian Grimberg         CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out));
380352a5e7cSSebastian Grimberg         if (q_comp_out > 1) {
381352a5e7cSSebastian Grimberg           if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
382352a5e7cSSebastian Grimberg           else B_t = &B_t[(++d_out) * num_qpts * num_nodes];
383352a5e7cSSebastian Grimberg         }
384352a5e7cSSebastian Grimberg         eval_mode_out_prev = eval_modes_out[b][e_out];
385352a5e7cSSebastian Grimberg 
386437c7c90SJeremy L Thompson         for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) {
387437c7c90SJeremy L Thompson           const CeedScalar *B = NULL;
3881c66c397SJeremy L Thompson 
389352a5e7cSSebastian Grimberg           CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B);
390352a5e7cSSebastian Grimberg           CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in));
391352a5e7cSSebastian Grimberg           if (q_comp_in > 1) {
392352a5e7cSSebastian Grimberg             if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
393352a5e7cSSebastian Grimberg             else B = &B[(++d_in) * num_qpts * num_nodes];
394352a5e7cSSebastian Grimberg           }
395352a5e7cSSebastian Grimberg           eval_mode_in_prev = eval_modes_in[b][e_in];
396352a5e7cSSebastian Grimberg 
397eaf62fffSJeremy L Thompson           // Each component
398437c7c90SJeremy L Thompson           for (CeedInt c_out = 0; c_out < num_components; c_out++) {
399437c7c90SJeremy L Thompson             // Each qpt/node pair
4002b730f8bSJeremy L Thompson             for (CeedInt q = 0; q < num_qpts; q++) {
401eaf62fffSJeremy L Thompson               if (is_pointblock) {
402eaf62fffSJeremy L Thompson                 // Point Block Diagonal
403437c7c90SJeremy L Thompson                 for (CeedInt c_in = 0; c_in < num_components; c_in++) {
404b94338b9SJed Brown                   const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
405437c7c90SJeremy L Thompson                   const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]];
4061c66c397SJeremy L Thompson 
4072b730f8bSJeremy L Thompson                   for (CeedInt n = 0; n < num_nodes; n++) {
408437c7c90SJeremy L Thompson                     elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] +=
409437c7c90SJeremy L Thompson                         B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
410eaf62fffSJeremy L Thompson                   }
4112b730f8bSJeremy L Thompson                 }
412eaf62fffSJeremy L Thompson               } else {
413eaf62fffSJeremy L Thompson                 // Diagonal Only
414437c7c90SJeremy L Thompson                 const CeedInt    c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
415437c7c90SJeremy L Thompson                 const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]];
4161c66c397SJeremy L Thompson 
4172b730f8bSJeremy L Thompson                 for (CeedInt n = 0; n < num_nodes; n++) {
418437c7c90SJeremy L Thompson                   elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
419eaf62fffSJeremy L Thompson                 }
420eaf62fffSJeremy L Thompson               }
421eaf62fffSJeremy L Thompson             }
422eaf62fffSJeremy L Thompson           }
4232b730f8bSJeremy L Thompson         }
4242b730f8bSJeremy L Thompson       }
4252b730f8bSJeremy L Thompson     }
4262b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array));
427eaf62fffSJeremy L Thompson 
428eaf62fffSJeremy L Thompson     // Assemble local operator diagonal
4297c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request));
430eaf62fffSJeremy L Thompson 
431eaf62fffSJeremy L Thompson     // Cleanup
4327c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr));
4332b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&elem_diag));
4342b730f8bSJeremy L Thompson     CeedCall(CeedFree(&identity));
435437c7c90SJeremy L Thompson   }
436437c7c90SJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
437437c7c90SJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
438eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
439eaf62fffSJeremy L Thompson }
440eaf62fffSJeremy L Thompson 
441eaf62fffSJeremy L Thompson /**
442eaf62fffSJeremy L Thompson   @brief Core logic for assembling composite operator diagonal
443eaf62fffSJeremy L Thompson 
444eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
445ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
446eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
447eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
448eaf62fffSJeremy L Thompson 
449eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
450eaf62fffSJeremy L Thompson 
451eaf62fffSJeremy L Thompson   @ref Developer
452eaf62fffSJeremy L Thompson **/
4532b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock,
454eaf62fffSJeremy L Thompson                                                                  CeedVector assembled) {
455eaf62fffSJeremy L Thompson   CeedInt       num_sub;
456eaf62fffSJeremy L Thompson   CeedOperator *suboperators;
4571c66c397SJeremy L Thompson 
458c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub));
459c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators));
460eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_sub; i++) {
4616aa95790SJeremy L Thompson     if (is_pointblock) {
4622b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request));
4636aa95790SJeremy L Thompson     } else {
4642b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request));
4656aa95790SJeremy L Thompson     }
466eaf62fffSJeremy L Thompson   }
467eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
468eaf62fffSJeremy L Thompson }
469eaf62fffSJeremy L Thompson 
470eaf62fffSJeremy L Thompson /**
471eaf62fffSJeremy L Thompson   @brief Build nonzero pattern for non-composite operator
472eaf62fffSJeremy L Thompson 
473eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssembleSymbolic()
474eaf62fffSJeremy L Thompson 
475eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble nonzero pattern
476eaf62fffSJeremy L Thompson   @param[in]  offset Offset for number of entries
477eaf62fffSJeremy L Thompson   @param[out] rows   Row number for each entry
478eaf62fffSJeremy L Thompson   @param[out] cols   Column number for each entry
479eaf62fffSJeremy L Thompson 
480eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
481eaf62fffSJeremy L Thompson 
482eaf62fffSJeremy L Thompson   @ref Developer
483eaf62fffSJeremy L Thompson **/
4842b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) {
485f3d47e36SJeremy L Thompson   Ceed                ceed;
486f3d47e36SJeremy L Thompson   bool                is_composite;
4871c66c397SJeremy L Thompson   CeedInt             num_elem, elem_size, num_comp, layout_er[3], local_num_entries;
4881c66c397SJeremy L Thompson   CeedSize            num_nodes, count = 0;
4891c66c397SJeremy L Thompson   CeedScalar         *array;
4901c66c397SJeremy L Thompson   const CeedScalar   *elem_dof_a;
4911c66c397SJeremy L Thompson   CeedVector          index_vec, elem_dof;
4921c66c397SJeremy L Thompson   CeedElemRestriction active_rstr, index_elem_rstr;
4931c66c397SJeremy L Thompson 
494f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
495f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
4966574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
497eaf62fffSJeremy L Thompson 
4982b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL));
4997c1dbaffSSebastian Grimberg   CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr));
5007c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionCreateUnorientedCopy(active_rstr, &index_elem_rstr));
5017c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumElements(index_elem_rstr, &num_elem));
5027c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionGetElementSize(index_elem_rstr, &elem_size));
5037c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumComponents(index_elem_rstr, &num_comp));
5047c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionGetELayout(index_elem_rstr, &layout_er));
5051c66c397SJeremy L Thompson   local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
506eaf62fffSJeremy L Thompson 
507eaf62fffSJeremy L Thompson   // Determine elem_dof relation
5082b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec));
5092b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array));
510ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_nodes; i++) array[i] = i;
5112b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(index_vec, &array));
5122b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof));
5132b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_dof, 0.0));
5147c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionApply(index_elem_rstr, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE));
5152b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a));
5162b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&index_vec));
517eaf62fffSJeremy L Thompson 
518eaf62fffSJeremy L Thompson   // Determine i, j locations for element matrices
519ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
520ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
521ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
522ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
523ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
5242b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2];
5252b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2];
526eaf62fffSJeremy L Thompson             const CeedInt row                = elem_dof_a[elem_dof_index_row];
527eaf62fffSJeremy L Thompson             const CeedInt col                = elem_dof_a[elem_dof_index_col];
528eaf62fffSJeremy L Thompson 
529eaf62fffSJeremy L Thompson             rows[offset + count] = row;
530eaf62fffSJeremy L Thompson             cols[offset + count] = col;
531eaf62fffSJeremy L Thompson             count++;
532eaf62fffSJeremy L Thompson           }
533eaf62fffSJeremy L Thompson         }
534eaf62fffSJeremy L Thompson       }
535eaf62fffSJeremy L Thompson     }
536eaf62fffSJeremy L Thompson   }
5376574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries");
5382b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a));
5392b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_dof));
5407c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionDestroy(&index_elem_rstr));
541eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
542eaf62fffSJeremy L Thompson }
543eaf62fffSJeremy L Thompson 
544eaf62fffSJeremy L Thompson /**
545eaf62fffSJeremy L Thompson   @brief Assemble nonzero entries for non-composite operator
546eaf62fffSJeremy L Thompson 
547eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssemble()
548eaf62fffSJeremy L Thompson 
549eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble
550ea61e9acSJeremy L Thompson   @param[in]  offset Offset for number of entries
551eaf62fffSJeremy L Thompson   @param[out] values Values to assemble into matrix
552eaf62fffSJeremy L Thompson 
553eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
554eaf62fffSJeremy L Thompson 
555eaf62fffSJeremy L Thompson   @ref Developer
556eaf62fffSJeremy L Thompson **/
5572b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) {
558f3d47e36SJeremy L Thompson   Ceed ceed;
559f3d47e36SJeremy L Thompson   bool is_composite;
5601c66c397SJeremy L Thompson 
561f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
562f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
563f3d47e36SJeremy L Thompson 
5646574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
565f3d47e36SJeremy L Thompson 
566f3d47e36SJeremy L Thompson   // Early exit for empty operator
567f3d47e36SJeremy L Thompson   {
568f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
569f3d47e36SJeremy L Thompson 
570f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
571f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
572f3d47e36SJeremy L Thompson   }
573eaf62fffSJeremy L Thompson 
574cefa2673SJeremy L Thompson   if (op->LinearAssembleSingle) {
575cefa2673SJeremy L Thompson     // Backend version
5762b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSingle(op, offset, values));
577cefa2673SJeremy L Thompson     return CEED_ERROR_SUCCESS;
578cefa2673SJeremy L Thompson   } else {
579cefa2673SJeremy L Thompson     // Operator fallback
580cefa2673SJeremy L Thompson     CeedOperator op_fallback;
581cefa2673SJeremy L Thompson 
5822b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
583cefa2673SJeremy L Thompson     if (op_fallback) {
5842b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values));
585cefa2673SJeremy L Thompson       return CEED_ERROR_SUCCESS;
586cefa2673SJeremy L Thompson     }
587cefa2673SJeremy L Thompson   }
588cefa2673SJeremy L Thompson 
589eaf62fffSJeremy L Thompson   // Assemble QFunction
5901c66c397SJeremy L Thompson   const bool     *orients      = NULL;
5911c66c397SJeremy L Thompson   const CeedInt8 *curl_orients = NULL;
5921c66c397SJeremy L Thompson   CeedInt *num_eval_modes_in, *num_eval_modes_out, num_active_bases, num_input_fields, num_output_fields, num_elem, elem_size, num_qpts, num_comp,
5931c66c397SJeremy L Thompson       local_num_entries, layout_qf[3];
5941c66c397SJeremy L Thompson   const CeedScalar        *assembled_qf_array;
595c5f45aeaSJeremy L Thompson   CeedVector               assembled_qf = NULL;
5961c66c397SJeremy L Thompson   CeedRestrictionType      rstr_type;
5971c66c397SJeremy L Thompson   CeedElemRestriction      rstr_q = NULL, active_rstr;
5981c66c397SJeremy L Thompson   const CeedEvalMode     **eval_modes_in, **eval_modes_out;
5991c66c397SJeremy L Thompson   CeedBasis               *bases, basis_in;
6001c66c397SJeremy L Thompson   CeedQFunction            qf;
6011c66c397SJeremy L Thompson   CeedOperatorAssemblyData data;
6021c66c397SJeremy L Thompson   CeedOperatorField       *input_fields, *output_fields;
603eaf62fffSJeremy L Thompson 
6041c66c397SJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
6051c66c397SJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE));
6062b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields));
607eaf62fffSJeremy L Thompson 
608ed9e99e6SJeremy L Thompson   // Get assembly data
6092b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
610437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out,
611437c7c90SJeremy L Thompson                                                 &eval_modes_out, NULL, NULL));
612437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL));
6131c66c397SJeremy L Thompson   basis_in = bases[0];
614eaf62fffSJeremy L Thompson 
6156574a04fSJeremy L Thompson   CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases");
6166574a04fSJeremy L Thompson   CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs");
617eaf62fffSJeremy L Thompson 
6182b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr));
6192b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem));
6202b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size));
6212b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp));
6222b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
6231c66c397SJeremy L Thompson   local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
624eaf62fffSJeremy L Thompson 
6257c1dbaffSSebastian Grimberg   CeedCall(CeedElemRestrictionGetType(active_rstr, &rstr_type));
6267c1dbaffSSebastian Grimberg   if (rstr_type == CEED_RESTRICTION_ORIENTED) {
6277c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionGetOrientations(active_rstr, CEED_MEM_HOST, &orients));
6287c1dbaffSSebastian Grimberg   } else if (rstr_type == CEED_RESTRICTION_CURL_ORIENTED) {
6297c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionGetCurlOrientations(active_rstr, CEED_MEM_HOST, &curl_orients));
6307c1dbaffSSebastian Grimberg   }
6317c1dbaffSSebastian Grimberg 
6327c1dbaffSSebastian Grimberg   // Loop over elements and put in data structure
6332b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
6342b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf));
6352b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_q));
636eaf62fffSJeremy L Thompson 
6377c1dbaffSSebastian Grimberg   // We store B_mat_in, B_mat_out, BTD, elem_mat in row-major order
6381c66c397SJeremy L Thompson   CeedSize           count = 0;
6391c66c397SJeremy L Thompson   CeedScalar        *vals, BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]], elem_mat[elem_size * elem_size];
640437c7c90SJeremy L Thompson   const CeedScalar **B_mats_in, **B_mats_out;
641437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out));
642437c7c90SJeremy L Thompson   const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0];
6431c66c397SJeremy L Thompson 
64428ec399dSJeremy L Thompson   CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals));
645b94338b9SJed Brown   for (CeedSize e = 0; e < num_elem; e++) {
646ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
647ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
648ed9e99e6SJeremy L Thompson         // Compute B^T*D
649b94338b9SJed Brown         for (CeedSize n = 0; n < elem_size; n++) {
650b94338b9SJed Brown           for (CeedSize q = 0; q < num_qpts; q++) {
651437c7c90SJeremy L Thompson             for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) {
652b94338b9SJed Brown               const CeedSize btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in);
653067fd99fSJeremy L Thompson               CeedScalar     sum       = 0.0;
6541c66c397SJeremy L Thompson 
655437c7c90SJeremy L Thompson               for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) {
656b94338b9SJed Brown                 const CeedSize b_out_index     = (num_eval_modes_out[0] * q + e_out) * elem_size + n;
657b94338b9SJed Brown                 const CeedSize eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out;
658b94338b9SJed Brown                 const CeedSize qf_index        = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2];
6591c66c397SJeremy L Thompson 
660067fd99fSJeremy L Thompson                 sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index];
661eaf62fffSJeremy L Thompson               }
662067fd99fSJeremy L Thompson               BTD_mat[btd_index] = sum;
663ed9e99e6SJeremy L Thompson             }
664ed9e99e6SJeremy L Thompson           }
665eaf62fffSJeremy L Thompson         }
6667c1dbaffSSebastian Grimberg 
6677c1dbaffSSebastian Grimberg         // Form element matrix itself (for each block component)
668437c7c90SJeremy L Thompson         CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0]));
669eaf62fffSJeremy L Thompson 
6707c1dbaffSSebastian Grimberg         // Transform the element matrix if required
6717c1dbaffSSebastian Grimberg         if (orients) {
6727c1dbaffSSebastian Grimberg           const bool *elem_orients = &orients[e * elem_size];
6731c66c397SJeremy L Thompson 
6747c1dbaffSSebastian Grimberg           for (CeedInt i = 0; i < elem_size; i++) {
6757c1dbaffSSebastian Grimberg             for (CeedInt j = 0; j < elem_size; j++) {
6767c1dbaffSSebastian Grimberg               elem_mat[i * elem_size + j] *= elem_orients[i] ? -1.0 : 1.0;
6777c1dbaffSSebastian Grimberg               elem_mat[i * elem_size + j] *= elem_orients[j] ? -1.0 : 1.0;
6787c1dbaffSSebastian Grimberg             }
6797c1dbaffSSebastian Grimberg           }
6807c1dbaffSSebastian Grimberg         } else if (curl_orients) {
6817c1dbaffSSebastian Grimberg           const CeedInt8 *elem_curl_orients = &curl_orients[e * 3 * elem_size];
6827c1dbaffSSebastian Grimberg           CeedScalar      o_elem_mat[elem_size * elem_size];
6831c66c397SJeremy L Thompson 
6847c1dbaffSSebastian Grimberg           // T^T*(B^T*D*B)
6857c1dbaffSSebastian Grimberg           for (CeedInt i = 0; i < elem_size; i++) {
6867c1dbaffSSebastian Grimberg             for (CeedInt j = 0; j < elem_size; j++) {
6877c1dbaffSSebastian Grimberg               o_elem_mat[i * elem_size + j] = elem_mat[i * elem_size + j] * elem_curl_orients[3 * i + 1] +
6887c1dbaffSSebastian Grimberg                                               (i > 0 ? elem_mat[(i - 1) * elem_size + j] * elem_curl_orients[3 * i - 1] : 0.0) +
6897c1dbaffSSebastian Grimberg                                               (i < elem_size - 1 ? elem_mat[(i + 1) * elem_size + j] * elem_curl_orients[3 * i + 3] : 0.0);
6907c1dbaffSSebastian Grimberg             }
6917c1dbaffSSebastian Grimberg           }
6927c1dbaffSSebastian Grimberg           // T^T*(B^T*D*B)*T
6937c1dbaffSSebastian Grimberg           for (CeedInt i = 0; i < elem_size; i++) {
6947c1dbaffSSebastian Grimberg             for (CeedInt j = 0; j < elem_size; j++) {
6957c1dbaffSSebastian Grimberg               elem_mat[i * elem_size + j] = o_elem_mat[i * elem_size + j] * elem_curl_orients[3 * j + 1] +
6967c1dbaffSSebastian Grimberg                                             (j > 0 ? o_elem_mat[i * elem_size + j - 1] * elem_curl_orients[3 * j - 1] : 0.0) +
6977c1dbaffSSebastian Grimberg                                             (j < elem_size - 1 ? o_elem_mat[i * elem_size + j + 1] * elem_curl_orients[3 * j + 3] : 0.0);
6987c1dbaffSSebastian Grimberg             }
6997c1dbaffSSebastian Grimberg           }
7007c1dbaffSSebastian Grimberg         }
7017c1dbaffSSebastian Grimberg 
7027c1dbaffSSebastian Grimberg         // Put element matrix in coordinate data structure
703ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
704ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
705eaf62fffSJeremy L Thompson             vals[offset + count] = elem_mat[i * elem_size + j];
706eaf62fffSJeremy L Thompson             count++;
707eaf62fffSJeremy L Thompson           }
708eaf62fffSJeremy L Thompson         }
709eaf62fffSJeremy L Thompson       }
710eaf62fffSJeremy L Thompson     }
711eaf62fffSJeremy L Thompson   }
7126574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries");
7132b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(values, &vals));
714eaf62fffSJeremy L Thompson 
7152b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
7162b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
717eaf62fffSJeremy L Thompson 
7187c1dbaffSSebastian Grimberg   if (rstr_type == CEED_RESTRICTION_ORIENTED) {
7197c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionRestoreOrientations(active_rstr, &orients));
7207c1dbaffSSebastian Grimberg   } else if (rstr_type == CEED_RESTRICTION_CURL_ORIENTED) {
7217c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionRestoreCurlOrientations(active_rstr, &curl_orients));
7227c1dbaffSSebastian Grimberg   }
723eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
724eaf62fffSJeremy L Thompson }
725eaf62fffSJeremy L Thompson 
726eaf62fffSJeremy L Thompson /**
727eaf62fffSJeremy L Thompson   @brief Count number of entries for assembled CeedOperator
728eaf62fffSJeremy L Thompson 
729eaf62fffSJeremy L Thompson   @param[in]  op          CeedOperator to assemble
730eaf62fffSJeremy L Thompson   @param[out] num_entries Number of entries in assembled representation
731eaf62fffSJeremy L Thompson 
732eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
733eaf62fffSJeremy L Thompson 
734eaf62fffSJeremy L Thompson   @ref Utility
735eaf62fffSJeremy L Thompson **/
736b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) {
737b275c451SJeremy L Thompson   bool                is_composite;
738eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_comp;
7391c66c397SJeremy L Thompson   CeedElemRestriction rstr;
740eaf62fffSJeremy L Thompson 
741b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
7426574a04fSJeremy L Thompson   CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
7432b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr));
7442b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
7452b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
7462b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
747b94338b9SJed Brown   *num_entries = (CeedSize)elem_size * num_comp * elem_size * num_comp * num_elem;
748eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
749eaf62fffSJeremy L Thompson }
750eaf62fffSJeremy L Thompson 
751eaf62fffSJeremy L Thompson /**
752ea61e9acSJeremy L Thompson   @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator
753eaf62fffSJeremy L Thompson 
754eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
75585bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
756eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
757eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
75885bb9dcfSJeremy L Thompson   @param[in]  basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
759eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
76085bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
76185bb9dcfSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator, or NULL
762eaf62fffSJeremy L Thompson 
763eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
764eaf62fffSJeremy L Thompson 
765eaf62fffSJeremy L Thompson   @ref Developer
766eaf62fffSJeremy L Thompson **/
7672b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
7682b730f8bSJeremy L Thompson                                             CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
7691c66c397SJeremy L Thompson   bool                is_composite;
770eaf62fffSJeremy L Thompson   Ceed                ceed;
7711c66c397SJeremy L Thompson   CeedInt             num_comp;
77285bb9dcfSJeremy L Thompson   CeedVector          mult_vec         = NULL;
7731c66c397SJeremy L Thompson   CeedElemRestriction rstr_p_mult_fine = NULL, rstr_fine = NULL;
7741c66c397SJeremy L Thompson 
7752b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
776eaf62fffSJeremy L Thompson 
777eaf62fffSJeremy L Thompson   // Check for composite operator
7782b730f8bSJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op_fine, &is_composite));
7796574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported");
780eaf62fffSJeremy L Thompson 
781eaf62fffSJeremy L Thompson   // Coarse Grid
7822b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse));
783eaf62fffSJeremy L Thompson   // -- Clone input fields
78492ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) {
785eaf62fffSJeremy L Thompson     if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) {
786437c7c90SJeremy L Thompson       rstr_fine = op_fine->input_fields[i]->elem_rstr;
7872b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
788eaf62fffSJeremy L Thompson     } else {
789437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr,
7902b730f8bSJeremy L Thompson                                     op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec));
791eaf62fffSJeremy L Thompson     }
792eaf62fffSJeremy L Thompson   }
793eaf62fffSJeremy L Thompson   // -- Clone output fields
79492ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) {
795eaf62fffSJeremy L Thompson     if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) {
7962b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
797eaf62fffSJeremy L Thompson     } else {
798437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr,
7992b730f8bSJeremy L Thompson                                     op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec));
800eaf62fffSJeremy L Thompson     }
801eaf62fffSJeremy L Thompson   }
802af99e877SJeremy L Thompson   // -- Clone QFunctionAssemblyData
8032b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled));
804eaf62fffSJeremy L Thompson 
805eaf62fffSJeremy L Thompson   // Multiplicity vector
80685bb9dcfSJeremy L Thompson   if (op_restrict || op_prolong) {
80785bb9dcfSJeremy L Thompson     CeedVector          mult_e_vec;
8081c66c397SJeremy L Thompson     CeedRestrictionType rstr_type;
80985bb9dcfSJeremy L Thompson 
8107c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionGetType(rstr_fine, &rstr_type));
8117c1dbaffSSebastian Grimberg     CeedCheck(rstr_type != CEED_RESTRICTION_CURL_ORIENTED, ceed, CEED_ERROR_UNSUPPORTED,
8127c1dbaffSSebastian Grimberg               "Element restrictions created with CeedElemRestrictionCreateCurlOriented are not supported");
8136574a04fSJeremy L Thompson     CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector");
8147c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine));
8152b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec));
8162b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_e_vec, 0.0));
817c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE));
8182b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_vec, 0.0));
819c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE));
8202b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&mult_e_vec));
8212b730f8bSJeremy L Thompson     CeedCall(CeedVectorReciprocal(mult_vec));
82285bb9dcfSJeremy L Thompson   }
823eaf62fffSJeremy L Thompson 
824addd79feSZach Atkins   // Clone name
825addd79feSZach Atkins   bool   has_name = op_fine->name;
826addd79feSZach Atkins   size_t name_len = op_fine->name ? strlen(op_fine->name) : 0;
827addd79feSZach Atkins   CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name));
828addd79feSZach Atkins 
82983d6adf3SZach Atkins   // Check that coarse to fine basis is provided if prolong/restrict operators are requested
8306574a04fSJeremy L Thompson   CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE,
8316574a04fSJeremy L Thompson             "Prolongation or restriction operator creation requires coarse-to-fine basis");
83283d6adf3SZach Atkins 
83385bb9dcfSJeremy L Thompson   // Restriction/Prolongation Operators
8342b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp));
835addd79feSZach Atkins 
836addd79feSZach Atkins   // Restriction
837addd79feSZach Atkins   if (op_restrict) {
838eaf62fffSJeremy L Thompson     CeedInt             *num_comp_r_data;
83985bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_r;
8401c66c397SJeremy L Thompson     CeedQFunction        qf_restrict;
84185bb9dcfSJeremy L Thompson 
84285bb9dcfSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict));
8432b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_r_data));
844eaf62fffSJeremy L Thompson     num_comp_r_data[0] = num_comp;
8452b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r));
8462b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data));
8472b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r));
8482b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_r));
8492b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE));
8502b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE));
8512b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP));
8522b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp));
853eaf62fffSJeremy L Thompson 
8542b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict));
8552b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
856c17ec2beSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec));
8572b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
858eaf62fffSJeremy L Thompson 
859addd79feSZach Atkins     // Set name
860addd79feSZach Atkins     char *restriction_name;
8611c66c397SJeremy L Thompson 
862addd79feSZach Atkins     CeedCall(CeedCalloc(17 + name_len, &restriction_name));
863addd79feSZach Atkins     sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
864addd79feSZach Atkins     CeedCall(CeedOperatorSetName(*op_restrict, restriction_name));
865addd79feSZach Atkins     CeedCall(CeedFree(&restriction_name));
866addd79feSZach Atkins 
867addd79feSZach Atkins     // Check
868addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_restrict));
869addd79feSZach Atkins 
870addd79feSZach Atkins     // Cleanup
871addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_restrict));
872addd79feSZach Atkins   }
873addd79feSZach Atkins 
874eaf62fffSJeremy L Thompson   // Prolongation
875addd79feSZach Atkins   if (op_prolong) {
876eaf62fffSJeremy L Thompson     CeedInt             *num_comp_p_data;
87785bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_p;
8781c66c397SJeremy L Thompson     CeedQFunction        qf_prolong;
87985bb9dcfSJeremy L Thompson 
88085bb9dcfSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong));
8812b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_p_data));
882eaf62fffSJeremy L Thompson     num_comp_p_data[0] = num_comp;
8832b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p));
8842b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data));
8852b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p));
8862b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_p));
8872b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP));
8882b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE));
8892b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE));
8902b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp));
891eaf62fffSJeremy L Thompson 
8922b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong));
8932b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
894c17ec2beSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec));
8952b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
896eaf62fffSJeremy L Thompson 
897addd79feSZach Atkins     // Set name
898ea6b5821SJeremy L Thompson     char *prolongation_name;
8991c66c397SJeremy L Thompson 
9002b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(18 + name_len, &prolongation_name));
9012b730f8bSJeremy L Thompson     sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
9022b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name));
9032b730f8bSJeremy L Thompson     CeedCall(CeedFree(&prolongation_name));
904addd79feSZach Atkins 
905addd79feSZach Atkins     // Check
906addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_prolong));
907addd79feSZach Atkins 
908addd79feSZach Atkins     // Cleanup
909addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_prolong));
910ea6b5821SJeremy L Thompson   }
911ea6b5821SJeremy L Thompson 
91258e4b056SJeremy L Thompson   // Check
91358e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_coarse));
91458e4b056SJeremy L Thompson 
915eaf62fffSJeremy L Thompson   // Cleanup
9162b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_vec));
917c17ec2beSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine));
9182b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&basis_c_to_f));
919eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
920eaf62fffSJeremy L Thompson }
921eaf62fffSJeremy L Thompson 
922eaf62fffSJeremy L Thompson /**
923eaf62fffSJeremy L Thompson   @brief Build 1D mass matrix and Laplacian with perturbation
924eaf62fffSJeremy L Thompson 
925eaf62fffSJeremy L Thompson   @param[in]  interp_1d   Interpolation matrix in one dimension
926eaf62fffSJeremy L Thompson   @param[in]  grad_1d     Gradient matrix in one dimension
927eaf62fffSJeremy L Thompson   @param[in]  q_weight_1d Quadrature weights in one dimension
928eaf62fffSJeremy L Thompson   @param[in]  P_1d        Number of basis nodes in one dimension
929eaf62fffSJeremy L Thompson   @param[in]  Q_1d        Number of quadrature points in one dimension
930eaf62fffSJeremy L Thompson   @param[in]  dim         Dimension of basis
931eaf62fffSJeremy L Thompson   @param[out] mass        Assembled mass matrix in one dimension
932eaf62fffSJeremy L Thompson   @param[out] laplace     Assembled perturbed Laplacian in one dimension
933eaf62fffSJeremy L Thompson 
934eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
935eaf62fffSJeremy L Thompson 
936eaf62fffSJeremy L Thompson   @ref Developer
937eaf62fffSJeremy L Thompson **/
9382c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff
9392c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d,
9402c2ea1dbSJeremy L Thompson                                 CeedInt dim, CeedScalar *mass, CeedScalar *laplace) {
9412b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
942eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
943eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
9442b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j];
945eaf62fffSJeremy L Thompson       mass[i + j * P_1d] = sum;
946eaf62fffSJeremy L Thompson     }
9472b730f8bSJeremy L Thompson   }
948eaf62fffSJeremy L Thompson   // -- Laplacian
9492b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
950eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
951eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
9521c66c397SJeremy L Thompson 
9532b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j];
954eaf62fffSJeremy L Thompson       laplace[i + j * P_1d] = sum;
955eaf62fffSJeremy L Thompson     }
9562b730f8bSJeremy L Thompson   }
957eaf62fffSJeremy L Thompson   CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4;
9582b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation;
959eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
960eaf62fffSJeremy L Thompson }
9612c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn
962eaf62fffSJeremy L Thompson 
963eaf62fffSJeremy L Thompson /// @}
964eaf62fffSJeremy L Thompson 
965eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
966480fae85SJeremy L Thompson /// CeedOperator Backend API
967480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
968480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend
969480fae85SJeremy L Thompson /// @{
970480fae85SJeremy L Thompson 
971480fae85SJeremy L Thompson /**
972480fae85SJeremy L Thompson   @brief Create object holding CeedQFunction assembly data for CeedOperator
973480fae85SJeremy L Thompson 
974480fae85SJeremy L Thompson   @param[in]  ceed A Ceed object where the CeedQFunctionAssemblyData will be created
975ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored
976480fae85SJeremy L Thompson 
977480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
978480fae85SJeremy L Thompson 
979480fae85SJeremy L Thompson   @ref Backend
980480fae85SJeremy L Thompson **/
981ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) {
9822b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
983480fae85SJeremy L Thompson   (*data)->ref_count = 1;
984480fae85SJeremy L Thompson   (*data)->ceed      = ceed;
9852b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
986480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
987480fae85SJeremy L Thompson }
988480fae85SJeremy L Thompson 
989480fae85SJeremy L Thompson /**
990480fae85SJeremy L Thompson   @brief Increment the reference counter for a CeedQFunctionAssemblyData
991480fae85SJeremy L Thompson 
992ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter
993480fae85SJeremy L Thompson 
994480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
995480fae85SJeremy L Thompson 
996480fae85SJeremy L Thompson   @ref Backend
997480fae85SJeremy L Thompson **/
998480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) {
999480fae85SJeremy L Thompson   data->ref_count++;
1000480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1001480fae85SJeremy L Thompson }
1002480fae85SJeremy L Thompson 
1003480fae85SJeremy L Thompson /**
1004beecbf24SJeremy L Thompson   @brief Set re-use of CeedQFunctionAssemblyData
10058b919e6bSJeremy L Thompson 
1006ea61e9acSJeremy L Thompson   @param[in,out] data       CeedQFunctionAssemblyData to mark for reuse
1007ea61e9acSJeremy L Thompson   @param[in]     reuse_data Boolean flag indicating data re-use
10088b919e6bSJeremy L Thompson 
10098b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
10108b919e6bSJeremy L Thompson 
10118b919e6bSJeremy L Thompson   @ref Backend
10128b919e6bSJeremy L Thompson **/
10132b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) {
1014beecbf24SJeremy L Thompson   data->reuse_data        = reuse_data;
1015beecbf24SJeremy L Thompson   data->needs_data_update = true;
1016beecbf24SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1017beecbf24SJeremy L Thompson }
1018beecbf24SJeremy L Thompson 
1019beecbf24SJeremy L Thompson /**
1020beecbf24SJeremy L Thompson   @brief Mark QFunctionAssemblyData as stale
1021beecbf24SJeremy L Thompson 
1022ea61e9acSJeremy L Thompson   @param[in,out] data              CeedQFunctionAssemblyData to mark as stale
1023ea61e9acSJeremy L Thompson   @param[in]     needs_data_update Boolean flag indicating if update is needed or completed
1024beecbf24SJeremy L Thompson 
1025beecbf24SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1026beecbf24SJeremy L Thompson 
1027beecbf24SJeremy L Thompson   @ref Backend
1028beecbf24SJeremy L Thompson **/
10292b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) {
1030beecbf24SJeremy L Thompson   data->needs_data_update = needs_data_update;
10318b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
10328b919e6bSJeremy L Thompson }
10338b919e6bSJeremy L Thompson 
10348b919e6bSJeremy L Thompson /**
10358b919e6bSJeremy L Thompson   @brief Determine if QFunctionAssemblyData needs update
10368b919e6bSJeremy L Thompson 
10378b919e6bSJeremy L Thompson   @param[in]  data             CeedQFunctionAssemblyData to mark as stale
10388b919e6bSJeremy L Thompson   @param[out] is_update_needed Boolean flag indicating if re-assembly is required
10398b919e6bSJeremy L Thompson 
10408b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
10418b919e6bSJeremy L Thompson 
10428b919e6bSJeremy L Thompson   @ref Backend
10438b919e6bSJeremy L Thompson **/
10442b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) {
1045beecbf24SJeremy L Thompson   *is_update_needed = !data->reuse_data || data->needs_data_update;
10468b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
10478b919e6bSJeremy L Thompson }
10488b919e6bSJeremy L Thompson 
10498b919e6bSJeremy L Thompson /**
1050ea61e9acSJeremy L Thompson   @brief Copy the pointer to a CeedQFunctionAssemblyData.
10514385fb7fSSebastian Grimberg 
1052ea61e9acSJeremy L Thompson   Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`.
1053512bb800SJeremy L Thompson 
1054512bb800SJeremy L Thompson   Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a
1055512bb800SJeremy L Thompson         CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this
1056512bb800SJeremy L Thompson         CeedQFunctionAssemblyData.
1057480fae85SJeremy L Thompson 
1058ea61e9acSJeremy L Thompson   @param[in]     data      CeedQFunctionAssemblyData to copy reference to
1059ea61e9acSJeremy L Thompson   @param[in,out] data_copy Variable to store copied reference
1060480fae85SJeremy L Thompson 
1061480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1062480fae85SJeremy L Thompson 
1063480fae85SJeremy L Thompson   @ref Backend
1064480fae85SJeremy L Thompson **/
10652b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) {
10662b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReference(data));
10672b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy));
1068480fae85SJeremy L Thompson   *data_copy = data;
1069480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1070480fae85SJeremy L Thompson }
1071480fae85SJeremy L Thompson 
1072480fae85SJeremy L Thompson /**
1073480fae85SJeremy L Thompson   @brief Get setup status for internal objects for CeedQFunctionAssemblyData
1074480fae85SJeremy L Thompson 
1075ea61e9acSJeremy L Thompson   @param[in]  data     CeedQFunctionAssemblyData to retrieve status
1076480fae85SJeremy L Thompson   @param[out] is_setup Boolean flag for setup status
1077480fae85SJeremy L Thompson 
1078480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1079480fae85SJeremy L Thompson 
1080480fae85SJeremy L Thompson   @ref Backend
1081480fae85SJeremy L Thompson **/
10822b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) {
1083480fae85SJeremy L Thompson   *is_setup = data->is_setup;
1084480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1085480fae85SJeremy L Thompson }
1086480fae85SJeremy L Thompson 
1087480fae85SJeremy L Thompson /**
1088480fae85SJeremy L Thompson   @brief Set internal objects for CeedQFunctionAssemblyData
1089480fae85SJeremy L Thompson 
1090ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to set objects
1091480fae85SJeremy L Thompson   @param[in]     vec  CeedVector to store assembled CeedQFunction at quadrature points
1092480fae85SJeremy L Thompson   @param[in]     rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction
1093480fae85SJeremy L Thompson 
1094480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1095480fae85SJeremy L Thompson 
1096480fae85SJeremy L Thompson   @ref Backend
1097480fae85SJeremy L Thompson **/
10982b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) {
10992b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(vec, &data->vec));
11002b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr));
1101480fae85SJeremy L Thompson 
1102480fae85SJeremy L Thompson   data->is_setup = true;
1103480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1104480fae85SJeremy L Thompson }
1105480fae85SJeremy L Thompson 
11062b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) {
11076574a04fSJeremy L Thompson   CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first.");
1108480fae85SJeremy L Thompson 
11092b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(data->vec, vec));
11102b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr));
1111480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1112480fae85SJeremy L Thompson }
1113480fae85SJeremy L Thompson 
1114480fae85SJeremy L Thompson /**
1115480fae85SJeremy L Thompson   @brief Destroy CeedQFunctionAssemblyData
1116480fae85SJeremy L Thompson 
1117ea61e9acSJeremy L Thompson   @param[in,out] data  CeedQFunctionAssemblyData to destroy
1118480fae85SJeremy L Thompson 
1119480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1120480fae85SJeremy L Thompson 
1121480fae85SJeremy L Thompson   @ref Backend
1122480fae85SJeremy L Thompson **/
1123480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) {
1124ad6481ceSJeremy L Thompson   if (!*data || --(*data)->ref_count > 0) {
1125ad6481ceSJeremy L Thompson     *data = NULL;
1126ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1127ad6481ceSJeremy L Thompson   }
11282b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
11292b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&(*data)->vec));
11302b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr));
1131480fae85SJeremy L Thompson 
11322b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1133480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1134480fae85SJeremy L Thompson }
1135480fae85SJeremy L Thompson 
1136ed9e99e6SJeremy L Thompson /**
1137ed9e99e6SJeremy L Thompson   @brief Get CeedOperatorAssemblyData
1138ed9e99e6SJeremy L Thompson 
1139ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to assemble
1140ed9e99e6SJeremy L Thompson   @param[out] data CeedQFunctionAssemblyData
1141ed9e99e6SJeremy L Thompson 
1142ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1143ed9e99e6SJeremy L Thompson 
1144ed9e99e6SJeremy L Thompson   @ref Backend
1145ed9e99e6SJeremy L Thompson **/
11462b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) {
1147ed9e99e6SJeremy L Thompson   if (!op->op_assembled) {
1148ed9e99e6SJeremy L Thompson     CeedOperatorAssemblyData data;
1149ed9e99e6SJeremy L Thompson 
11502b730f8bSJeremy L Thompson     CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data));
1151ed9e99e6SJeremy L Thompson     op->op_assembled = data;
1152ed9e99e6SJeremy L Thompson   }
1153ed9e99e6SJeremy L Thompson   *data = op->op_assembled;
1154ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1155ed9e99e6SJeremy L Thompson }
1156ed9e99e6SJeremy L Thompson 
1157ed9e99e6SJeremy L Thompson /**
1158ba746a46SJeremy L Thompson   @brief Create object holding CeedOperator assembly data.
1159ba746a46SJeremy L Thompson 
1160ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator.
1161ba746a46SJeremy L Thompson   An array with references to the corresponding active CeedElemRestrictions is also stored.
1162ba746a46SJeremy L Thompson   For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis.
1163ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each
1164ba746a46SJeremy L Thompson CeedEvalMode.
1165ba746a46SJeremy L Thompson   The number of input columns across all active bases for the assembled CeedQFunction is also stored.
1166ba746a46SJeremy L Thompson   Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes.
1167ed9e99e6SJeremy L Thompson 
1168ea61e9acSJeremy L Thompson   @param[in]  ceed Ceed object where the CeedOperatorAssemblyData will be created
1169ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to be assembled
1170ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored
1171ed9e99e6SJeremy L Thompson 
1172ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1173ed9e99e6SJeremy L Thompson 
1174ed9e99e6SJeremy L Thompson   @ref Backend
1175ed9e99e6SJeremy L Thompson **/
11762b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) {
11771c66c397SJeremy L Thompson   CeedInt             num_active_bases = 0, num_input_fields, *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0, num_output_fields;
11781c66c397SJeremy L Thompson   CeedSize          **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL;
11791c66c397SJeremy L Thompson   CeedEvalMode      **eval_modes_in = NULL, **eval_modes_out = NULL;
11801c66c397SJeremy L Thompson   CeedQFunctionField *qf_fields;
11811c66c397SJeremy L Thompson   CeedQFunction       qf;
11821c66c397SJeremy L Thompson   CeedOperatorField  *op_fields;
1183437c7c90SJeremy L Thompson 
1184437c7c90SJeremy L Thompson   // Allocate
11852b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1186ed9e99e6SJeremy L Thompson   (*data)->ceed = ceed;
11872b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1188ed9e99e6SJeremy L Thompson 
1189ed9e99e6SJeremy L Thompson   // Build OperatorAssembly data
11902b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
11912b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL));
11922b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL));
1193ed9e99e6SJeremy L Thompson 
1194ed9e99e6SJeremy L Thompson   // Determine active input basis
1195ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
1196ed9e99e6SJeremy L Thompson     CeedVector vec;
11971c66c397SJeremy L Thompson 
11982b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1199ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
12007c1dbaffSSebastian Grimberg       CeedInt      index = -1, num_comp, q_comp;
12011c66c397SJeremy L Thompson       CeedEvalMode eval_mode;
12021c66c397SJeremy L Thompson       CeedBasis    basis_in = NULL;
12031c66c397SJeremy L Thompson 
12042b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in));
12052b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1206352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp));
1207352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp));
1208437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < num_active_bases; i++) {
1209437c7c90SJeremy L Thompson         if ((*data)->active_bases[i] == basis_in) index = i;
1210437c7c90SJeremy L Thompson       }
1211437c7c90SJeremy L Thompson       if (index == -1) {
1212437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_in;
12131c66c397SJeremy L Thompson 
1214437c7c90SJeremy L Thompson         index = num_active_bases;
1215437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases));
1216437c7c90SJeremy L Thompson         (*data)->active_bases[num_active_bases] = NULL;
1217437c7c90SJeremy L Thompson         CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases]));
1218437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs));
1219437c7c90SJeremy L Thompson         (*data)->active_elem_rstrs[num_active_bases] = NULL;
1220437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in));
1221437c7c90SJeremy L Thompson         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases]));
1222437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in));
1223437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out));
1224437c7c90SJeremy L Thompson         num_eval_modes_in[index]  = 0;
1225437c7c90SJeremy L Thompson         num_eval_modes_out[index] = 0;
1226437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in));
1227437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out));
1228437c7c90SJeremy L Thompson         eval_modes_in[index]  = NULL;
1229437c7c90SJeremy L Thompson         eval_modes_out[index] = NULL;
1230437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in));
1231437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out));
1232437c7c90SJeremy L Thompson         eval_mode_offsets_in[index]  = NULL;
1233437c7c90SJeremy L Thompson         eval_mode_offsets_out[index] = NULL;
1234437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in));
1235437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out));
1236437c7c90SJeremy L Thompson         (*data)->assembled_bases_in[index]  = NULL;
1237437c7c90SJeremy L Thompson         (*data)->assembled_bases_out[index] = NULL;
1238437c7c90SJeremy L Thompson         num_active_bases++;
1239437c7c90SJeremy L Thompson       }
1240352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1241352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1242352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index]));
1243352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index]));
1244352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1245437c7c90SJeremy L Thompson           eval_modes_in[index][num_eval_modes_in[index] + d]        = eval_mode;
1246437c7c90SJeremy L Thompson           eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset;
1247352a5e7cSSebastian Grimberg           offset += num_comp;
1248ed9e99e6SJeremy L Thompson         }
1249352a5e7cSSebastian Grimberg         num_eval_modes_in[index] += q_comp;
1250ed9e99e6SJeremy L Thompson       }
1251ed9e99e6SJeremy L Thompson     }
1252ed9e99e6SJeremy L Thompson   }
1253437c7c90SJeremy L Thompson   (*data)->num_eval_modes_in    = num_eval_modes_in;
1254437c7c90SJeremy L Thompson   (*data)->eval_modes_in        = eval_modes_in;
1255437c7c90SJeremy L Thompson   (*data)->eval_mode_offsets_in = eval_mode_offsets_in;
1256ed9e99e6SJeremy L Thompson 
1257ed9e99e6SJeremy L Thompson   // Determine active output basis
12582b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields));
12592b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields));
1260437c7c90SJeremy L Thompson   offset = 0;
1261ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_output_fields; i++) {
1262ed9e99e6SJeremy L Thompson     CeedVector vec;
12631c66c397SJeremy L Thompson 
12642b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1265ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
12667c1dbaffSSebastian Grimberg       CeedInt      index = -1, num_comp, q_comp;
12671c66c397SJeremy L Thompson       CeedEvalMode eval_mode;
12681c66c397SJeremy L Thompson       CeedBasis    basis_out = NULL;
12691c66c397SJeremy L Thompson 
1270437c7c90SJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out));
12712b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1272352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp));
1273352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp));
1274437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < num_active_bases; i++) {
1275437c7c90SJeremy L Thompson         if ((*data)->active_bases[i] == basis_out) index = i;
1276437c7c90SJeremy L Thompson       }
1277437c7c90SJeremy L Thompson       if (index == -1) {
1278437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_out;
12791c66c397SJeremy L Thompson 
1280437c7c90SJeremy L Thompson         index = num_active_bases;
1281437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases));
1282437c7c90SJeremy L Thompson         (*data)->active_bases[num_active_bases] = NULL;
1283437c7c90SJeremy L Thompson         CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases]));
1284437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs));
1285437c7c90SJeremy L Thompson         (*data)->active_elem_rstrs[num_active_bases] = NULL;
1286437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out));
1287437c7c90SJeremy L Thompson         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases]));
1288437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in));
1289437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out));
1290437c7c90SJeremy L Thompson         num_eval_modes_in[index]  = 0;
1291437c7c90SJeremy L Thompson         num_eval_modes_out[index] = 0;
1292437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in));
1293437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out));
1294437c7c90SJeremy L Thompson         eval_modes_in[index]  = NULL;
1295437c7c90SJeremy L Thompson         eval_modes_out[index] = NULL;
1296437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in));
1297437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out));
1298437c7c90SJeremy L Thompson         eval_mode_offsets_in[index]  = NULL;
1299437c7c90SJeremy L Thompson         eval_mode_offsets_out[index] = NULL;
1300437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in));
1301437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out));
1302437c7c90SJeremy L Thompson         (*data)->assembled_bases_in[index]  = NULL;
1303437c7c90SJeremy L Thompson         (*data)->assembled_bases_out[index] = NULL;
1304437c7c90SJeremy L Thompson         num_active_bases++;
1305437c7c90SJeremy L Thompson       }
1306352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1307352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1308352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index]));
1309352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index]));
1310352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1311437c7c90SJeremy L Thompson           eval_modes_out[index][num_eval_modes_out[index] + d]        = eval_mode;
1312437c7c90SJeremy L Thompson           eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset;
1313352a5e7cSSebastian Grimberg           offset += num_comp;
1314ed9e99e6SJeremy L Thompson         }
1315352a5e7cSSebastian Grimberg         num_eval_modes_out[index] += q_comp;
1316ed9e99e6SJeremy L Thompson       }
1317ed9e99e6SJeremy L Thompson     }
1318ed9e99e6SJeremy L Thompson   }
1319437c7c90SJeremy L Thompson   (*data)->num_output_components = offset;
1320437c7c90SJeremy L Thompson   (*data)->num_eval_modes_out    = num_eval_modes_out;
1321437c7c90SJeremy L Thompson   (*data)->eval_modes_out        = eval_modes_out;
1322437c7c90SJeremy L Thompson   (*data)->eval_mode_offsets_out = eval_mode_offsets_out;
1323437c7c90SJeremy L Thompson   (*data)->num_active_bases      = num_active_bases;
1324ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1325ed9e99e6SJeremy L Thompson }
1326ed9e99e6SJeremy L Thompson 
1327ed9e99e6SJeremy L Thompson /**
1328ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedEvalModes for assembly.
1329ba746a46SJeremy L Thompson 
1330ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1331ed9e99e6SJeremy L Thompson 
1332ed9e99e6SJeremy L Thompson   @param[in]  data                  CeedOperatorAssemblyData
1333ba746a46SJeremy L Thompson   @param[out] num_active_bases      Total number of active bases
1334c5d0f995SJed Brown   @param[out] num_eval_modes_in     Pointer to hold array of numbers of input CeedEvalModes, or NULL.
1335ba746a46SJeremy L Thompson                                       `eval_modes_in[0]` holds an array of eval modes for the first active basis.
1336c5d0f995SJed Brown   @param[out] eval_modes_in         Pointer to hold arrays of input CeedEvalModes, or NULL.
1337ba746a46SJeremy L Thompson   @param[out] eval_mode_offsets_in  Pointer to hold arrays of input offsets at each quadrature point.
1338c5d0f995SJed Brown   @param[out] num_eval_modes_out    Pointer to hold array of numbers of output CeedEvalModes, or NULL
1339c5d0f995SJed Brown   @param[out] eval_modes_out        Pointer to hold arrays of output CeedEvalModes, or NULL.
1340437c7c90SJeremy L Thompson   @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point
1341ba746a46SJeremy L Thompson   @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point,
1342ba746a46SJeremy L Thompson                                       including contributions of all active bases
1343ed9e99e6SJeremy L Thompson 
1344ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1345ed9e99e6SJeremy L Thompson 
1346c5d0f995SJed Brown 
1347ed9e99e6SJeremy L Thompson   @ref Backend
1348ed9e99e6SJeremy L Thompson **/
1349437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in,
1350437c7c90SJeremy L Thompson                                          const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out,
1351437c7c90SJeremy L Thompson                                          const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) {
1352437c7c90SJeremy L Thompson   if (num_active_bases) *num_active_bases = data->num_active_bases;
1353437c7c90SJeremy L Thompson   if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in;
1354437c7c90SJeremy L Thompson   if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in;
1355437c7c90SJeremy L Thompson   if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in;
1356437c7c90SJeremy L Thompson   if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out;
1357437c7c90SJeremy L Thompson   if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out;
1358437c7c90SJeremy L Thompson   if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out;
1359437c7c90SJeremy L Thompson   if (num_output_components) *num_output_components = data->num_output_components;
1360ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1361ed9e99e6SJeremy L Thompson }
1362ed9e99e6SJeremy L Thompson 
1363ed9e99e6SJeremy L Thompson /**
1364ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1365ba746a46SJeremy L Thompson 
1366ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1367ed9e99e6SJeremy L Thompson 
1368ed9e99e6SJeremy L Thompson   @param[in]  data                CeedOperatorAssemblyData
1369437c7c90SJeremy L Thompson   @param[out] num_active_bases    Number of active bases, or NULL
1370437c7c90SJeremy L Thompson   @param[out] active_bases        Pointer to hold active CeedBasis, or NULL
1371437c7c90SJeremy L Thompson   @param[out] assembled_bases_in  Pointer to hold assembled active input B, or NULL
1372437c7c90SJeremy L Thompson   @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL
1373ed9e99e6SJeremy L Thompson 
1374ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1375ed9e99e6SJeremy L Thompson 
1376ed9e99e6SJeremy L Thompson   @ref Backend
1377ed9e99e6SJeremy L Thompson **/
1378437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases,
1379437c7c90SJeremy L Thompson                                      const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) {
1380ed9e99e6SJeremy L Thompson   // Assemble B_in, B_out if needed
1381437c7c90SJeremy L Thompson   if (assembled_bases_in && !data->assembled_bases_in[0]) {
1382437c7c90SJeremy L Thompson     CeedInt num_qpts;
1383437c7c90SJeremy L Thompson 
1384437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts));
1385437c7c90SJeremy L Thompson     for (CeedInt b = 0; b < data->num_active_bases; b++) {
13861c66c397SJeremy L Thompson       bool        has_eval_none = false;
1387352a5e7cSSebastian Grimberg       CeedInt     num_nodes;
1388437c7c90SJeremy L Thompson       CeedScalar *B_in = NULL, *identity = NULL;
1389ed9e99e6SJeremy L Thompson 
1390352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes));
1391352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in));
1392ed9e99e6SJeremy L Thompson 
1393437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) {
1394437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE);
1395ed9e99e6SJeremy L Thompson       }
1396ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1397352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1398352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1399352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1400ed9e99e6SJeremy L Thompson         }
1401ed9e99e6SJeremy L Thompson       }
1402ed9e99e6SJeremy L Thompson 
1403ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1404352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1405352a5e7cSSebastian Grimberg           CeedInt      d_in              = 0, q_comp_in;
1406352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE;
14071c66c397SJeremy L Thompson 
1408437c7c90SJeremy L Thompson           for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) {
1409437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_in[b] * q;
1410437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
14111c66c397SJeremy L Thompson 
1412352a5e7cSSebastian Grimberg             CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B);
1413352a5e7cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in));
1414352a5e7cSSebastian Grimberg             if (q_comp_in > 1) {
1415352a5e7cSSebastian Grimberg               if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
1416352a5e7cSSebastian Grimberg               else B = &B[(++d_in) * num_qpts * num_nodes];
1417352a5e7cSSebastian Grimberg             }
1418352a5e7cSSebastian Grimberg             eval_mode_in_prev                 = data->eval_modes_in[b][e_in];
1419352a5e7cSSebastian Grimberg             B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n];
1420ed9e99e6SJeremy L Thompson           }
1421ed9e99e6SJeremy L Thompson         }
1422ed9e99e6SJeremy L Thompson       }
14237c1dbaffSSebastian Grimberg       if (identity) CeedCall(CeedFree(&identity));
1424437c7c90SJeremy L Thompson       data->assembled_bases_in[b] = B_in;
1425437c7c90SJeremy L Thompson     }
1426ed9e99e6SJeremy L Thompson   }
1427ed9e99e6SJeremy L Thompson 
1428437c7c90SJeremy L Thompson   if (assembled_bases_out && !data->assembled_bases_out[0]) {
1429437c7c90SJeremy L Thompson     CeedInt num_qpts;
1430437c7c90SJeremy L Thompson 
1431437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts));
1432437c7c90SJeremy L Thompson     for (CeedInt b = 0; b < data->num_active_bases; b++) {
1433ed9e99e6SJeremy L Thompson       bool        has_eval_none = false;
14341c66c397SJeremy L Thompson       CeedInt     num_nodes;
1435437c7c90SJeremy L Thompson       CeedScalar *B_out = NULL, *identity = NULL;
1436ed9e99e6SJeremy L Thompson 
1437352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes));
1438352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out));
1439ed9e99e6SJeremy L Thompson 
1440437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) {
1441437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE);
1442ed9e99e6SJeremy L Thompson       }
1443ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1444352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1445352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1446352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1447ed9e99e6SJeremy L Thompson         }
1448ed9e99e6SJeremy L Thompson       }
1449ed9e99e6SJeremy L Thompson 
1450ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1451352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1452352a5e7cSSebastian Grimberg           CeedInt      d_out              = 0, q_comp_out;
1453352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
14541c66c397SJeremy L Thompson 
1455437c7c90SJeremy L Thompson           for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) {
1456437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_out[b] * q;
1457437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
14581c66c397SJeremy L Thompson 
1459352a5e7cSSebastian Grimberg             CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B);
1460352a5e7cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out));
1461352a5e7cSSebastian Grimberg             if (q_comp_out > 1) {
1462352a5e7cSSebastian Grimberg               if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
1463352a5e7cSSebastian Grimberg               else B = &B[(++d_out) * num_qpts * num_nodes];
1464352a5e7cSSebastian Grimberg             }
1465352a5e7cSSebastian Grimberg             eval_mode_out_prev                  = data->eval_modes_out[b][e_out];
1466352a5e7cSSebastian Grimberg             B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n];
1467ed9e99e6SJeremy L Thompson           }
1468ed9e99e6SJeremy L Thompson         }
1469ed9e99e6SJeremy L Thompson       }
14707c1dbaffSSebastian Grimberg       if (identity) CeedCall(CeedFree(&identity));
1471437c7c90SJeremy L Thompson       data->assembled_bases_out[b] = B_out;
1472437c7c90SJeremy L Thompson     }
1473ed9e99e6SJeremy L Thompson   }
1474ed9e99e6SJeremy L Thompson 
1475437c7c90SJeremy L Thompson   // Pass out assembled data
1476437c7c90SJeremy L Thompson   if (active_bases) *active_bases = data->active_bases;
1477437c7c90SJeremy L Thompson   if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in;
1478437c7c90SJeremy L Thompson   if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out;
1479437c7c90SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1480437c7c90SJeremy L Thompson }
1481437c7c90SJeremy L Thompson 
1482437c7c90SJeremy L Thompson /**
1483ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1484ba746a46SJeremy L Thompson 
1485ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1486437c7c90SJeremy L Thompson 
1487437c7c90SJeremy L Thompson   @param[in]  data                  CeedOperatorAssemblyData
1488437c7c90SJeremy L Thompson   @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL
1489437c7c90SJeremy L Thompson   @param[out] active_elem_rstrs     Pointer to hold active CeedElemRestrictions, or NULL
1490437c7c90SJeremy L Thompson 
1491437c7c90SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1492437c7c90SJeremy L Thompson 
1493437c7c90SJeremy L Thompson   @ref Backend
1494437c7c90SJeremy L Thompson **/
1495437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs,
1496437c7c90SJeremy L Thompson                                                 CeedElemRestriction **active_elem_rstrs) {
1497437c7c90SJeremy L Thompson   if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases;
1498437c7c90SJeremy L Thompson   if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs;
1499ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1500ed9e99e6SJeremy L Thompson }
1501ed9e99e6SJeremy L Thompson 
1502ed9e99e6SJeremy L Thompson /**
1503ed9e99e6SJeremy L Thompson   @brief Destroy CeedOperatorAssemblyData
1504ed9e99e6SJeremy L Thompson 
1505ea61e9acSJeremy L Thompson   @param[in,out] data CeedOperatorAssemblyData to destroy
1506ed9e99e6SJeremy L Thompson 
1507ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1508ed9e99e6SJeremy L Thompson 
1509ed9e99e6SJeremy L Thompson   @ref Backend
1510ed9e99e6SJeremy L Thompson **/
1511ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) {
1512ad6481ceSJeremy L Thompson   if (!*data) {
1513ad6481ceSJeremy L Thompson     *data = NULL;
1514ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1515ad6481ceSJeremy L Thompson   }
15162b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
1517437c7c90SJeremy L Thompson   for (CeedInt b = 0; b < (*data)->num_active_bases; b++) {
1518437c7c90SJeremy L Thompson     CeedCall(CeedBasisDestroy(&(*data)->active_bases[b]));
1519437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b]));
1520437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_modes_in[b]));
1521437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_modes_out[b]));
1522437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b]));
1523437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b]));
1524437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_in[b]));
1525437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_out[b]));
1526437c7c90SJeremy L Thompson   }
1527437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->active_bases));
1528437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->active_elem_rstrs));
1529437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_in));
1530437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_out));
1531437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_in));
1532437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_out));
1533437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_in));
1534437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_out));
1535437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_in));
1536437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_out));
1537ed9e99e6SJeremy L Thompson 
15382b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1539ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1540ed9e99e6SJeremy L Thompson }
1541ed9e99e6SJeremy L Thompson 
1542480fae85SJeremy L Thompson /// @}
1543480fae85SJeremy L Thompson 
1544480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1545eaf62fffSJeremy L Thompson /// CeedOperator Public API
1546eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1547eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser
1548eaf62fffSJeremy L Thompson /// @{
1549eaf62fffSJeremy L Thompson 
1550eaf62fffSJeremy L Thompson /**
1551eaf62fffSJeremy L Thompson   @brief Assemble a linear CeedQFunction associated with a CeedOperator
1552eaf62fffSJeremy L Thompson 
1553ea61e9acSJeremy L Thompson   This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator.
1554859c15bbSJames Wright   The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices
1555859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element.
1556859c15bbSJames Wright 
15579fd66db6SSebastian Grimberg   Inputs and outputs are in the order provided by the user when adding CeedOperator fields.
15589fd66db6SSebastian Grimberg   For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction
15599fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v].
1560eaf62fffSJeremy L Thompson 
1561ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1562f04ea552SJeremy L Thompson 
1563ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1564ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1565ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
1566ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1567eaf62fffSJeremy L Thompson 
1568eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1569eaf62fffSJeremy L Thompson 
1570eaf62fffSJeremy L Thompson   @ref User
1571eaf62fffSJeremy L Thompson **/
15722b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
15732b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1574eaf62fffSJeremy L Thompson 
1575eaf62fffSJeremy L Thompson   if (op->LinearAssembleQFunction) {
1576d04bbc78SJeremy L Thompson     // Backend version
15772b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request));
1578eaf62fffSJeremy L Thompson   } else {
1579d04bbc78SJeremy L Thompson     // Operator fallback
1580d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1581d04bbc78SJeremy L Thompson 
15822b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
15836574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request));
15846574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction");
158570a7ffb3SJeremy L Thompson   }
1586eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1587eaf62fffSJeremy L Thompson }
158870a7ffb3SJeremy L Thompson 
158970a7ffb3SJeremy L Thompson /**
1590ea61e9acSJeremy L Thompson   @brief Assemble CeedQFunction and store result internally.
15914385fb7fSSebastian Grimberg 
1592ea61e9acSJeremy L Thompson   Return copied references of stored data to the caller.
1593ea61e9acSJeremy L Thompson   Caller is responsible for ownership and destruction of the copied references.
1594ea61e9acSJeremy L Thompson   See also @ref CeedOperatorLinearAssembleQFunction
159570a7ffb3SJeremy L Thompson 
1596c5f45aeaSJeremy L Thompson   Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers.
1597c5f45aeaSJeremy L Thompson         These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object.
1598c5f45aeaSJeremy L Thompson 
1599ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1600ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1601ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembledCeedQFunction
1602ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
160370a7ffb3SJeremy L Thompson 
160470a7ffb3SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
160570a7ffb3SJeremy L Thompson 
160670a7ffb3SJeremy L Thompson   @ref User
160770a7ffb3SJeremy L Thompson **/
16082b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
1609b05f7e9fSJeremy L Thompson   int (*LinearAssembleQFunctionUpdate)(CeedOperator, CeedVector, CeedElemRestriction, CeedRequest *) = NULL;
1610b05f7e9fSJeremy L Thompson   CeedOperator op_assemble                                                                           = NULL;
1611bb229da9SJeremy L Thompson   CeedOperator op_fallback_parent                                                                    = NULL;
1612b05f7e9fSJeremy L Thompson 
16132b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
161470a7ffb3SJeremy L Thompson 
1615b05f7e9fSJeremy L Thompson   // Determine if fallback parent or operator has implementation
1616bb229da9SJeremy L Thompson   CeedCall(CeedOperatorGetFallbackParent(op, &op_fallback_parent));
1617bb229da9SJeremy L Thompson   if (op_fallback_parent && op_fallback_parent->LinearAssembleQFunctionUpdate) {
1618b05f7e9fSJeremy L Thompson     // -- Backend version for op fallback parent is faster, if it exists
1619bb229da9SJeremy L Thompson     LinearAssembleQFunctionUpdate = op_fallback_parent->LinearAssembleQFunctionUpdate;
1620bb229da9SJeremy L Thompson     op_assemble                   = op_fallback_parent;
1621b05f7e9fSJeremy L Thompson   } else if (op->LinearAssembleQFunctionUpdate) {
1622b05f7e9fSJeremy L Thompson     // -- Backend version for op
1623b05f7e9fSJeremy L Thompson     LinearAssembleQFunctionUpdate = op->LinearAssembleQFunctionUpdate;
1624b05f7e9fSJeremy L Thompson     op_assemble                   = op;
1625b05f7e9fSJeremy L Thompson   }
1626b05f7e9fSJeremy L Thompson 
1627b05f7e9fSJeremy L Thompson   // Assemble QFunction
1628b05f7e9fSJeremy L Thompson   if (LinearAssembleQFunctionUpdate) {
1629b05f7e9fSJeremy L Thompson     // Backend or fallback parent version
1630480fae85SJeremy L Thompson     bool                qf_assembled_is_setup;
16312efa2d85SJeremy L Thompson     CeedVector          assembled_vec  = NULL;
16322efa2d85SJeremy L Thompson     CeedElemRestriction assembled_rstr = NULL;
1633480fae85SJeremy L Thompson 
16342b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup));
1635480fae85SJeremy L Thompson     if (qf_assembled_is_setup) {
1636d04bbc78SJeremy L Thompson       bool update_needed;
1637d04bbc78SJeremy L Thompson 
16382b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr));
16392b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed));
1640b05f7e9fSJeremy L Thompson       if (update_needed) CeedCall(LinearAssembleQFunctionUpdate(op_assemble, assembled_vec, assembled_rstr, request));
164170a7ffb3SJeremy L Thompson     } else {
1642b05f7e9fSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunction(op_assemble, &assembled_vec, &assembled_rstr, request));
16432b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr));
164470a7ffb3SJeremy L Thompson     }
16452b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false));
16462efa2d85SJeremy L Thompson 
1647d04bbc78SJeremy L Thompson     // Copy reference from internally held copy
16482b730f8bSJeremy L Thompson     CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled));
16492b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr));
1650c5f45aeaSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled_vec));
16512b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&assembled_rstr));
165270a7ffb3SJeremy L Thompson   } else {
1653d04bbc78SJeremy L Thompson     // Operator fallback
1654d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1655d04bbc78SJeremy L Thompson 
16562b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
16576574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request));
16586574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate");
165970a7ffb3SJeremy L Thompson   }
166070a7ffb3SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1661eaf62fffSJeremy L Thompson }
1662eaf62fffSJeremy L Thompson 
1663eaf62fffSJeremy L Thompson /**
1664eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1665eaf62fffSJeremy L Thompson 
1666eaf62fffSJeremy L Thompson   This overwrites a CeedVector with the diagonal of a linear CeedOperator.
1667eaf62fffSJeremy L Thompson 
1668ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1669eaf62fffSJeremy L Thompson 
1670ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1671f04ea552SJeremy L Thompson 
1672ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1673eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1674ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1675eaf62fffSJeremy L Thompson 
1676eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1677eaf62fffSJeremy L Thompson 
1678eaf62fffSJeremy L Thompson   @ref User
1679eaf62fffSJeremy L Thompson **/
16802b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1681f3d47e36SJeremy L Thompson   bool     is_composite;
16821c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16831c66c397SJeremy L Thompson 
16842b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1685f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1686eaf62fffSJeremy L Thompson 
16872b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16886574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1689c9366a6bSJeremy L Thompson 
1690f3d47e36SJeremy L Thompson   // Early exit for empty operator
1691f3d47e36SJeremy L Thompson   if (!is_composite) {
1692f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1693f3d47e36SJeremy L Thompson 
1694f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1695f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1696f3d47e36SJeremy L Thompson   }
1697f3d47e36SJeremy L Thompson 
1698eaf62fffSJeremy L Thompson   if (op->LinearAssembleDiagonal) {
1699d04bbc78SJeremy L Thompson     // Backend version
17002b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleDiagonal(op, assembled, request));
1701eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1702eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddDiagonal) {
1703d04bbc78SJeremy L Thompson     // Backend version with zeroing first
17042b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
17052b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1706eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1707eaf62fffSJeremy L Thompson   } else {
1708d04bbc78SJeremy L Thompson     // Operator fallback
1709d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1710d04bbc78SJeremy L Thompson 
17112b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1712d04bbc78SJeremy L Thompson     if (op_fallback) {
17132b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request));
1714eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1715eaf62fffSJeremy L Thompson     }
1716eaf62fffSJeremy L Thompson   }
1717eaf62fffSJeremy L Thompson   // Default interface implementation
17182b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
17192b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request));
1720eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1721eaf62fffSJeremy L Thompson }
1722eaf62fffSJeremy L Thompson 
1723eaf62fffSJeremy L Thompson /**
1724eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1725eaf62fffSJeremy L Thompson 
1726eaf62fffSJeremy L Thompson   This sums into a CeedVector the diagonal of a linear CeedOperator.
1727eaf62fffSJeremy L Thompson 
1728ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1729eaf62fffSJeremy L Thompson 
1730ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1731f04ea552SJeremy L Thompson 
1732ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1733eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1734ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1735eaf62fffSJeremy L Thompson 
1736eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1737eaf62fffSJeremy L Thompson 
1738eaf62fffSJeremy L Thompson   @ref User
1739eaf62fffSJeremy L Thompson **/
17402b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1741f3d47e36SJeremy L Thompson   bool     is_composite;
17421c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
17431c66c397SJeremy L Thompson 
17442b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1745f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1746eaf62fffSJeremy L Thompson 
17472b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
17486574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1749c9366a6bSJeremy L Thompson 
1750f3d47e36SJeremy L Thompson   // Early exit for empty operator
1751f3d47e36SJeremy L Thompson   if (!is_composite) {
1752f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1753f3d47e36SJeremy L Thompson 
1754f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1755f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1756f3d47e36SJeremy L Thompson   }
1757f3d47e36SJeremy L Thompson 
1758eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddDiagonal) {
1759d04bbc78SJeremy L Thompson     // Backend version
17602b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1761eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1762eaf62fffSJeremy L Thompson   } else {
1763d04bbc78SJeremy L Thompson     // Operator fallback
1764d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1765d04bbc78SJeremy L Thompson 
17662b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1767d04bbc78SJeremy L Thompson     if (op_fallback) {
17682b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request));
1769eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1770eaf62fffSJeremy L Thompson     }
1771eaf62fffSJeremy L Thompson   }
1772eaf62fffSJeremy L Thompson   // Default interface implementation
1773eaf62fffSJeremy L Thompson   if (is_composite) {
17742b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled));
1775eaf62fffSJeremy L Thompson   } else {
17762b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled));
1777eaf62fffSJeremy L Thompson   }
1778d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1779eaf62fffSJeremy L Thompson }
1780eaf62fffSJeremy L Thompson 
1781eaf62fffSJeremy L Thompson /**
1782eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1783eaf62fffSJeremy L Thompson 
1784ea61e9acSJeremy L Thompson   This overwrites a CeedVector with the point block diagonal of a linear CeedOperator.
1785eaf62fffSJeremy L Thompson 
1786ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1787eaf62fffSJeremy L Thompson 
1788ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1789f04ea552SJeremy L Thompson 
1790ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1791ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1792ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1793ea61e9acSJeremy L Thompson component in].
1794ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1795eaf62fffSJeremy L Thompson 
1796eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1797eaf62fffSJeremy L Thompson 
1798eaf62fffSJeremy L Thompson   @ref User
1799eaf62fffSJeremy L Thompson **/
18002b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1801f3d47e36SJeremy L Thompson   bool     is_composite;
18021c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
18031c66c397SJeremy L Thompson 
18042b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1805f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1806eaf62fffSJeremy L Thompson 
18072b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
18086574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1809c9366a6bSJeremy L Thompson 
1810f3d47e36SJeremy L Thompson   // Early exit for empty operator
1811f3d47e36SJeremy L Thompson   if (!is_composite) {
1812f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1813f3d47e36SJeremy L Thompson 
1814f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1815f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1816f3d47e36SJeremy L Thompson   }
1817f3d47e36SJeremy L Thompson 
1818eaf62fffSJeremy L Thompson   if (op->LinearAssemblePointBlockDiagonal) {
1819d04bbc78SJeremy L Thompson     // Backend version
18202b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request));
1821eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1822eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddPointBlockDiagonal) {
1823d04bbc78SJeremy L Thompson     // Backend version with zeroing first
18242b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
18252b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1826eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1827eaf62fffSJeremy L Thompson   } else {
1828d04bbc78SJeremy L Thompson     // Operator fallback
1829d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1830d04bbc78SJeremy L Thompson 
18312b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1832d04bbc78SJeremy L Thompson     if (op_fallback) {
18332b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request));
1834eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1835eaf62fffSJeremy L Thompson     }
1836eaf62fffSJeremy L Thompson   }
1837eaf62fffSJeremy L Thompson   // Default interface implementation
18382b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
18392b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1840eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1841eaf62fffSJeremy L Thompson }
1842eaf62fffSJeremy L Thompson 
1843eaf62fffSJeremy L Thompson /**
1844eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1845eaf62fffSJeremy L Thompson 
1846ea61e9acSJeremy L Thompson   This sums into a CeedVector with the point block diagonal of a linear CeedOperator.
1847eaf62fffSJeremy L Thompson 
1848ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1849eaf62fffSJeremy L Thompson 
1850ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1851f04ea552SJeremy L Thompson 
1852ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1853ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1854ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1855ea61e9acSJeremy L Thompson component in].
1856ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1857eaf62fffSJeremy L Thompson 
1858eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1859eaf62fffSJeremy L Thompson 
1860eaf62fffSJeremy L Thompson   @ref User
1861eaf62fffSJeremy L Thompson **/
18622b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1863f3d47e36SJeremy L Thompson   bool     is_composite;
18641c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
18651c66c397SJeremy L Thompson 
18662b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1867f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1868eaf62fffSJeremy L Thompson 
18692b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
18706574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1871c9366a6bSJeremy L Thompson 
1872f3d47e36SJeremy L Thompson   // Early exit for empty operator
1873f3d47e36SJeremy L Thompson   if (!is_composite) {
1874f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1875f3d47e36SJeremy L Thompson 
1876f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1877f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1878f3d47e36SJeremy L Thompson   }
1879f3d47e36SJeremy L Thompson 
1880eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddPointBlockDiagonal) {
1881d04bbc78SJeremy L Thompson     // Backend version
18822b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request));
1883eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1884eaf62fffSJeremy L Thompson   } else {
1885d04bbc78SJeremy L Thompson     // Operator fallback
1886d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1887d04bbc78SJeremy L Thompson 
18882b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1889d04bbc78SJeremy L Thompson     if (op_fallback) {
18902b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request));
1891eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1892eaf62fffSJeremy L Thompson     }
1893eaf62fffSJeremy L Thompson   }
1894ea61e9acSJeremy L Thompson   // Default interface implementation
1895eaf62fffSJeremy L Thompson   if (is_composite) {
18962b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled));
1897eaf62fffSJeremy L Thompson   } else {
18982b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled));
1899eaf62fffSJeremy L Thompson   }
1900d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1901eaf62fffSJeremy L Thompson }
1902eaf62fffSJeremy L Thompson 
1903eaf62fffSJeremy L Thompson /**
1904eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero pattern of a linear operator.
1905eaf62fffSJeremy L Thompson 
1906ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssemble().
1907eaf62fffSJeremy L Thompson 
1908ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
19099fd66db6SSebastian Grimberg matrix in entry (i, j).
19109fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
19119fd66db6SSebastian Grimberg   This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering.
1912eaf62fffSJeremy L Thompson 
1913eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1914eaf62fffSJeremy L Thompson 
1915ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1916f04ea552SJeremy L Thompson 
1917eaf62fffSJeremy L Thompson    @param[in]  op          CeedOperator to assemble
1918eaf62fffSJeremy L Thompson    @param[out] num_entries Number of entries in coordinate nonzero pattern
1919eaf62fffSJeremy L Thompson    @param[out] rows        Row number for each entry
1920eaf62fffSJeremy L Thompson    @param[out] cols        Column number for each entry
1921eaf62fffSJeremy L Thompson 
1922eaf62fffSJeremy L Thompson    @ref User
1923eaf62fffSJeremy L Thompson **/
19242b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
19251c66c397SJeremy L Thompson   bool          is_composite;
19261c66c397SJeremy L Thompson   CeedInt       num_suboperators, offset = 0;
1927b94338b9SJed Brown   CeedSize      single_entries;
1928eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
19291c66c397SJeremy L Thompson 
19302b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1931f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1932eaf62fffSJeremy L Thompson 
1933eaf62fffSJeremy L Thompson   if (op->LinearAssembleSymbolic) {
1934d04bbc78SJeremy L Thompson     // Backend version
19352b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols));
1936eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1937eaf62fffSJeremy L Thompson   } else {
1938d04bbc78SJeremy L Thompson     // Operator fallback
1939d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1940d04bbc78SJeremy L Thompson 
19412b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1942d04bbc78SJeremy L Thompson     if (op_fallback) {
19432b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols));
1944eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1945eaf62fffSJeremy L Thompson     }
1946eaf62fffSJeremy L Thompson   }
1947eaf62fffSJeremy L Thompson 
1948eaf62fffSJeremy L Thompson   // Default interface implementation
1949eaf62fffSJeremy L Thompson 
1950eaf62fffSJeremy L Thompson   // count entries and allocate rows, cols arrays
1951eaf62fffSJeremy L Thompson   *num_entries = 0;
1952eaf62fffSJeremy L Thompson   if (is_composite) {
1953c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1954c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
195592ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
19562b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1957eaf62fffSJeremy L Thompson       *num_entries += single_entries;
1958eaf62fffSJeremy L Thompson     }
1959eaf62fffSJeremy L Thompson   } else {
19602b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries));
1961eaf62fffSJeremy L Thompson     *num_entries += single_entries;
1962eaf62fffSJeremy L Thompson   }
19632b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, rows));
19642b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, cols));
1965eaf62fffSJeremy L Thompson 
1966eaf62fffSJeremy L Thompson   // assemble nonzero locations
1967eaf62fffSJeremy L Thompson   if (is_composite) {
1968c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1969c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
197092ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
19712b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols));
19722b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1973eaf62fffSJeremy L Thompson       offset += single_entries;
1974eaf62fffSJeremy L Thompson     }
1975eaf62fffSJeremy L Thompson   } else {
19762b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols));
1977eaf62fffSJeremy L Thompson   }
1978eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1979eaf62fffSJeremy L Thompson }
1980eaf62fffSJeremy L Thompson 
1981eaf62fffSJeremy L Thompson /**
1982eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero entries of a linear operator.
1983eaf62fffSJeremy L Thompson 
1984ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic().
1985eaf62fffSJeremy L Thompson 
1986ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
19879fd66db6SSebastian Grimberg matrix in entry (i, j).
19889fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
19899fd66db6SSebastian Grimberg   This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic()
1990eaf62fffSJeremy L Thompson 
1991eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1992eaf62fffSJeremy L Thompson 
1993ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1994f04ea552SJeremy L Thompson 
1995eaf62fffSJeremy L Thompson    @param[in]  op     CeedOperator to assemble
1996eaf62fffSJeremy L Thompson    @param[out] values Values to assemble into matrix
1997eaf62fffSJeremy L Thompson 
1998eaf62fffSJeremy L Thompson    @ref User
1999eaf62fffSJeremy L Thompson **/
2000eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) {
20011c66c397SJeremy L Thompson   bool          is_composite;
20021c66c397SJeremy L Thompson   CeedInt       num_suboperators, offset = 0;
2003b94338b9SJed Brown   CeedSize      single_entries = 0;
2004eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
20051c66c397SJeremy L Thompson 
20062b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2007f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
2008f3d47e36SJeremy L Thompson 
2009f3d47e36SJeremy L Thompson   // Early exit for empty operator
2010f3d47e36SJeremy L Thompson   if (!is_composite) {
2011f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
2012f3d47e36SJeremy L Thompson 
2013f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
2014f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
2015f3d47e36SJeremy L Thompson   }
2016eaf62fffSJeremy L Thompson 
2017eaf62fffSJeremy L Thompson   if (op->LinearAssemble) {
2018d04bbc78SJeremy L Thompson     // Backend version
20192b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemble(op, values));
2020eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2021eaf62fffSJeremy L Thompson   } else {
2022d04bbc78SJeremy L Thompson     // Operator fallback
2023d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2024d04bbc78SJeremy L Thompson 
20252b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2026d04bbc78SJeremy L Thompson     if (op_fallback) {
20272b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemble(op_fallback, values));
2028eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2029eaf62fffSJeremy L Thompson     }
2030eaf62fffSJeremy L Thompson   }
2031eaf62fffSJeremy L Thompson 
2032eaf62fffSJeremy L Thompson   // Default interface implementation
203328ec399dSJeremy L Thompson   CeedCall(CeedVectorSetValue(values, 0.0));
2034eaf62fffSJeremy L Thompson   if (is_composite) {
2035c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2036c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
2037cefa2673SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; k++) {
20382b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values));
20392b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
2040eaf62fffSJeremy L Thompson       offset += single_entries;
2041eaf62fffSJeremy L Thompson     }
2042eaf62fffSJeremy L Thompson   } else {
20432b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemble(op, offset, values));
2044eaf62fffSJeremy L Thompson   }
2045eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2046eaf62fffSJeremy L Thompson }
2047eaf62fffSJeremy L Thompson 
2048eaf62fffSJeremy L Thompson /**
204975f0d5a4SJeremy L Thompson   @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator
205075f0d5a4SJeremy L Thompson 
205175f0d5a4SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
205275f0d5a4SJeremy L Thompson 
205375f0d5a4SJeremy L Thompson   @param[in]  op               Composite CeedOperator
205475f0d5a4SJeremy L Thompson   @param[in]  num_skip_indices Number of suboperators to skip
205575f0d5a4SJeremy L Thompson   @param[in]  skip_indices     Array of indices of suboperators to skip
205675f0d5a4SJeremy L Thompson   @param[out] mult             Vector to store multiplicity (of size l_size)
205775f0d5a4SJeremy L Thompson 
205875f0d5a4SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
205975f0d5a4SJeremy L Thompson 
206075f0d5a4SJeremy L Thompson   @ref User
206175f0d5a4SJeremy L Thompson **/
206275f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) {
206375f0d5a4SJeremy L Thompson   Ceed                ceed;
2064b275c451SJeremy L Thompson   CeedInt             num_suboperators;
206575f0d5a4SJeremy L Thompson   CeedSize            l_vec_len;
206675f0d5a4SJeremy L Thompson   CeedScalar         *mult_array;
206775f0d5a4SJeremy L Thompson   CeedVector          ones_l_vec;
20687c1dbaffSSebastian Grimberg   CeedElemRestriction elem_rstr, mult_elem_rstr;
2069b275c451SJeremy L Thompson   CeedOperator       *sub_operators;
207075f0d5a4SJeremy L Thompson 
20711c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
20721c66c397SJeremy L Thompson 
207375f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
207475f0d5a4SJeremy L Thompson 
207575f0d5a4SJeremy L Thompson   // Zero mult vector
207675f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(mult, 0.0));
207775f0d5a4SJeremy L Thompson 
207875f0d5a4SJeremy L Thompson   // Get suboperators
2079b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2080b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
2081b275c451SJeremy L Thompson   if (num_suboperators == 0) return CEED_ERROR_SUCCESS;
208275f0d5a4SJeremy L Thompson 
208375f0d5a4SJeremy L Thompson   // Work vector
208475f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetLength(mult, &l_vec_len));
208575f0d5a4SJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec));
208675f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(ones_l_vec, 1.0));
208775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array));
208875f0d5a4SJeremy L Thompson 
208975f0d5a4SJeremy L Thompson   // Compute multiplicity across suboperators
2090b275c451SJeremy L Thompson   for (CeedInt i = 0; i < num_suboperators; i++) {
209175f0d5a4SJeremy L Thompson     const CeedScalar *sub_mult_array;
209275f0d5a4SJeremy L Thompson     CeedVector        sub_mult_l_vec, ones_e_vec;
209375f0d5a4SJeremy L Thompson 
209475f0d5a4SJeremy L Thompson     // -- Check for suboperator to skip
209575f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < num_skip_indices; j++) {
209675f0d5a4SJeremy L Thompson       if (skip_indices[j] == i) continue;
209775f0d5a4SJeremy L Thompson     }
209875f0d5a4SJeremy L Thompson 
209975f0d5a4SJeremy L Thompson     // -- Sub operator multiplicity
2100437c7c90SJeremy L Thompson     CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr));
21017c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr, &mult_elem_rstr));
21027c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateVector(mult_elem_rstr, &sub_mult_l_vec, &ones_e_vec));
210375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0));
21047c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE));
21057c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE));
210675f0d5a4SJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array));
210775f0d5a4SJeremy L Thompson     // ---- Flag every node present in the current suboperator
210875f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < l_vec_len; j++) {
210975f0d5a4SJeremy L Thompson       if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0;
211075f0d5a4SJeremy L Thompson     }
211175f0d5a4SJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array));
211275f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&sub_mult_l_vec));
211375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&ones_e_vec));
21147c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&mult_elem_rstr));
211575f0d5a4SJeremy L Thompson   }
211675f0d5a4SJeremy L Thompson   CeedCall(CeedVectorRestoreArray(mult, &mult_array));
2117811d0ccfSJeremy L Thompson   CeedCall(CeedVectorDestroy(&ones_l_vec));
211875f0d5a4SJeremy L Thompson   return CEED_ERROR_SUCCESS;
211975f0d5a4SJeremy L Thompson }
212075f0d5a4SJeremy L Thompson 
212175f0d5a4SJeremy L Thompson /**
2122ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse
2123ea61e9acSJeremy L Thompson grid interpolation
2124eaf62fffSJeremy L Thompson 
212558e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2126f04ea552SJeremy L Thompson 
2127eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
212885bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2129eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
2130eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
2131eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
213285bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
213385bb9dcfSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator, or NULL
2134eaf62fffSJeremy L Thompson 
2135eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2136eaf62fffSJeremy L Thompson 
2137eaf62fffSJeremy L Thompson   @ref User
2138eaf62fffSJeremy L Thompson **/
21392b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
21402b730f8bSJeremy L Thompson                                      CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
21411c66c397SJeremy L Thompson   CeedBasis basis_c_to_f = NULL;
21421c66c397SJeremy L Thompson 
21432b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2144eaf62fffSJeremy L Thompson 
214583d6adf3SZach Atkins   // Build prolongation matrix, if required
214683d6adf3SZach Atkins   if (op_prolong || op_restrict) {
214783d6adf3SZach Atkins     CeedBasis basis_fine;
21481c66c397SJeremy L Thompson 
21492b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
21502b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f));
215183d6adf3SZach Atkins   }
2152eaf62fffSJeremy L Thompson 
2153f113e5dcSJeremy L Thompson   // Core code
21542b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2155eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2156eaf62fffSJeremy L Thompson }
2157eaf62fffSJeremy L Thompson 
2158eaf62fffSJeremy L Thompson /**
2159ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis
2160eaf62fffSJeremy L Thompson 
216158e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2162f04ea552SJeremy L Thompson 
2163eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
216485bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2165eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2166eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
216785bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2168eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
216985bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
217085bb9dcfSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator, or NULL
2171eaf62fffSJeremy L Thompson 
2172eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2173eaf62fffSJeremy L Thompson 
2174eaf62fffSJeremy L Thompson   @ref User
2175eaf62fffSJeremy L Thompson **/
21762b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
21772b730f8bSJeremy L Thompson                                              const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
21782b730f8bSJeremy L Thompson                                              CeedOperator *op_restrict) {
2179eaf62fffSJeremy L Thompson   Ceed      ceed;
21801c66c397SJeremy L Thompson   CeedInt   Q_f, Q_c;
21811c66c397SJeremy L Thompson   CeedBasis basis_fine, basis_c_to_f = NULL;
21821c66c397SJeremy L Thompson 
21831c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
21842b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2185eaf62fffSJeremy L Thompson 
2186eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
21872b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
21882b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
21892b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
21906574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2191eaf62fffSJeremy L Thompson 
219283d6adf3SZach Atkins   // Create coarse to fine basis, if required
219383d6adf3SZach Atkins   if (op_prolong || op_restrict) {
21941c66c397SJeremy L Thompson     CeedInt     dim, num_comp, num_nodes_c, P_1d_f, P_1d_c;
21951c66c397SJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
21961c66c397SJeremy L Thompson 
219783d6adf3SZach Atkins     // Check if interpolation matrix is provided
21986574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
21996574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
22002b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
22012b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
22022b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f));
22032b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
22042b730f8bSJeremy L Thompson     P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c);
22052b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_ref));
22062b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_weight));
22072b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad));
22082b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
22092b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
22102b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
22112b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
221283d6adf3SZach Atkins   }
2213eaf62fffSJeremy L Thompson 
2214eaf62fffSJeremy L Thompson   // Core code
22152b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2216eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2217eaf62fffSJeremy L Thompson }
2218eaf62fffSJeremy L Thompson 
2219eaf62fffSJeremy L Thompson /**
2220ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector
2221eaf62fffSJeremy L Thompson 
222258e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2223f04ea552SJeremy L Thompson 
2224eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
222585bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2226eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2227eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
222885bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2229eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
223085bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
223185bb9dcfSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator, or NULL
2232eaf62fffSJeremy L Thompson 
2233eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2234eaf62fffSJeremy L Thompson 
2235eaf62fffSJeremy L Thompson   @ref User
2236eaf62fffSJeremy L Thompson **/
22372b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
22382b730f8bSJeremy L Thompson                                        const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
2239eaf62fffSJeremy L Thompson                                        CeedOperator *op_restrict) {
2240eaf62fffSJeremy L Thompson   Ceed      ceed;
22411c66c397SJeremy L Thompson   CeedInt   Q_f, Q_c;
22421c66c397SJeremy L Thompson   CeedBasis basis_fine, basis_c_to_f = NULL;
22431c66c397SJeremy L Thompson 
22441c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
22452b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2246eaf62fffSJeremy L Thompson 
2247eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
22482b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
22492b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
22502b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
22516574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2252eaf62fffSJeremy L Thompson 
2253eaf62fffSJeremy L Thompson   // Coarse to fine basis
225483d6adf3SZach Atkins   if (op_prolong || op_restrict) {
22551c66c397SJeremy L Thompson     CeedInt          dim, num_comp, num_nodes_c, num_nodes_f;
22561c66c397SJeremy L Thompson     CeedScalar      *q_ref, *q_weight, *grad;
22571c66c397SJeremy L Thompson     CeedElemTopology topo;
22581c66c397SJeremy L Thompson 
225983d6adf3SZach Atkins     // Check if interpolation matrix is provided
22606574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
22616574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
22622b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetTopology(basis_fine, &topo));
22632b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
22642b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
22652b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f));
22662b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
22672b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref));
22682b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f, &q_weight));
22692b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad));
22702b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
22712b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
22722b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
22732b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
227483d6adf3SZach Atkins   }
2275eaf62fffSJeremy L Thompson 
2276eaf62fffSJeremy L Thompson   // Core code
22772b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2278eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2279eaf62fffSJeremy L Thompson }
2280eaf62fffSJeremy L Thompson 
2281eaf62fffSJeremy L Thompson /**
2282ea61e9acSJeremy L Thompson   @brief Build a FDM based approximate inverse for each element for a CeedOperator
2283eaf62fffSJeremy L Thompson 
2284ea61e9acSJeremy L Thompson   This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse.
2285859c15bbSJames Wright   This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$.
2286859c15bbSJames Wright   The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T
22879fd66db6SSebastian Grimberg \hat S V\f$.
22889fd66db6SSebastian Grimberg   The CeedOperator must be linear and non-composite.
22899fd66db6SSebastian Grimberg   The associated CeedQFunction must therefore also be linear.
2290eaf62fffSJeremy L Thompson 
2291ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2292f04ea552SJeremy L Thompson 
2293ea61e9acSJeremy L Thompson   @param[in]  op      CeedOperator to create element inverses
2294ea61e9acSJeremy L Thompson   @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element
2295ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2296eaf62fffSJeremy L Thompson 
2297eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2298eaf62fffSJeremy L Thompson 
2299480fae85SJeremy L Thompson   @ref User
2300eaf62fffSJeremy L Thompson **/
23012b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) {
23021c66c397SJeremy L Thompson   Ceed                 ceed, ceed_parent;
23031c66c397SJeremy L Thompson   bool                 interp = false, grad = false, is_tensor_basis = true;
23041c66c397SJeremy L Thompson   CeedInt              num_input_fields, P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1;
23051c66c397SJeremy L Thompson   CeedSize             l_size = 1;
23061c66c397SJeremy L Thompson   CeedScalar          *mass, *laplace, *x, *fdm_interp, *lambda, *elem_avg;
23071c66c397SJeremy L Thompson   const CeedScalar    *interp_1d, *grad_1d, *q_weight_1d;
23081c66c397SJeremy L Thompson   CeedVector           q_data;
23091c66c397SJeremy L Thompson   CeedElemRestriction  rstr  = NULL, rstr_qd_i;
23101c66c397SJeremy L Thompson   CeedBasis            basis = NULL, fdm_basis;
23111c66c397SJeremy L Thompson   CeedQFunctionContext ctx_fdm;
23121c66c397SJeremy L Thompson   CeedQFunctionField  *qf_fields;
23131c66c397SJeremy L Thompson   CeedQFunction        qf, qf_fdm;
23141c66c397SJeremy L Thompson   CeedOperatorField   *op_fields;
23151c66c397SJeremy L Thompson 
23162b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2317eaf62fffSJeremy L Thompson 
2318eaf62fffSJeremy L Thompson   if (op->CreateFDMElementInverse) {
2319d04bbc78SJeremy L Thompson     // Backend version
23202b730f8bSJeremy L Thompson     CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request));
2321eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2322eaf62fffSJeremy L Thompson   } else {
2323d04bbc78SJeremy L Thompson     // Operator fallback
2324d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2325d04bbc78SJeremy L Thompson 
23262b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2327d04bbc78SJeremy L Thompson     if (op_fallback) {
23282b730f8bSJeremy L Thompson       CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request));
2329eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2330eaf62fffSJeremy L Thompson     }
2331eaf62fffSJeremy L Thompson   }
2332eaf62fffSJeremy L Thompson 
2333d04bbc78SJeremy L Thompson   // Default interface implementation
23342b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
2335bb229da9SJeremy L Thompson   CeedCall(CeedOperatorGetFallbackParentCeed(op, &ceed_parent));
23362b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
2337eaf62fffSJeremy L Thompson 
2338eaf62fffSJeremy L Thompson   // Determine active input basis
23392b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL));
23402b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL));
2341eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
2342eaf62fffSJeremy L Thompson     CeedVector vec;
23431c66c397SJeremy L Thompson 
23442b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
2345eaf62fffSJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
2346eaf62fffSJeremy L Thompson       CeedEvalMode eval_mode;
23471c66c397SJeremy L Thompson 
23482b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
2349eaf62fffSJeremy L Thompson       interp = interp || eval_mode == CEED_EVAL_INTERP;
2350eaf62fffSJeremy L Thompson       grad   = grad || eval_mode == CEED_EVAL_GRAD;
23512b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis));
23522b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr));
2353eaf62fffSJeremy L Thompson     }
2354eaf62fffSJeremy L Thompson   }
23556574a04fSJeremy L Thompson   CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set");
23562b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d));
2357352a5e7cSSebastian Grimberg   CeedCall(CeedBasisGetNumNodes(basis, &num_nodes));
23582b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d));
23592b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts));
23602b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis, &dim));
23612b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis, &num_comp));
23622b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
23632b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2364eaf62fffSJeremy L Thompson 
2365eaf62fffSJeremy L Thompson   // Build and diagonalize 1D Mass and Laplacian
23666574a04fSJeremy L Thompson   CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis));
23676574a04fSJeremy L Thompson   CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases");
23682b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &mass));
23692b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &laplace));
23702b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &x));
23712b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp));
23722b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &lambda));
2373eaf62fffSJeremy L Thompson   // -- Build matrices
23742b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp1D(basis, &interp_1d));
23752b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad1D(basis, &grad_1d));
23762b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d));
23772b730f8bSJeremy L Thompson   CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace));
2378eaf62fffSJeremy L Thompson 
2379eaf62fffSJeremy L Thompson   // -- Diagonalize
23802b730f8bSJeremy L Thompson   CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d));
23812b730f8bSJeremy L Thompson   CeedCall(CeedFree(&mass));
23822b730f8bSJeremy L Thompson   CeedCall(CeedFree(&laplace));
23832b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
23842b730f8bSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d];
23852b730f8bSJeremy L Thompson   }
23862b730f8bSJeremy L Thompson   CeedCall(CeedFree(&x));
2387eaf62fffSJeremy L Thompson 
23881c66c397SJeremy L Thompson   {
23891c66c397SJeremy L Thompson     CeedInt             layout[3], num_modes = (interp ? 1 : 0) + (grad ? dim : 0);
23901c66c397SJeremy L Thompson     CeedScalar          max_norm = 0;
23911c66c397SJeremy L Thompson     const CeedScalar   *assembled_array, *q_weight_array;
23921c66c397SJeremy L Thompson     CeedVector          assembled = NULL, q_weight;
2393c5f45aeaSJeremy L Thompson     CeedElemRestriction rstr_qf   = NULL;
23941c66c397SJeremy L Thompson 
23951c66c397SJeremy L Thompson     // Assemble QFunction
23962b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request));
23972b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout));
23982b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&rstr_qf));
23992b730f8bSJeremy L Thompson     CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm));
2400eaf62fffSJeremy L Thompson 
2401eaf62fffSJeremy L Thompson     // Calculate element averages
24022b730f8bSJeremy L Thompson     CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight));
24032b730f8bSJeremy L Thompson     CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight));
24042b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array));
24052b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array));
24062b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_elem, &elem_avg));
2407eaf62fffSJeremy L Thompson     const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON;
24081c66c397SJeremy L Thompson 
2409eaf62fffSJeremy L Thompson     for (CeedInt e = 0; e < num_elem; e++) {
2410eaf62fffSJeremy L Thompson       CeedInt count = 0;
24111c66c397SJeremy L Thompson 
24122b730f8bSJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
24132b730f8bSJeremy L Thompson         for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) {
24142b730f8bSJeremy L Thompson           if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) {
24152b730f8bSJeremy L Thompson             elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q];
2416eaf62fffSJeremy L Thompson             count++;
2417eaf62fffSJeremy L Thompson           }
24182b730f8bSJeremy L Thompson         }
24192b730f8bSJeremy L Thompson       }
2420eaf62fffSJeremy L Thompson       if (count) {
2421eaf62fffSJeremy L Thompson         elem_avg[e] /= count;
2422eaf62fffSJeremy L Thompson       } else {
2423eaf62fffSJeremy L Thompson         elem_avg[e] = 1.0;
2424eaf62fffSJeremy L Thompson       }
2425eaf62fffSJeremy L Thompson     }
24262b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array));
24272b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled));
24282b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array));
24292b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&q_weight));
24301c66c397SJeremy L Thompson   }
2431eaf62fffSJeremy L Thompson 
2432eaf62fffSJeremy L Thompson   // Build FDM diagonal
24331c66c397SJeremy L Thompson   {
2434eaf62fffSJeremy L Thompson     CeedScalar *q_data_array, *fdm_diagonal;
24351c66c397SJeremy L Thompson 
2436352a5e7cSSebastian Grimberg     CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal));
2437352a5e7cSSebastian Grimberg     const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON;
24382b730f8bSJeremy L Thompson     for (CeedInt c = 0; c < num_comp; c++) {
2439352a5e7cSSebastian Grimberg       for (CeedInt n = 0; n < num_nodes; n++) {
2440352a5e7cSSebastian Grimberg         if (interp) fdm_diagonal[c * num_nodes + n] = 1.0;
24412b730f8bSJeremy L Thompson         if (grad) {
2442eaf62fffSJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
2443eaf62fffSJeremy L Thompson             CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d;
2444352a5e7cSSebastian Grimberg             fdm_diagonal[c * num_nodes + n] += lambda[i];
2445eaf62fffSJeremy L Thompson           }
2446eaf62fffSJeremy L Thompson         }
2447352a5e7cSSebastian Grimberg         if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound;
24482b730f8bSJeremy L Thompson       }
24492b730f8bSJeremy L Thompson     }
2450352a5e7cSSebastian Grimberg     CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data));
24512b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(q_data, 0.0));
24522b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array));
24532b730f8bSJeremy L Thompson     for (CeedInt e = 0; e < num_elem; e++) {
24542b730f8bSJeremy L Thompson       for (CeedInt c = 0; c < num_comp; c++) {
24551c66c397SJeremy L Thompson         for (CeedInt n = 0; n < num_nodes; n++)
24561c66c397SJeremy L Thompson           q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]);
24572b730f8bSJeremy L Thompson       }
24582b730f8bSJeremy L Thompson     }
24592b730f8bSJeremy L Thompson     CeedCall(CeedFree(&elem_avg));
24602b730f8bSJeremy L Thompson     CeedCall(CeedFree(&fdm_diagonal));
24612b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArray(q_data, &q_data_array));
24621c66c397SJeremy L Thompson   }
2463eaf62fffSJeremy L Thompson 
2464eaf62fffSJeremy L Thompson   // Setup FDM operator
2465eaf62fffSJeremy L Thompson   // -- Basis
24661c66c397SJeremy L Thompson   {
2467eaf62fffSJeremy L Thompson     CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy;
24681c66c397SJeremy L Thompson 
24692b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy));
24702b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d, &q_ref_dummy));
24712b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d, &q_weight_dummy));
24722b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis));
24732b730f8bSJeremy L Thompson     CeedCall(CeedFree(&fdm_interp));
24742b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad_dummy));
24752b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref_dummy));
24762b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight_dummy));
24772b730f8bSJeremy L Thompson     CeedCall(CeedFree(&lambda));
24781c66c397SJeremy L Thompson   }
2479eaf62fffSJeremy L Thompson 
2480eaf62fffSJeremy L Thompson   // -- Restriction
24811c66c397SJeremy L Thompson   {
2482352a5e7cSSebastian Grimberg     CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp};
2483352a5e7cSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i));
24841c66c397SJeremy L Thompson   }
24851c66c397SJeremy L Thompson 
2486eaf62fffSJeremy L Thompson   // -- QFunction
24872b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm));
24882b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP));
24892b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE));
24902b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP));
24912b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp));
24921c66c397SJeremy L Thompson 
2493eaf62fffSJeremy L Thompson   // -- QFunction context
24941c66c397SJeremy L Thompson   {
2495eaf62fffSJeremy L Thompson     CeedInt *num_comp_data;
24961c66c397SJeremy L Thompson 
24972b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_data));
2498eaf62fffSJeremy L Thompson     num_comp_data[0] = num_comp;
24992b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm));
25002b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data));
25011c66c397SJeremy L Thompson   }
25022b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm));
25032b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_fdm));
25041c66c397SJeremy L Thompson 
2505eaf62fffSJeremy L Thompson   // -- Operator
25062b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv));
25072b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
25082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data));
25092b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2510eaf62fffSJeremy L Thompson 
2511eaf62fffSJeremy L Thompson   // Cleanup
25122b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_data));
25132b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&fdm_basis));
25142b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i));
25152b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_fdm));
2516eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2517eaf62fffSJeremy L Thompson }
2518eaf62fffSJeremy L Thompson 
2519eaf62fffSJeremy L Thompson /// @}
2520