xref: /libCEED/rust/libceed-sys/c-src/interface/ceed-preconditioning.c (revision b05f7e9f18319d38f6812c09171b3c228477e742)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3eaf62fffSJeremy L Thompson //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5eaf62fffSJeremy L Thompson //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7eaf62fffSJeremy L Thompson 
82b730f8bSJeremy L Thompson #include <ceed-impl.h>
949aac155SJeremy L Thompson #include <ceed.h>
102b730f8bSJeremy L Thompson #include <ceed/backend.h>
11c85e8640SSebastian Grimberg #include <assert.h>
122b730f8bSJeremy L Thompson #include <math.h>
13eaf62fffSJeremy L Thompson #include <stdbool.h>
14eaf62fffSJeremy L Thompson #include <stdio.h>
15eaf62fffSJeremy L Thompson #include <string.h>
16eaf62fffSJeremy L Thompson 
17eaf62fffSJeremy L Thompson /// @file
18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces
19eaf62fffSJeremy L Thompson 
20eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions
22eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper
24eaf62fffSJeremy L Thompson /// @{
25eaf62fffSJeremy L Thompson 
26eaf62fffSJeremy L Thompson /**
27ea61e9acSJeremy L Thompson   @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality
289e77b9c8SJeremy L Thompson 
2901ea9c81SJed Brown   @param[in]  fallback_ceed Ceed on which to create fallback CeedQFunction
309e77b9c8SJeremy L Thompson   @param[in]  qf            CeedQFunction to create fallback for
3101ea9c81SJed Brown   @param[out] qf_fallback   fallback CeedQFunction
329e77b9c8SJeremy L Thompson 
339e77b9c8SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
349e77b9c8SJeremy L Thompson 
359e77b9c8SJeremy L Thompson   @ref Developer
369e77b9c8SJeremy L Thompson **/
372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) {
389e77b9c8SJeremy L Thompson   // Check if NULL qf passed in
399e77b9c8SJeremy L Thompson   if (!qf) return CEED_ERROR_SUCCESS;
409e77b9c8SJeremy L Thompson 
41d04bbc78SJeremy L Thompson   CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n");
4213f886e9SJeremy L Thompson   CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n");
43d04bbc78SJeremy L Thompson 
441862681bSJeremy Luke Thompson   char *source_path_with_name = NULL;
459e77b9c8SJeremy L Thompson   if (qf->source_path) {
462b730f8bSJeremy L Thompson     size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name);
472b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name));
489e77b9c8SJeremy L Thompson     memcpy(source_path_with_name, qf->source_path, path_len);
499e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len], ":", 1);
509e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len);
519e77b9c8SJeremy L Thompson   } else {
522b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &source_path_with_name));
539e77b9c8SJeremy L Thompson   }
549e77b9c8SJeremy L Thompson 
552b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback));
569e77b9c8SJeremy L Thompson   {
579e77b9c8SJeremy L Thompson     CeedQFunctionContext ctx;
589e77b9c8SJeremy L Thompson 
592b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionGetContext(qf, &ctx));
602b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx));
619e77b9c8SJeremy L Thompson   }
629e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_input_fields; i++) {
632b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode));
649e77b9c8SJeremy L Thompson   }
659e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_output_fields; i++) {
662b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode));
679e77b9c8SJeremy L Thompson   }
682b730f8bSJeremy L Thompson   CeedCall(CeedFree(&source_path_with_name));
699e77b9c8SJeremy L Thompson 
709e77b9c8SJeremy L Thompson   return CEED_ERROR_SUCCESS;
719e77b9c8SJeremy L Thompson }
729e77b9c8SJeremy L Thompson 
739e77b9c8SJeremy L Thompson /**
74ea61e9acSJeremy L Thompson   @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality
75eaf62fffSJeremy L Thompson 
76ea61e9acSJeremy L Thompson   @param[in,out] op CeedOperator to create fallback for
77eaf62fffSJeremy L Thompson 
78eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
79eaf62fffSJeremy L Thompson 
80eaf62fffSJeremy L Thompson   @ref Developer
81eaf62fffSJeremy L Thompson **/
82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) {
83b275c451SJeremy L Thompson   bool is_composite;
849e77b9c8SJeremy L Thompson   Ceed ceed_fallback;
85eaf62fffSJeremy L Thompson 
86805fe78eSJeremy L Thompson   // Check not already created
87805fe78eSJeremy L Thompson   if (op->op_fallback) return CEED_ERROR_SUCCESS;
88805fe78eSJeremy L Thompson 
89eaf62fffSJeremy L Thompson   // Fallback Ceed
902b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
91d04bbc78SJeremy L Thompson   if (!ceed_fallback) return CEED_ERROR_SUCCESS;
92d04bbc78SJeremy L Thompson 
93d04bbc78SJeremy L Thompson   CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
9413f886e9SJeremy L Thompson   CeedDebug(op->ceed, "Creating fallback CeedOperator\n");
95eaf62fffSJeremy L Thompson 
96eaf62fffSJeremy L Thompson   // Clone Op
97805fe78eSJeremy L Thompson   CeedOperator op_fallback;
98b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
99b275c451SJeremy L Thompson   if (is_composite) {
100b275c451SJeremy L Thompson     CeedInt       num_suboperators;
101b275c451SJeremy L Thompson     CeedOperator *sub_operators;
102b275c451SJeremy L Thompson 
1032b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback));
104b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
105b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
106b275c451SJeremy L Thompson     for (CeedInt i = 0; i < num_suboperators; i++) {
107d04bbc78SJeremy L Thompson       CeedOperator op_sub_fallback;
108d04bbc78SJeremy L Thompson 
109b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback));
1102b730f8bSJeremy L Thompson       CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback));
111805fe78eSJeremy L Thompson     }
112805fe78eSJeremy L Thompson   } else {
1139e77b9c8SJeremy L Thompson     CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL;
1142b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback));
1152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback));
1162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback));
1172b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback));
118805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_input_fields; i++) {
119437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis,
1202b730f8bSJeremy L Thompson                                     op->input_fields[i]->vec));
121805fe78eSJeremy L Thompson     }
122805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_output_fields; i++) {
123437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis,
1242b730f8bSJeremy L Thompson                                     op->output_fields[i]->vec));
125805fe78eSJeremy L Thompson     }
1262b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled));
127febe2972SJeremy L Thompson     if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts));
1289e77b9c8SJeremy L Thompson     // Cleanup
1292b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&qf_fallback));
1302b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqf_fallback));
1312b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqfT_fallback));
132805fe78eSJeremy L Thompson   }
1332b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(op_fallback, op->name));
1342b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fallback));
135*b05f7e9fSJeremy L Thompson   // Note: No ref-counting here so we don't get caught in a reference loop.
136*b05f7e9fSJeremy L Thompson   //       The op holds the only reference to op_fallback and is responsible for deleting itself and op_fallback.
137805fe78eSJeremy L Thompson   op->op_fallback                 = op_fallback;
138*b05f7e9fSJeremy L Thompson   op_fallback->op_fallback_parent = op;
139eaf62fffSJeremy L Thompson 
140eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
141eaf62fffSJeremy L Thompson }
142eaf62fffSJeremy L Thompson 
143eaf62fffSJeremy L Thompson /**
144ea61e9acSJeremy L Thompson   @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality
145d04bbc78SJeremy L Thompson 
146d04bbc78SJeremy L Thompson   @param[in]  op          CeedOperator to retrieve fallback for
147d04bbc78SJeremy L Thompson   @param[out] op_fallback Fallback CeedOperator
148d04bbc78SJeremy L Thompson 
149d04bbc78SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
150d04bbc78SJeremy L Thompson 
151d04bbc78SJeremy L Thompson   @ref Developer
152d04bbc78SJeremy L Thompson **/
153d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) {
154d04bbc78SJeremy L Thompson   // Create if needed
155d04bbc78SJeremy L Thompson   if (!op->op_fallback) {
1562b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreateFallback(op));
157d04bbc78SJeremy L Thompson   }
158d04bbc78SJeremy L Thompson   if (op->op_fallback) {
159d04bbc78SJeremy L Thompson     bool is_debug;
160d04bbc78SJeremy L Thompson 
1612b730f8bSJeremy L Thompson     CeedCall(CeedIsDebug(op->ceed, &is_debug));
162d04bbc78SJeremy L Thompson     if (is_debug) {
163b275c451SJeremy L Thompson       Ceed        ceed, ceed_fallback;
164d04bbc78SJeremy L Thompson       const char *resource, *resource_fallback;
165d04bbc78SJeremy L Thompson 
166b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetCeed(op, &ceed));
167b275c451SJeremy L Thompson       CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback));
168b275c451SJeremy L Thompson       CeedCall(CeedGetResource(ceed, &resource));
1692b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(ceed_fallback, &resource_fallback));
170d04bbc78SJeremy L Thompson 
17123d4529eSJeremy L Thompson       CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n");
172b275c451SJeremy L Thompson       CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback,
1732b730f8bSJeremy L Thompson                 op->op_fallback);
174d04bbc78SJeremy L Thompson     }
175d04bbc78SJeremy L Thompson   }
176d04bbc78SJeremy L Thompson   *op_fallback = op->op_fallback;
177d04bbc78SJeremy L Thompson 
178d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
179d04bbc78SJeremy L Thompson }
180d04bbc78SJeremy L Thompson 
181d04bbc78SJeremy L Thompson /**
182eaf62fffSJeremy L Thompson   @brief Select correct basis matrix pointer based on CeedEvalMode
183eaf62fffSJeremy L Thompson 
184352a5e7cSSebastian Grimberg   @param[in]  basis     CeedBasis from which to get the basis matrix
185eaf62fffSJeremy L Thompson   @param[in]  eval_mode Current basis evaluation mode
186eaf62fffSJeremy L Thompson   @param[in]  identity  Pointer to identity matrix
187eaf62fffSJeremy L Thompson   @param[out] basis_ptr Basis pointer to set
188eaf62fffSJeremy L Thompson 
189eaf62fffSJeremy L Thompson   @ref Developer
190eaf62fffSJeremy L Thompson **/
191352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) {
192eaf62fffSJeremy L Thompson   switch (eval_mode) {
193eaf62fffSJeremy L Thompson     case CEED_EVAL_NONE:
194eaf62fffSJeremy L Thompson       *basis_ptr = identity;
195eaf62fffSJeremy L Thompson       break;
196eaf62fffSJeremy L Thompson     case CEED_EVAL_INTERP:
197352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetInterp(basis, basis_ptr));
198eaf62fffSJeremy L Thompson       break;
199eaf62fffSJeremy L Thompson     case CEED_EVAL_GRAD:
200352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetGrad(basis, basis_ptr));
201352a5e7cSSebastian Grimberg       break;
202352a5e7cSSebastian Grimberg     case CEED_EVAL_DIV:
203352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetDiv(basis, basis_ptr));
204352a5e7cSSebastian Grimberg       break;
205352a5e7cSSebastian Grimberg     case CEED_EVAL_CURL:
206352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetCurl(basis, basis_ptr));
207eaf62fffSJeremy L Thompson       break;
208eaf62fffSJeremy L Thompson     case CEED_EVAL_WEIGHT:
209eaf62fffSJeremy L Thompson       break;  // Caught by QF Assembly
210eaf62fffSJeremy L Thompson   }
211ed9e99e6SJeremy L Thompson   assert(*basis_ptr != NULL);
212352a5e7cSSebastian Grimberg 
213352a5e7cSSebastian Grimberg   return CEED_ERROR_SUCCESS;
214eaf62fffSJeremy L Thompson }
215eaf62fffSJeremy L Thompson 
216eaf62fffSJeremy L Thompson /**
217eaf62fffSJeremy L Thompson   @brief Create point block restriction for active operator field
218eaf62fffSJeremy L Thompson 
219eaf62fffSJeremy L Thompson   @param[in]  rstr            Original CeedElemRestriction for active field
220ea61e9acSJeremy L Thompson   @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored
221eaf62fffSJeremy L Thompson 
222eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
223eaf62fffSJeremy L Thompson 
224eaf62fffSJeremy L Thompson   @ref Developer
225eaf62fffSJeremy L Thompson **/
2262b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) {
227eaf62fffSJeremy L Thompson   Ceed ceed;
2282b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed));
229eaf62fffSJeremy L Thompson   const CeedInt *offsets;
2302b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets));
231eaf62fffSJeremy L Thompson 
232eaf62fffSJeremy L Thompson   // Expand offsets
2337b63f5c6SJed Brown   CeedInt  num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets;
2347b63f5c6SJed Brown   CeedSize l_size;
2352b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
2362b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
2372b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
2382b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride));
2392b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
240eaf62fffSJeremy L Thompson   CeedInt shift = num_comp;
2412b730f8bSJeremy L Thompson   if (comp_stride != 1) shift *= num_comp;
2422b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets));
243eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_elem * elem_size; i++) {
244eaf62fffSJeremy L Thompson     pointblock_offsets[i] = offsets[i] * shift;
245eaf62fffSJeremy L Thompson   }
246eaf62fffSJeremy L Thompson 
247eaf62fffSJeremy L Thompson   // Create new restriction
2482b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER,
2492b730f8bSJeremy L Thompson                                      pointblock_offsets, pointblock_rstr));
250eaf62fffSJeremy L Thompson 
251eaf62fffSJeremy L Thompson   // Cleanup
2522b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets));
253eaf62fffSJeremy L Thompson 
254eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
255eaf62fffSJeremy L Thompson }
256eaf62fffSJeremy L Thompson 
257eaf62fffSJeremy L Thompson /**
258eaf62fffSJeremy L Thompson   @brief Core logic for assembling operator diagonal or point block diagonal
259eaf62fffSJeremy L Thompson 
260eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
261ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
262eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
263eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
264eaf62fffSJeremy L Thompson 
265eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
266eaf62fffSJeremy L Thompson 
267eaf62fffSJeremy L Thompson   @ref Developer
268eaf62fffSJeremy L Thompson **/
2692b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) {
270eaf62fffSJeremy L Thompson   Ceed ceed;
2712b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
272eaf62fffSJeremy L Thompson 
273eaf62fffSJeremy L Thompson   // Assemble QFunction
274eaf62fffSJeremy L Thompson   CeedQFunction       qf;
275437c7c90SJeremy L Thompson   const CeedScalar   *assembled_qf_array;
276c5f45aeaSJeremy L Thompson   CeedVector          assembled_qf        = NULL;
277c5f45aeaSJeremy L Thompson   CeedElemRestriction assembled_elem_rstr = NULL;
278437c7c90SJeremy L Thompson   CeedInt             num_input_fields, num_output_fields;
279eaf62fffSJeremy L Thompson   CeedInt             layout[3];
280437c7c90SJeremy L Thompson 
281437c7c90SJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
282437c7c90SJeremy L Thompson   CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
283437c7c90SJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request));
284437c7c90SJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout));
285437c7c90SJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr));
286437c7c90SJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
287eaf62fffSJeremy L Thompson 
288ed9e99e6SJeremy L Thompson   // Get assembly data
289ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
290437c7c90SJeremy L Thompson   const CeedEvalMode     **eval_modes_in, **eval_modes_out;
291437c7c90SJeremy L Thompson   CeedInt                 *num_eval_modes_in, *num_eval_modes_out, num_active_bases;
292437c7c90SJeremy L Thompson   CeedSize               **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components;
293437c7c90SJeremy L Thompson   CeedBasis               *active_bases;
294437c7c90SJeremy L Thompson   CeedElemRestriction     *active_elem_rstrs;
295437c7c90SJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
296437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in,
297437c7c90SJeremy L Thompson                                                 &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out, &num_output_components));
298437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases, NULL, NULL));
299437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs));
300437c7c90SJeremy L Thompson 
301437c7c90SJeremy L Thompson   // Loop over all active bases
302437c7c90SJeremy L Thompson   for (CeedInt b = 0; b < num_active_bases; b++) {
303eaf62fffSJeremy L Thompson     // Assemble point block diagonal restriction, if needed
304437c7c90SJeremy L Thompson     CeedElemRestriction diag_elem_rstr = active_elem_rstrs[b];
305437c7c90SJeremy L Thompson 
306eaf62fffSJeremy L Thompson     if (is_pointblock) {
307437c7c90SJeremy L Thompson       CeedElemRestriction point_block_elem_rstr;
308437c7c90SJeremy L Thompson 
309437c7c90SJeremy L Thompson       CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_elem_rstr, &point_block_elem_rstr));
310437c7c90SJeremy L Thompson       diag_elem_rstr = point_block_elem_rstr;
311eaf62fffSJeremy L Thompson     }
312eaf62fffSJeremy L Thompson 
313eaf62fffSJeremy L Thompson     // Create diagonal vector
314eaf62fffSJeremy L Thompson     CeedVector elem_diag;
315437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag));
316eaf62fffSJeremy L Thompson 
317eaf62fffSJeremy L Thompson     // Assemble element operator diagonals
3189c774eddSJeremy L Thompson     CeedScalar *elem_diag_array;
319437c7c90SJeremy L Thompson     CeedInt     num_elem, num_nodes, num_qpts, num_components;
320437c7c90SJeremy L Thompson 
3212b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(elem_diag, 0.0));
3222b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array));
323437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem));
324437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(active_bases[b], &num_nodes));
325437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(active_bases[b], &num_components));
326437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(active_bases[b], &num_qpts));
327ed9e99e6SJeremy L Thompson 
328352a5e7cSSebastian Grimberg     // Construct identity matrix for basis if required
329ed9e99e6SJeremy L Thompson     bool        has_eval_none = false;
330352a5e7cSSebastian Grimberg     CeedScalar *identity      = NULL;
331437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) {
332437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE);
333ed9e99e6SJeremy L Thompson     }
334437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) {
335437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE);
336ed9e99e6SJeremy L Thompson     }
337ed9e99e6SJeremy L Thompson     if (has_eval_none) {
3382b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
3392b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0;
340eaf62fffSJeremy L Thompson     }
341352a5e7cSSebastian Grimberg 
342eaf62fffSJeremy L Thompson     // Compute the diagonal of B^T D B
343eaf62fffSJeremy L Thompson     // Each element
344b94338b9SJed Brown     for (CeedSize e = 0; e < num_elem; e++) {
345eaf62fffSJeremy L Thompson       // Each basis eval mode pair
346352a5e7cSSebastian Grimberg       CeedInt      d_out              = 0, q_comp_out;
347352a5e7cSSebastian Grimberg       CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
348437c7c90SJeremy L Thompson       for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) {
349437c7c90SJeremy L Thompson         const CeedScalar *B_t = NULL;
350352a5e7cSSebastian Grimberg         CeedOperatorGetBasisPointer(active_bases[b], eval_modes_out[b][e_out], identity, &B_t);
351352a5e7cSSebastian Grimberg         CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_out[b][e_out], &q_comp_out));
352352a5e7cSSebastian Grimberg         if (q_comp_out > 1) {
353352a5e7cSSebastian Grimberg           if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
354352a5e7cSSebastian Grimberg           else B_t = &B_t[(++d_out) * num_qpts * num_nodes];
355352a5e7cSSebastian Grimberg         }
356352a5e7cSSebastian Grimberg         eval_mode_out_prev = eval_modes_out[b][e_out];
357352a5e7cSSebastian Grimberg 
358352a5e7cSSebastian Grimberg         CeedInt      d_in              = 0, q_comp_in;
359352a5e7cSSebastian Grimberg         CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE;
360437c7c90SJeremy L Thompson         for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) {
361437c7c90SJeremy L Thompson           const CeedScalar *B = NULL;
362352a5e7cSSebastian Grimberg           CeedOperatorGetBasisPointer(active_bases[b], eval_modes_in[b][e_in], identity, &B);
363352a5e7cSSebastian Grimberg           CeedCall(CeedBasisGetNumQuadratureComponents(active_bases[b], eval_modes_in[b][e_in], &q_comp_in));
364352a5e7cSSebastian Grimberg           if (q_comp_in > 1) {
365352a5e7cSSebastian Grimberg             if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
366352a5e7cSSebastian Grimberg             else B = &B[(++d_in) * num_qpts * num_nodes];
367352a5e7cSSebastian Grimberg           }
368352a5e7cSSebastian Grimberg           eval_mode_in_prev = eval_modes_in[b][e_in];
369352a5e7cSSebastian Grimberg 
370eaf62fffSJeremy L Thompson           // Each component
371437c7c90SJeremy L Thompson           for (CeedInt c_out = 0; c_out < num_components; c_out++) {
372437c7c90SJeremy L Thompson             // Each qpt/node pair
3732b730f8bSJeremy L Thompson             for (CeedInt q = 0; q < num_qpts; q++) {
374eaf62fffSJeremy L Thompson               if (is_pointblock) {
375eaf62fffSJeremy L Thompson                 // Point Block Diagonal
376437c7c90SJeremy L Thompson                 for (CeedInt c_in = 0; c_in < num_components; c_in++) {
377b94338b9SJed Brown                   const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
378437c7c90SJeremy L Thompson                   const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]];
3792b730f8bSJeremy L Thompson                   for (CeedInt n = 0; n < num_nodes; n++) {
380437c7c90SJeremy L Thompson                     elem_diag_array[((e * num_components + c_out) * num_components + c_in) * num_nodes + n] +=
381437c7c90SJeremy L Thompson                         B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
382eaf62fffSJeremy L Thompson                   }
3832b730f8bSJeremy L Thompson                 }
384eaf62fffSJeremy L Thompson               } else {
385eaf62fffSJeremy L Thompson                 // Diagonal Only
386437c7c90SJeremy L Thompson                 const CeedInt    c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
387437c7c90SJeremy L Thompson                 const CeedScalar qf_value = assembled_qf_array[q * layout[0] + c_offset * layout[1] + e * layout[2]];
3882b730f8bSJeremy L Thompson                 for (CeedInt n = 0; n < num_nodes; n++) {
389437c7c90SJeremy L Thompson                   elem_diag_array[(e * num_components + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
390eaf62fffSJeremy L Thompson                 }
391eaf62fffSJeremy L Thompson               }
392eaf62fffSJeremy L Thompson             }
393eaf62fffSJeremy L Thompson           }
3942b730f8bSJeremy L Thompson         }
3952b730f8bSJeremy L Thompson       }
3962b730f8bSJeremy L Thompson     }
3972b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array));
398eaf62fffSJeremy L Thompson 
399eaf62fffSJeremy L Thompson     // Assemble local operator diagonal
400f30b1135SSebastian Grimberg     CeedCall(CeedElemRestrictionApplyUnsigned(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request));
401eaf62fffSJeremy L Thompson 
402eaf62fffSJeremy L Thompson     // Cleanup
403437c7c90SJeremy L Thompson     if (is_pointblock) CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr));
4042b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&elem_diag));
4052b730f8bSJeremy L Thompson     CeedCall(CeedFree(&identity));
406437c7c90SJeremy L Thompson   }
407437c7c90SJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
408437c7c90SJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
409eaf62fffSJeremy L Thompson 
410eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
411eaf62fffSJeremy L Thompson }
412eaf62fffSJeremy L Thompson 
413eaf62fffSJeremy L Thompson /**
414eaf62fffSJeremy L Thompson   @brief Core logic for assembling composite operator diagonal
415eaf62fffSJeremy L Thompson 
416eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
417ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
418eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
419eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
420eaf62fffSJeremy L Thompson 
421eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
422eaf62fffSJeremy L Thompson 
423eaf62fffSJeremy L Thompson   @ref Developer
424eaf62fffSJeremy L Thompson **/
4252b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock,
426eaf62fffSJeremy L Thompson                                                                  CeedVector assembled) {
427eaf62fffSJeremy L Thompson   CeedInt       num_sub;
428eaf62fffSJeremy L Thompson   CeedOperator *suboperators;
429c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub));
430c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators));
431eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_sub; i++) {
4326aa95790SJeremy L Thompson     if (is_pointblock) {
4332b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request));
4346aa95790SJeremy L Thompson     } else {
4352b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request));
4366aa95790SJeremy L Thompson     }
437eaf62fffSJeremy L Thompson   }
438eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
439eaf62fffSJeremy L Thompson }
440eaf62fffSJeremy L Thompson 
441eaf62fffSJeremy L Thompson /**
442eaf62fffSJeremy L Thompson   @brief Build nonzero pattern for non-composite operator
443eaf62fffSJeremy L Thompson 
444eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssembleSymbolic()
445eaf62fffSJeremy L Thompson 
4463bdd4e5aSSebastian Grimberg   Note: For operators using oriented element restrictions, entries in rows or cols may be negative indicating the assembled value at this nonzero
4473bdd4e5aSSebastian Grimberg should be negated
448f30b1135SSebastian Grimberg 
449eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble nonzero pattern
450eaf62fffSJeremy L Thompson   @param[in]  offset Offset for number of entries
451eaf62fffSJeremy L Thompson   @param[out] rows   Row number for each entry
452eaf62fffSJeremy L Thompson   @param[out] cols   Column number for each entry
453eaf62fffSJeremy L Thompson 
454eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
455eaf62fffSJeremy L Thompson 
456eaf62fffSJeremy L Thompson   @ref Developer
457eaf62fffSJeremy L Thompson **/
4582b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) {
459f3d47e36SJeremy L Thompson   Ceed ceed;
460f3d47e36SJeremy L Thompson   bool is_composite;
461f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
462f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
463f3d47e36SJeremy L Thompson 
4646574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
465eaf62fffSJeremy L Thompson 
466c9366a6bSJeremy L Thompson   CeedSize num_nodes;
4672b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL));
468eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_in;
4692b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in));
470e79b91d9SJeremy L Thompson   CeedInt num_elem, elem_size, num_comp;
4712b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem));
4722b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size));
4732b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp));
474eaf62fffSJeremy L Thompson   CeedInt layout_er[3];
4752b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er));
476eaf62fffSJeremy L Thompson 
477eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
478eaf62fffSJeremy L Thompson 
479eaf62fffSJeremy L Thompson   // Determine elem_dof relation
480eaf62fffSJeremy L Thompson   CeedVector index_vec;
4812b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec));
482eaf62fffSJeremy L Thompson   CeedScalar *array;
4832b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array));
484ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_nodes; i++) array[i] = i;
4852b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(index_vec, &array));
486eaf62fffSJeremy L Thompson   CeedVector elem_dof;
4872b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof));
4882b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_dof, 0.0));
4892b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE));
490eaf62fffSJeremy L Thompson   const CeedScalar *elem_dof_a;
4912b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a));
4922b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&index_vec));
493eaf62fffSJeremy L Thompson 
494eaf62fffSJeremy L Thompson   // Determine i, j locations for element matrices
495b94338b9SJed Brown   CeedSize count = 0;
496ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
497ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
498ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
499ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
500ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
5012b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2];
5022b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2];
503eaf62fffSJeremy L Thompson 
504eaf62fffSJeremy L Thompson             const CeedInt row = elem_dof_a[elem_dof_index_row];
505eaf62fffSJeremy L Thompson             const CeedInt col = elem_dof_a[elem_dof_index_col];
506eaf62fffSJeremy L Thompson 
507eaf62fffSJeremy L Thompson             rows[offset + count] = row;
508eaf62fffSJeremy L Thompson             cols[offset + count] = col;
509eaf62fffSJeremy L Thompson             count++;
510eaf62fffSJeremy L Thompson           }
511eaf62fffSJeremy L Thompson         }
512eaf62fffSJeremy L Thompson       }
513eaf62fffSJeremy L Thompson     }
514eaf62fffSJeremy L Thompson   }
5156574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries");
5162b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a));
5172b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_dof));
518eaf62fffSJeremy L Thompson 
519eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
520eaf62fffSJeremy L Thompson }
521eaf62fffSJeremy L Thompson 
522eaf62fffSJeremy L Thompson /**
523eaf62fffSJeremy L Thompson   @brief Assemble nonzero entries for non-composite operator
524eaf62fffSJeremy L Thompson 
525eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssemble()
526eaf62fffSJeremy L Thompson 
527eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble
528ea61e9acSJeremy L Thompson   @param[in]  offset Offset for number of entries
529eaf62fffSJeremy L Thompson   @param[out] values Values to assemble into matrix
530eaf62fffSJeremy L Thompson 
531eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
532eaf62fffSJeremy L Thompson 
533eaf62fffSJeremy L Thompson   @ref Developer
534eaf62fffSJeremy L Thompson **/
5352b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) {
536f3d47e36SJeremy L Thompson   Ceed ceed;
537f3d47e36SJeremy L Thompson   bool is_composite;
538f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
539f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
540f3d47e36SJeremy L Thompson 
5416574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
542f3d47e36SJeremy L Thompson 
543f3d47e36SJeremy L Thompson   // Early exit for empty operator
544f3d47e36SJeremy L Thompson   {
545f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
546f3d47e36SJeremy L Thompson 
547f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
548f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
549f3d47e36SJeremy L Thompson   }
550eaf62fffSJeremy L Thompson 
551cefa2673SJeremy L Thompson   if (op->LinearAssembleSingle) {
552cefa2673SJeremy L Thompson     // Backend version
5532b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSingle(op, offset, values));
554cefa2673SJeremy L Thompson     return CEED_ERROR_SUCCESS;
555cefa2673SJeremy L Thompson   } else {
556cefa2673SJeremy L Thompson     // Operator fallback
557cefa2673SJeremy L Thompson     CeedOperator op_fallback;
558cefa2673SJeremy L Thompson 
5592b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
560cefa2673SJeremy L Thompson     if (op_fallback) {
5612b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values));
562cefa2673SJeremy L Thompson       return CEED_ERROR_SUCCESS;
563cefa2673SJeremy L Thompson     }
564cefa2673SJeremy L Thompson   }
565cefa2673SJeremy L Thompson 
566eaf62fffSJeremy L Thompson   // Assemble QFunction
567eaf62fffSJeremy L Thompson   CeedQFunction qf;
5682b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
569c5f45aeaSJeremy L Thompson   CeedVector          assembled_qf = NULL;
570c5f45aeaSJeremy L Thompson   CeedElemRestriction rstr_q       = NULL;
5712b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE));
5721f9221feSJeremy L Thompson   CeedSize qf_length;
5732b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetLength(assembled_qf, &qf_length));
574eaf62fffSJeremy L Thompson 
5757e7773b5SJeremy L Thompson   CeedInt            num_input_fields, num_output_fields;
576eaf62fffSJeremy L Thompson   CeedOperatorField *input_fields;
577eaf62fffSJeremy L Thompson   CeedOperatorField *output_fields;
5782b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields));
579eaf62fffSJeremy L Thompson 
580ed9e99e6SJeremy L Thompson   // Get assembly data
581ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
5822b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
583437c7c90SJeremy L Thompson   const CeedEvalMode **eval_modes_in, **eval_modes_out;
584437c7c90SJeremy L Thompson   CeedInt             *num_eval_modes_in, *num_eval_modes_out, num_active_bases;
585437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases, &num_eval_modes_in, &eval_modes_in, NULL, &num_eval_modes_out,
586437c7c90SJeremy L Thompson                                                 &eval_modes_out, NULL, NULL));
587437c7c90SJeremy L Thompson   CeedBasis *bases;
588437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &bases, NULL, NULL));
589437c7c90SJeremy L Thompson   CeedBasis basis_in = bases[0];
590eaf62fffSJeremy L Thompson 
5916574a04fSJeremy L Thompson   CeedCheck(num_active_bases == 1, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with multiple active bases");
5926574a04fSJeremy L Thompson   CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs");
593eaf62fffSJeremy L Thompson 
594ed9e99e6SJeremy L Thompson   CeedElemRestriction active_rstr;
595eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_qpts, num_comp;
5962b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr));
5972b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem));
5982b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size));
5992b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp));
6002b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
601eaf62fffSJeremy L Thompson 
602eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
603eaf62fffSJeremy L Thompson 
604eaf62fffSJeremy L Thompson   // loop over elements and put in data structure
605eaf62fffSJeremy L Thompson   const CeedScalar *assembled_qf_array;
6062b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
607eaf62fffSJeremy L Thompson 
608eaf62fffSJeremy L Thompson   CeedInt layout_qf[3];
6092b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf));
6102b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_q));
611eaf62fffSJeremy L Thompson 
612eaf62fffSJeremy L Thompson   // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order
613437c7c90SJeremy L Thompson   const CeedScalar **B_mats_in, **B_mats_out;
614437c7c90SJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, NULL, &B_mats_in, &B_mats_out));
615437c7c90SJeremy L Thompson   const CeedScalar *B_mat_in = B_mats_in[0], *B_mat_out = B_mats_out[0];
616437c7c90SJeremy L Thompson   CeedScalar        BTD_mat[elem_size * num_qpts * num_eval_modes_in[0]];
617eaf62fffSJeremy L Thompson   CeedScalar        elem_mat[elem_size * elem_size];
618b94338b9SJed Brown   CeedSize          count = 0;
619eaf62fffSJeremy L Thompson   CeedScalar       *vals;
62028ec399dSJeremy L Thompson   CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals));
621b94338b9SJed Brown   for (CeedSize e = 0; e < num_elem; e++) {
622ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
623ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
624ed9e99e6SJeremy L Thompson         // Compute B^T*D
625b94338b9SJed Brown         for (CeedSize n = 0; n < elem_size; n++) {
626b94338b9SJed Brown           for (CeedSize q = 0; q < num_qpts; q++) {
627437c7c90SJeremy L Thompson             for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) {
628b94338b9SJed Brown               const CeedSize btd_index = n * (num_qpts * num_eval_modes_in[0]) + (num_eval_modes_in[0] * q + e_in);
629067fd99fSJeremy L Thompson               CeedScalar     sum       = 0.0;
630437c7c90SJeremy L Thompson               for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) {
631b94338b9SJed Brown                 const CeedSize b_out_index     = (num_eval_modes_out[0] * q + e_out) * elem_size + n;
632b94338b9SJed Brown                 const CeedSize eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_modes_out[0] + e_out) * num_comp + comp_out;
633b94338b9SJed Brown                 const CeedSize qf_index        = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2];
634067fd99fSJeremy L Thompson                 sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index];
635eaf62fffSJeremy L Thompson               }
636067fd99fSJeremy L Thompson               BTD_mat[btd_index] = sum;
637ed9e99e6SJeremy L Thompson             }
638ed9e99e6SJeremy L Thompson           }
639eaf62fffSJeremy L Thompson         }
640eaf62fffSJeremy L Thompson         // form element matrix itself (for each block component)
641437c7c90SJeremy L Thompson         CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_modes_in[0]));
642eaf62fffSJeremy L Thompson 
643eaf62fffSJeremy L Thompson         // put element matrix in coordinate data structure
644ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
645ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
646eaf62fffSJeremy L Thompson             vals[offset + count] = elem_mat[i * elem_size + j];
647eaf62fffSJeremy L Thompson             count++;
648eaf62fffSJeremy L Thompson           }
649eaf62fffSJeremy L Thompson         }
650eaf62fffSJeremy L Thompson       }
651eaf62fffSJeremy L Thompson     }
652eaf62fffSJeremy L Thompson   }
6536574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries");
6542b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(values, &vals));
655eaf62fffSJeremy L Thompson 
6562b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
6572b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
658eaf62fffSJeremy L Thompson 
659eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
660eaf62fffSJeremy L Thompson }
661eaf62fffSJeremy L Thompson 
662eaf62fffSJeremy L Thompson /**
663eaf62fffSJeremy L Thompson   @brief Count number of entries for assembled CeedOperator
664eaf62fffSJeremy L Thompson 
665eaf62fffSJeremy L Thompson   @param[in]  op          CeedOperator to assemble
666eaf62fffSJeremy L Thompson   @param[out] num_entries Number of entries in assembled representation
667eaf62fffSJeremy L Thompson 
668eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
669eaf62fffSJeremy L Thompson 
670eaf62fffSJeremy L Thompson   @ref Utility
671eaf62fffSJeremy L Thompson **/
672b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) {
673b275c451SJeremy L Thompson   bool                is_composite;
674eaf62fffSJeremy L Thompson   CeedElemRestriction rstr;
675eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_comp;
676eaf62fffSJeremy L Thompson 
677b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
6786574a04fSJeremy L Thompson   CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
6792b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr));
6802b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
6812b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
6822b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
683b94338b9SJed Brown   *num_entries = (CeedSize)elem_size * num_comp * elem_size * num_comp * num_elem;
684eaf62fffSJeremy L Thompson 
685eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
686eaf62fffSJeremy L Thompson }
687eaf62fffSJeremy L Thompson 
688eaf62fffSJeremy L Thompson /**
689ea61e9acSJeremy L Thompson   @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator
690eaf62fffSJeremy L Thompson 
691eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
69285bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
693eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
694eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
69585bb9dcfSJeremy L Thompson   @param[in]  basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
696eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
69785bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
69885bb9dcfSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator, or NULL
699eaf62fffSJeremy L Thompson 
700eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
701eaf62fffSJeremy L Thompson 
702eaf62fffSJeremy L Thompson   @ref Developer
703eaf62fffSJeremy L Thompson **/
7042b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
7052b730f8bSJeremy L Thompson                                             CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
706eaf62fffSJeremy L Thompson   Ceed                ceed;
70785bb9dcfSJeremy L Thompson   CeedVector          mult_vec         = NULL;
708c17ec2beSJeremy L Thompson   CeedElemRestriction rstr_p_mult_fine = NULL;
7092b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
710eaf62fffSJeremy L Thompson 
711eaf62fffSJeremy L Thompson   // Check for composite operator
712eaf62fffSJeremy L Thompson   bool is_composite;
7132b730f8bSJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op_fine, &is_composite));
7146574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported");
715eaf62fffSJeremy L Thompson 
716eaf62fffSJeremy L Thompson   // Coarse Grid
7172b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse));
718eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_fine = NULL;
719eaf62fffSJeremy L Thompson   // -- Clone input fields
72092ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) {
721eaf62fffSJeremy L Thompson     if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) {
722437c7c90SJeremy L Thompson       rstr_fine = op_fine->input_fields[i]->elem_rstr;
7232b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
724eaf62fffSJeremy L Thompson     } else {
725437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr,
7262b730f8bSJeremy L Thompson                                     op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec));
727eaf62fffSJeremy L Thompson     }
728eaf62fffSJeremy L Thompson   }
729eaf62fffSJeremy L Thompson   // -- Clone output fields
73092ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) {
731eaf62fffSJeremy L Thompson     if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) {
7322b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
733eaf62fffSJeremy L Thompson     } else {
734437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr,
7352b730f8bSJeremy L Thompson                                     op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec));
736eaf62fffSJeremy L Thompson     }
737eaf62fffSJeremy L Thompson   }
738af99e877SJeremy L Thompson   // -- Clone QFunctionAssemblyData
7392b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled));
740eaf62fffSJeremy L Thompson 
741eaf62fffSJeremy L Thompson   // Multiplicity vector
74285bb9dcfSJeremy L Thompson   if (op_restrict || op_prolong) {
74385bb9dcfSJeremy L Thompson     CeedVector mult_e_vec;
74485bb9dcfSJeremy L Thompson 
745c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine));
7466574a04fSJeremy L Thompson     CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector");
7472b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec));
7482b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_e_vec, 0.0));
749c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE));
7502b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_vec, 0.0));
751c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE));
7522b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&mult_e_vec));
7532b730f8bSJeremy L Thompson     CeedCall(CeedVectorReciprocal(mult_vec));
75485bb9dcfSJeremy L Thompson   }
755eaf62fffSJeremy L Thompson 
756addd79feSZach Atkins   // Clone name
757addd79feSZach Atkins   bool   has_name = op_fine->name;
758addd79feSZach Atkins   size_t name_len = op_fine->name ? strlen(op_fine->name) : 0;
759addd79feSZach Atkins   CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name));
760addd79feSZach Atkins 
76183d6adf3SZach Atkins   // Check that coarse to fine basis is provided if prolong/restrict operators are requested
7626574a04fSJeremy L Thompson   CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE,
7636574a04fSJeremy L Thompson             "Prolongation or restriction operator creation requires coarse-to-fine basis");
76483d6adf3SZach Atkins 
76585bb9dcfSJeremy L Thompson   // Restriction/Prolongation Operators
766eaf62fffSJeremy L Thompson   CeedInt num_comp;
7672b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp));
768addd79feSZach Atkins 
769addd79feSZach Atkins   // Restriction
770addd79feSZach Atkins   if (op_restrict) {
771eaf62fffSJeremy L Thompson     CeedInt             *num_comp_r_data;
77285bb9dcfSJeremy L Thompson     CeedQFunction        qf_restrict;
77385bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_r;
77485bb9dcfSJeremy L Thompson 
77585bb9dcfSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict));
7762b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_r_data));
777eaf62fffSJeremy L Thompson     num_comp_r_data[0] = num_comp;
7782b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r));
7792b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data));
7802b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r));
7812b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_r));
7822b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE));
7832b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE));
7842b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP));
7852b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp));
786eaf62fffSJeremy L Thompson 
7872b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict));
7882b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
789c17ec2beSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec));
7902b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
791eaf62fffSJeremy L Thompson 
792addd79feSZach Atkins     // Set name
793addd79feSZach Atkins     char *restriction_name;
794addd79feSZach Atkins     CeedCall(CeedCalloc(17 + name_len, &restriction_name));
795addd79feSZach Atkins     sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
796addd79feSZach Atkins     CeedCall(CeedOperatorSetName(*op_restrict, restriction_name));
797addd79feSZach Atkins     CeedCall(CeedFree(&restriction_name));
798addd79feSZach Atkins 
799addd79feSZach Atkins     // Check
800addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_restrict));
801addd79feSZach Atkins 
802addd79feSZach Atkins     // Cleanup
803addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_restrict));
804addd79feSZach Atkins   }
805addd79feSZach Atkins 
806eaf62fffSJeremy L Thompson   // Prolongation
807addd79feSZach Atkins   if (op_prolong) {
808eaf62fffSJeremy L Thompson     CeedInt             *num_comp_p_data;
80985bb9dcfSJeremy L Thompson     CeedQFunction        qf_prolong;
81085bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_p;
81185bb9dcfSJeremy L Thompson 
81285bb9dcfSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong));
8132b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_p_data));
814eaf62fffSJeremy L Thompson     num_comp_p_data[0] = num_comp;
8152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p));
8162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data));
8172b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p));
8182b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_p));
8192b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP));
8202b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE));
8212b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE));
8222b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp));
823eaf62fffSJeremy L Thompson 
8242b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong));
8252b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
826c17ec2beSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_COLLOCATED, mult_vec));
8272b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
828eaf62fffSJeremy L Thompson 
829addd79feSZach Atkins     // Set name
830ea6b5821SJeremy L Thompson     char *prolongation_name;
8312b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(18 + name_len, &prolongation_name));
8322b730f8bSJeremy L Thompson     sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
8332b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name));
8342b730f8bSJeremy L Thompson     CeedCall(CeedFree(&prolongation_name));
835addd79feSZach Atkins 
836addd79feSZach Atkins     // Check
837addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_prolong));
838addd79feSZach Atkins 
839addd79feSZach Atkins     // Cleanup
840addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_prolong));
841ea6b5821SJeremy L Thompson   }
842ea6b5821SJeremy L Thompson 
84358e4b056SJeremy L Thompson   // Check
84458e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_coarse));
84558e4b056SJeremy L Thompson 
846eaf62fffSJeremy L Thompson   // Cleanup
8472b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_vec));
848c17ec2beSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine));
8492b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&basis_c_to_f));
850805fe78eSJeremy L Thompson 
851eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
852eaf62fffSJeremy L Thompson }
853eaf62fffSJeremy L Thompson 
854eaf62fffSJeremy L Thompson /**
855eaf62fffSJeremy L Thompson   @brief Build 1D mass matrix and Laplacian with perturbation
856eaf62fffSJeremy L Thompson 
857eaf62fffSJeremy L Thompson   @param[in]  interp_1d   Interpolation matrix in one dimension
858eaf62fffSJeremy L Thompson   @param[in]  grad_1d     Gradient matrix in one dimension
859eaf62fffSJeremy L Thompson   @param[in]  q_weight_1d Quadrature weights in one dimension
860eaf62fffSJeremy L Thompson   @param[in]  P_1d        Number of basis nodes in one dimension
861eaf62fffSJeremy L Thompson   @param[in]  Q_1d        Number of quadrature points in one dimension
862eaf62fffSJeremy L Thompson   @param[in]  dim         Dimension of basis
863eaf62fffSJeremy L Thompson   @param[out] mass        Assembled mass matrix in one dimension
864eaf62fffSJeremy L Thompson   @param[out] laplace     Assembled perturbed Laplacian in one dimension
865eaf62fffSJeremy L Thompson 
866eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
867eaf62fffSJeremy L Thompson 
868eaf62fffSJeremy L Thompson   @ref Developer
869eaf62fffSJeremy L Thompson **/
8702c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff
8712c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d,
8722c2ea1dbSJeremy L Thompson                                 CeedInt dim, CeedScalar *mass, CeedScalar *laplace) {
8732b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
874eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
875eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8762b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j];
877eaf62fffSJeremy L Thompson       mass[i + j * P_1d] = sum;
878eaf62fffSJeremy L Thompson     }
8792b730f8bSJeremy L Thompson   }
880eaf62fffSJeremy L Thompson   // -- Laplacian
8812b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
882eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
883eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8842b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j];
885eaf62fffSJeremy L Thompson       laplace[i + j * P_1d] = sum;
886eaf62fffSJeremy L Thompson     }
8872b730f8bSJeremy L Thompson   }
888eaf62fffSJeremy L Thompson   CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4;
8892b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation;
890eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
891eaf62fffSJeremy L Thompson }
8922c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn
893eaf62fffSJeremy L Thompson 
894eaf62fffSJeremy L Thompson /// @}
895eaf62fffSJeremy L Thompson 
896eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
897480fae85SJeremy L Thompson /// CeedOperator Backend API
898480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
899480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend
900480fae85SJeremy L Thompson /// @{
901480fae85SJeremy L Thompson 
902480fae85SJeremy L Thompson /**
903480fae85SJeremy L Thompson   @brief Create object holding CeedQFunction assembly data for CeedOperator
904480fae85SJeremy L Thompson 
905480fae85SJeremy L Thompson   @param[in]  ceed A Ceed object where the CeedQFunctionAssemblyData will be created
906ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored
907480fae85SJeremy L Thompson 
908480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
909480fae85SJeremy L Thompson 
910480fae85SJeremy L Thompson   @ref Backend
911480fae85SJeremy L Thompson **/
912ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) {
9132b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
914480fae85SJeremy L Thompson   (*data)->ref_count = 1;
915480fae85SJeremy L Thompson   (*data)->ceed      = ceed;
9162b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
917480fae85SJeremy L Thompson 
918480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
919480fae85SJeremy L Thompson }
920480fae85SJeremy L Thompson 
921480fae85SJeremy L Thompson /**
922480fae85SJeremy L Thompson   @brief Increment the reference counter for a CeedQFunctionAssemblyData
923480fae85SJeremy L Thompson 
924ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter
925480fae85SJeremy L Thompson 
926480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
927480fae85SJeremy L Thompson 
928480fae85SJeremy L Thompson   @ref Backend
929480fae85SJeremy L Thompson **/
930480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) {
931480fae85SJeremy L Thompson   data->ref_count++;
932480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
933480fae85SJeremy L Thompson }
934480fae85SJeremy L Thompson 
935480fae85SJeremy L Thompson /**
936beecbf24SJeremy L Thompson   @brief Set re-use of CeedQFunctionAssemblyData
9378b919e6bSJeremy L Thompson 
938ea61e9acSJeremy L Thompson   @param[in,out] data       CeedQFunctionAssemblyData to mark for reuse
939ea61e9acSJeremy L Thompson   @param[in]     reuse_data Boolean flag indicating data re-use
9408b919e6bSJeremy L Thompson 
9418b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9428b919e6bSJeremy L Thompson 
9438b919e6bSJeremy L Thompson   @ref Backend
9448b919e6bSJeremy L Thompson **/
9452b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) {
946beecbf24SJeremy L Thompson   data->reuse_data        = reuse_data;
947beecbf24SJeremy L Thompson   data->needs_data_update = true;
948beecbf24SJeremy L Thompson   return CEED_ERROR_SUCCESS;
949beecbf24SJeremy L Thompson }
950beecbf24SJeremy L Thompson 
951beecbf24SJeremy L Thompson /**
952beecbf24SJeremy L Thompson   @brief Mark QFunctionAssemblyData as stale
953beecbf24SJeremy L Thompson 
954ea61e9acSJeremy L Thompson   @param[in,out] data              CeedQFunctionAssemblyData to mark as stale
955ea61e9acSJeremy L Thompson   @param[in]     needs_data_update Boolean flag indicating if update is needed or completed
956beecbf24SJeremy L Thompson 
957beecbf24SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
958beecbf24SJeremy L Thompson 
959beecbf24SJeremy L Thompson   @ref Backend
960beecbf24SJeremy L Thompson **/
9612b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) {
962beecbf24SJeremy L Thompson   data->needs_data_update = needs_data_update;
9638b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9648b919e6bSJeremy L Thompson }
9658b919e6bSJeremy L Thompson 
9668b919e6bSJeremy L Thompson /**
9678b919e6bSJeremy L Thompson   @brief Determine if QFunctionAssemblyData needs update
9688b919e6bSJeremy L Thompson 
9698b919e6bSJeremy L Thompson   @param[in]  data             CeedQFunctionAssemblyData to mark as stale
9708b919e6bSJeremy L Thompson   @param[out] is_update_needed Boolean flag indicating if re-assembly is required
9718b919e6bSJeremy L Thompson 
9728b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9738b919e6bSJeremy L Thompson 
9748b919e6bSJeremy L Thompson   @ref Backend
9758b919e6bSJeremy L Thompson **/
9762b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) {
977beecbf24SJeremy L Thompson   *is_update_needed = !data->reuse_data || data->needs_data_update;
9788b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9798b919e6bSJeremy L Thompson }
9808b919e6bSJeremy L Thompson 
9818b919e6bSJeremy L Thompson /**
982ea61e9acSJeremy L Thompson   @brief Copy the pointer to a CeedQFunctionAssemblyData.
9834385fb7fSSebastian Grimberg 
984ea61e9acSJeremy L Thompson   Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`.
985512bb800SJeremy L Thompson 
986512bb800SJeremy L Thompson   Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a
987512bb800SJeremy L Thompson         CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this
988512bb800SJeremy L Thompson         CeedQFunctionAssemblyData.
989480fae85SJeremy L Thompson 
990ea61e9acSJeremy L Thompson   @param[in]     data      CeedQFunctionAssemblyData to copy reference to
991ea61e9acSJeremy L Thompson   @param[in,out] data_copy Variable to store copied reference
992480fae85SJeremy L Thompson 
993480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
994480fae85SJeremy L Thompson 
995480fae85SJeremy L Thompson   @ref Backend
996480fae85SJeremy L Thompson **/
9972b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) {
9982b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReference(data));
9992b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy));
1000480fae85SJeremy L Thompson   *data_copy = data;
1001480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1002480fae85SJeremy L Thompson }
1003480fae85SJeremy L Thompson 
1004480fae85SJeremy L Thompson /**
1005480fae85SJeremy L Thompson   @brief Get setup status for internal objects for CeedQFunctionAssemblyData
1006480fae85SJeremy L Thompson 
1007ea61e9acSJeremy L Thompson   @param[in]  data     CeedQFunctionAssemblyData to retrieve status
1008480fae85SJeremy L Thompson   @param[out] is_setup Boolean flag for setup status
1009480fae85SJeremy L Thompson 
1010480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1011480fae85SJeremy L Thompson 
1012480fae85SJeremy L Thompson   @ref Backend
1013480fae85SJeremy L Thompson **/
10142b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) {
1015480fae85SJeremy L Thompson   *is_setup = data->is_setup;
1016480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1017480fae85SJeremy L Thompson }
1018480fae85SJeremy L Thompson 
1019480fae85SJeremy L Thompson /**
1020480fae85SJeremy L Thompson   @brief Set internal objects for CeedQFunctionAssemblyData
1021480fae85SJeremy L Thompson 
1022ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to set objects
1023480fae85SJeremy L Thompson   @param[in]     vec  CeedVector to store assembled CeedQFunction at quadrature points
1024480fae85SJeremy L Thompson   @param[in]     rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction
1025480fae85SJeremy L Thompson 
1026480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1027480fae85SJeremy L Thompson 
1028480fae85SJeremy L Thompson   @ref Backend
1029480fae85SJeremy L Thompson **/
10302b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) {
10312b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(vec, &data->vec));
10322b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr));
1033480fae85SJeremy L Thompson 
1034480fae85SJeremy L Thompson   data->is_setup = true;
1035480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1036480fae85SJeremy L Thompson }
1037480fae85SJeremy L Thompson 
10382b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) {
10396574a04fSJeremy L Thompson   CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first.");
1040480fae85SJeremy L Thompson 
10412b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(data->vec, vec));
10422b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr));
1043480fae85SJeremy L Thompson 
1044480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1045480fae85SJeremy L Thompson }
1046480fae85SJeremy L Thompson 
1047480fae85SJeremy L Thompson /**
1048480fae85SJeremy L Thompson   @brief Destroy CeedQFunctionAssemblyData
1049480fae85SJeremy L Thompson 
1050ea61e9acSJeremy L Thompson   @param[in,out] data  CeedQFunctionAssemblyData to destroy
1051480fae85SJeremy L Thompson 
1052480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1053480fae85SJeremy L Thompson 
1054480fae85SJeremy L Thompson   @ref Backend
1055480fae85SJeremy L Thompson **/
1056480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) {
1057ad6481ceSJeremy L Thompson   if (!*data || --(*data)->ref_count > 0) {
1058ad6481ceSJeremy L Thompson     *data = NULL;
1059ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1060ad6481ceSJeremy L Thompson   }
10612b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
10622b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&(*data)->vec));
10632b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr));
1064480fae85SJeremy L Thompson 
10652b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1066480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1067480fae85SJeremy L Thompson }
1068480fae85SJeremy L Thompson 
1069ed9e99e6SJeremy L Thompson /**
1070ed9e99e6SJeremy L Thompson   @brief Get CeedOperatorAssemblyData
1071ed9e99e6SJeremy L Thompson 
1072ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to assemble
1073ed9e99e6SJeremy L Thompson   @param[out] data CeedQFunctionAssemblyData
1074ed9e99e6SJeremy L Thompson 
1075ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1076ed9e99e6SJeremy L Thompson 
1077ed9e99e6SJeremy L Thompson   @ref Backend
1078ed9e99e6SJeremy L Thompson **/
10792b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) {
1080ed9e99e6SJeremy L Thompson   if (!op->op_assembled) {
1081ed9e99e6SJeremy L Thompson     CeedOperatorAssemblyData data;
1082ed9e99e6SJeremy L Thompson 
10832b730f8bSJeremy L Thompson     CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data));
1084ed9e99e6SJeremy L Thompson     op->op_assembled = data;
1085ed9e99e6SJeremy L Thompson   }
1086ed9e99e6SJeremy L Thompson   *data = op->op_assembled;
1087ed9e99e6SJeremy L Thompson 
1088ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1089ed9e99e6SJeremy L Thompson }
1090ed9e99e6SJeremy L Thompson 
1091ed9e99e6SJeremy L Thompson /**
1092ba746a46SJeremy L Thompson   @brief Create object holding CeedOperator assembly data.
1093ba746a46SJeremy L Thompson 
1094ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator.
1095ba746a46SJeremy L Thompson   An array with references to the corresponding active CeedElemRestrictions is also stored.
1096ba746a46SJeremy L Thompson   For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis.
1097ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each
1098ba746a46SJeremy L Thompson CeedEvalMode.
1099ba746a46SJeremy L Thompson   The number of input columns across all active bases for the assembled CeedQFunction is also stored.
1100ba746a46SJeremy L Thompson   Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes.
1101ed9e99e6SJeremy L Thompson 
1102ea61e9acSJeremy L Thompson   @param[in]  ceed Ceed object where the CeedOperatorAssemblyData will be created
1103ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to be assembled
1104ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored
1105ed9e99e6SJeremy L Thompson 
1106ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1107ed9e99e6SJeremy L Thompson 
1108ed9e99e6SJeremy L Thompson   @ref Backend
1109ed9e99e6SJeremy L Thompson **/
11102b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) {
1111437c7c90SJeremy L Thompson   CeedInt num_active_bases = 0;
1112437c7c90SJeremy L Thompson 
1113437c7c90SJeremy L Thompson   // Allocate
11142b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1115ed9e99e6SJeremy L Thompson   (*data)->ceed = ceed;
11162b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1117ed9e99e6SJeremy L Thompson 
1118ed9e99e6SJeremy L Thompson   // Build OperatorAssembly data
1119ed9e99e6SJeremy L Thompson   CeedQFunction       qf;
1120ed9e99e6SJeremy L Thompson   CeedQFunctionField *qf_fields;
1121ed9e99e6SJeremy L Thompson   CeedOperatorField  *op_fields;
1122ed9e99e6SJeremy L Thompson   CeedInt             num_input_fields;
11232b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
11242b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL));
11252b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL));
1126ed9e99e6SJeremy L Thompson 
1127ed9e99e6SJeremy L Thompson   // Determine active input basis
1128437c7c90SJeremy L Thompson   CeedInt       *num_eval_modes_in = NULL, *num_eval_modes_out = NULL, offset = 0;
1129437c7c90SJeremy L Thompson   CeedEvalMode **eval_modes_in = NULL, **eval_modes_out = NULL;
1130437c7c90SJeremy L Thompson   CeedSize     **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL;
1131ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
1132ed9e99e6SJeremy L Thompson     CeedVector vec;
11332b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1134ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
1135437c7c90SJeremy L Thompson       CeedBasis    basis_in = NULL;
1136437c7c90SJeremy L Thompson       CeedEvalMode eval_mode;
1137352a5e7cSSebastian Grimberg       CeedInt      index = -1, dim, num_comp, q_comp;
11382b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in));
11392b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1140352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetDimension(basis_in, &dim));
1141352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp));
1142352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp));
1143437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < num_active_bases; i++) {
1144437c7c90SJeremy L Thompson         if ((*data)->active_bases[i] == basis_in) index = i;
1145437c7c90SJeremy L Thompson       }
1146437c7c90SJeremy L Thompson       if (index == -1) {
1147437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_in;
1148437c7c90SJeremy L Thompson         index = num_active_bases;
1149437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases));
1150437c7c90SJeremy L Thompson         (*data)->active_bases[num_active_bases] = NULL;
1151437c7c90SJeremy L Thompson         CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases[num_active_bases]));
1152437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs));
1153437c7c90SJeremy L Thompson         (*data)->active_elem_rstrs[num_active_bases] = NULL;
1154437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in));
1155437c7c90SJeremy L Thompson         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs[num_active_bases]));
1156437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in));
1157437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out));
1158437c7c90SJeremy L Thompson         num_eval_modes_in[index]  = 0;
1159437c7c90SJeremy L Thompson         num_eval_modes_out[index] = 0;
1160437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in));
1161437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out));
1162437c7c90SJeremy L Thompson         eval_modes_in[index]  = NULL;
1163437c7c90SJeremy L Thompson         eval_modes_out[index] = NULL;
1164437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in));
1165437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out));
1166437c7c90SJeremy L Thompson         eval_mode_offsets_in[index]  = NULL;
1167437c7c90SJeremy L Thompson         eval_mode_offsets_out[index] = NULL;
1168437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in));
1169437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out));
1170437c7c90SJeremy L Thompson         (*data)->assembled_bases_in[index]  = NULL;
1171437c7c90SJeremy L Thompson         (*data)->assembled_bases_out[index] = NULL;
1172437c7c90SJeremy L Thompson         num_active_bases++;
1173437c7c90SJeremy L Thompson       }
1174352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1175352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1176352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index]));
1177352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index]));
1178352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1179437c7c90SJeremy L Thompson           eval_modes_in[index][num_eval_modes_in[index] + d]        = eval_mode;
1180437c7c90SJeremy L Thompson           eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset;
1181352a5e7cSSebastian Grimberg           offset += num_comp;
1182ed9e99e6SJeremy L Thompson         }
1183352a5e7cSSebastian Grimberg         num_eval_modes_in[index] += q_comp;
1184ed9e99e6SJeremy L Thompson       }
1185ed9e99e6SJeremy L Thompson     }
1186ed9e99e6SJeremy L Thompson   }
1187437c7c90SJeremy L Thompson   (*data)->num_eval_modes_in    = num_eval_modes_in;
1188437c7c90SJeremy L Thompson   (*data)->eval_modes_in        = eval_modes_in;
1189437c7c90SJeremy L Thompson   (*data)->eval_mode_offsets_in = eval_mode_offsets_in;
1190ed9e99e6SJeremy L Thompson 
1191ed9e99e6SJeremy L Thompson   // Determine active output basis
1192ed9e99e6SJeremy L Thompson   CeedInt num_output_fields;
11932b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields));
11942b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields));
1195437c7c90SJeremy L Thompson   offset = 0;
1196ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_output_fields; i++) {
1197ed9e99e6SJeremy L Thompson     CeedVector vec;
11982b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1199ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
1200437c7c90SJeremy L Thompson       CeedBasis    basis_out = NULL;
1201ed9e99e6SJeremy L Thompson       CeedEvalMode eval_mode;
1202352a5e7cSSebastian Grimberg       CeedInt      index = -1, dim, num_comp, q_comp;
1203437c7c90SJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out));
12042b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1205352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetDimension(basis_out, &dim));
1206352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp));
1207352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp));
1208437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < num_active_bases; i++) {
1209437c7c90SJeremy L Thompson         if ((*data)->active_bases[i] == basis_out) index = i;
1210437c7c90SJeremy L Thompson       }
1211437c7c90SJeremy L Thompson       if (index == -1) {
1212437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_out;
1213437c7c90SJeremy L Thompson 
1214437c7c90SJeremy L Thompson         index = num_active_bases;
1215437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_bases));
1216437c7c90SJeremy L Thompson         (*data)->active_bases[num_active_bases] = NULL;
1217437c7c90SJeremy L Thompson         CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases[num_active_bases]));
1218437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->active_elem_rstrs));
1219437c7c90SJeremy L Thompson         (*data)->active_elem_rstrs[num_active_bases] = NULL;
1220437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out));
1221437c7c90SJeremy L Thompson         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs[num_active_bases]));
1222437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_in));
1223437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &num_eval_modes_out));
1224437c7c90SJeremy L Thompson         num_eval_modes_in[index]  = 0;
1225437c7c90SJeremy L Thompson         num_eval_modes_out[index] = 0;
1226437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_in));
1227437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_modes_out));
1228437c7c90SJeremy L Thompson         eval_modes_in[index]  = NULL;
1229437c7c90SJeremy L Thompson         eval_modes_out[index] = NULL;
1230437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_in));
1231437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &eval_mode_offsets_out));
1232437c7c90SJeremy L Thompson         eval_mode_offsets_in[index]  = NULL;
1233437c7c90SJeremy L Thompson         eval_mode_offsets_out[index] = NULL;
1234437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_in));
1235437c7c90SJeremy L Thompson         CeedCall(CeedRealloc(num_active_bases + 1, &(*data)->assembled_bases_out));
1236437c7c90SJeremy L Thompson         (*data)->assembled_bases_in[index]  = NULL;
1237437c7c90SJeremy L Thompson         (*data)->assembled_bases_out[index] = NULL;
1238437c7c90SJeremy L Thompson         num_active_bases++;
1239437c7c90SJeremy L Thompson       }
1240352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1241352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1242352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index]));
1243352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index]));
1244352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1245437c7c90SJeremy L Thompson           eval_modes_out[index][num_eval_modes_out[index] + d]        = eval_mode;
1246437c7c90SJeremy L Thompson           eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset;
1247352a5e7cSSebastian Grimberg           offset += num_comp;
1248ed9e99e6SJeremy L Thompson         }
1249352a5e7cSSebastian Grimberg         num_eval_modes_out[index] += q_comp;
1250ed9e99e6SJeremy L Thompson       }
1251ed9e99e6SJeremy L Thompson     }
1252ed9e99e6SJeremy L Thompson   }
1253437c7c90SJeremy L Thompson   (*data)->num_output_components = offset;
1254437c7c90SJeremy L Thompson   (*data)->num_eval_modes_out    = num_eval_modes_out;
1255437c7c90SJeremy L Thompson   (*data)->eval_modes_out        = eval_modes_out;
1256437c7c90SJeremy L Thompson   (*data)->eval_mode_offsets_out = eval_mode_offsets_out;
1257437c7c90SJeremy L Thompson   (*data)->num_active_bases      = num_active_bases;
1258ed9e99e6SJeremy L Thompson 
1259ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1260ed9e99e6SJeremy L Thompson }
1261ed9e99e6SJeremy L Thompson 
1262ed9e99e6SJeremy L Thompson /**
1263ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedEvalModes for assembly.
1264ba746a46SJeremy L Thompson 
1265ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1266ed9e99e6SJeremy L Thompson 
1267ed9e99e6SJeremy L Thompson   @param[in]  data                  CeedOperatorAssemblyData
1268ba746a46SJeremy L Thompson   @param[out] num_active_bases      Total number of active bases
1269c5d0f995SJed Brown   @param[out] num_eval_modes_in     Pointer to hold array of numbers of input CeedEvalModes, or NULL.
1270ba746a46SJeremy L Thompson                                       `eval_modes_in[0]` holds an array of eval modes for the first active basis.
1271c5d0f995SJed Brown   @param[out] eval_modes_in         Pointer to hold arrays of input CeedEvalModes, or NULL.
1272ba746a46SJeremy L Thompson   @param[out] eval_mode_offsets_in  Pointer to hold arrays of input offsets at each quadrature point.
1273c5d0f995SJed Brown   @param[out] num_eval_modes_out    Pointer to hold array of numbers of output CeedEvalModes, or NULL
1274c5d0f995SJed Brown   @param[out] eval_modes_out        Pointer to hold arrays of output CeedEvalModes, or NULL.
1275437c7c90SJeremy L Thompson   @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point
1276ba746a46SJeremy L Thompson   @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point,
1277ba746a46SJeremy L Thompson                                       including contributions of all active bases
1278ed9e99e6SJeremy L Thompson 
1279ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1280ed9e99e6SJeremy L Thompson 
1281c5d0f995SJed Brown 
1282ed9e99e6SJeremy L Thompson   @ref Backend
1283ed9e99e6SJeremy L Thompson **/
1284437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedInt **num_eval_modes_in,
1285437c7c90SJeremy L Thompson                                          const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt **num_eval_modes_out,
1286437c7c90SJeremy L Thompson                                          const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out, CeedSize *num_output_components) {
1287437c7c90SJeremy L Thompson   if (num_active_bases) *num_active_bases = data->num_active_bases;
1288437c7c90SJeremy L Thompson   if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in;
1289437c7c90SJeremy L Thompson   if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in;
1290437c7c90SJeremy L Thompson   if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in;
1291437c7c90SJeremy L Thompson   if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out;
1292437c7c90SJeremy L Thompson   if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out;
1293437c7c90SJeremy L Thompson   if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out;
1294437c7c90SJeremy L Thompson   if (num_output_components) *num_output_components = data->num_output_components;
1295ed9e99e6SJeremy L Thompson 
1296ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1297ed9e99e6SJeremy L Thompson }
1298ed9e99e6SJeremy L Thompson 
1299ed9e99e6SJeremy L Thompson /**
1300ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1301ba746a46SJeremy L Thompson 
1302ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1303ed9e99e6SJeremy L Thompson 
1304ed9e99e6SJeremy L Thompson   @param[in]  data                CeedOperatorAssemblyData
1305437c7c90SJeremy L Thompson   @param[out] num_active_bases    Number of active bases, or NULL
1306437c7c90SJeremy L Thompson   @param[out] active_bases        Pointer to hold active CeedBasis, or NULL
1307437c7c90SJeremy L Thompson   @param[out] assembled_bases_in  Pointer to hold assembled active input B, or NULL
1308437c7c90SJeremy L Thompson   @param[out] assembled_bases_out Pointer to hold assembled active output B, or NULL
1309ed9e99e6SJeremy L Thompson 
1310ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1311ed9e99e6SJeremy L Thompson 
1312ed9e99e6SJeremy L Thompson   @ref Backend
1313ed9e99e6SJeremy L Thompson **/
1314437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases, CeedBasis **active_bases,
1315437c7c90SJeremy L Thompson                                      const CeedScalar ***assembled_bases_in, const CeedScalar ***assembled_bases_out) {
1316ed9e99e6SJeremy L Thompson   // Assemble B_in, B_out if needed
1317437c7c90SJeremy L Thompson   if (assembled_bases_in && !data->assembled_bases_in[0]) {
1318437c7c90SJeremy L Thompson     CeedInt num_qpts;
1319437c7c90SJeremy L Thompson 
1320437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts));
1321437c7c90SJeremy L Thompson     for (CeedInt b = 0; b < data->num_active_bases; b++) {
1322352a5e7cSSebastian Grimberg       CeedInt     num_nodes;
1323437c7c90SJeremy L Thompson       CeedScalar *B_in = NULL, *identity = NULL;
1324ed9e99e6SJeremy L Thompson       bool        has_eval_none = false;
1325ed9e99e6SJeremy L Thompson 
1326352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes));
1327352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in));
1328ed9e99e6SJeremy L Thompson 
1329437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) {
1330437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE);
1331ed9e99e6SJeremy L Thompson       }
1332ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1333352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1334352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1335352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1336ed9e99e6SJeremy L Thompson         }
1337ed9e99e6SJeremy L Thompson       }
1338ed9e99e6SJeremy L Thompson 
1339ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1340352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1341352a5e7cSSebastian Grimberg           CeedInt      d_in              = 0, q_comp_in;
1342352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE;
1343437c7c90SJeremy L Thompson           for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) {
1344437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_in[b] * q;
1345437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
1346352a5e7cSSebastian Grimberg             CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_in[b][e_in], identity, &B);
1347352a5e7cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_in[b][e_in], &q_comp_in));
1348352a5e7cSSebastian Grimberg             if (q_comp_in > 1) {
1349352a5e7cSSebastian Grimberg               if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
1350352a5e7cSSebastian Grimberg               else B = &B[(++d_in) * num_qpts * num_nodes];
1351352a5e7cSSebastian Grimberg             }
1352352a5e7cSSebastian Grimberg             eval_mode_in_prev                 = data->eval_modes_in[b][e_in];
1353352a5e7cSSebastian Grimberg             B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n];
1354ed9e99e6SJeremy L Thompson           }
1355ed9e99e6SJeremy L Thompson         }
1356ed9e99e6SJeremy L Thompson       }
1357437c7c90SJeremy L Thompson       if (identity) CeedCall(CeedFree(identity));
1358437c7c90SJeremy L Thompson       data->assembled_bases_in[b] = B_in;
1359437c7c90SJeremy L Thompson     }
1360ed9e99e6SJeremy L Thompson   }
1361ed9e99e6SJeremy L Thompson 
1362437c7c90SJeremy L Thompson   if (assembled_bases_out && !data->assembled_bases_out[0]) {
1363437c7c90SJeremy L Thompson     CeedInt num_qpts;
1364437c7c90SJeremy L Thompson 
1365437c7c90SJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases[0], &num_qpts));
1366437c7c90SJeremy L Thompson     for (CeedInt b = 0; b < data->num_active_bases; b++) {
1367352a5e7cSSebastian Grimberg       CeedInt     num_nodes;
1368ed9e99e6SJeremy L Thompson       bool        has_eval_none = false;
1369437c7c90SJeremy L Thompson       CeedScalar *B_out = NULL, *identity = NULL;
1370ed9e99e6SJeremy L Thompson 
1371352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumNodes(data->active_bases[b], &num_nodes));
1372352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out));
1373ed9e99e6SJeremy L Thompson 
1374437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) {
1375437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE);
1376ed9e99e6SJeremy L Thompson       }
1377ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1378352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1379352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1380352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1381ed9e99e6SJeremy L Thompson         }
1382ed9e99e6SJeremy L Thompson       }
1383ed9e99e6SJeremy L Thompson 
1384ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1385352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1386352a5e7cSSebastian Grimberg           CeedInt      d_out              = 0, q_comp_out;
1387352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
1388437c7c90SJeremy L Thompson           for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) {
1389437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_out[b] * q;
1390437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
1391352a5e7cSSebastian Grimberg             CeedOperatorGetBasisPointer(data->active_bases[b], data->eval_modes_out[b][e_out], identity, &B);
1392352a5e7cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases[b], data->eval_modes_out[b][e_out], &q_comp_out));
1393352a5e7cSSebastian Grimberg             if (q_comp_out > 1) {
1394352a5e7cSSebastian Grimberg               if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
1395352a5e7cSSebastian Grimberg               else B = &B[(++d_out) * num_qpts * num_nodes];
1396352a5e7cSSebastian Grimberg             }
1397352a5e7cSSebastian Grimberg             eval_mode_out_prev                  = data->eval_modes_out[b][e_out];
1398352a5e7cSSebastian Grimberg             B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n];
1399ed9e99e6SJeremy L Thompson           }
1400ed9e99e6SJeremy L Thompson         }
1401ed9e99e6SJeremy L Thompson       }
1402437c7c90SJeremy L Thompson       if (identity) CeedCall(CeedFree(identity));
1403437c7c90SJeremy L Thompson       data->assembled_bases_out[b] = B_out;
1404437c7c90SJeremy L Thompson     }
1405ed9e99e6SJeremy L Thompson   }
1406ed9e99e6SJeremy L Thompson 
1407437c7c90SJeremy L Thompson   // Pass out assembled data
1408437c7c90SJeremy L Thompson   if (active_bases) *active_bases = data->active_bases;
1409437c7c90SJeremy L Thompson   if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in;
1410437c7c90SJeremy L Thompson   if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out;
1411437c7c90SJeremy L Thompson 
1412437c7c90SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1413437c7c90SJeremy L Thompson }
1414437c7c90SJeremy L Thompson 
1415437c7c90SJeremy L Thompson /**
1416ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1417ba746a46SJeremy L Thompson 
1418ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1419437c7c90SJeremy L Thompson 
1420437c7c90SJeremy L Thompson   @param[in]  data                  CeedOperatorAssemblyData
1421437c7c90SJeremy L Thompson   @param[out] num_active_elem_rstrs Number of active element restrictions, or NULL
1422437c7c90SJeremy L Thompson   @param[out] active_elem_rstrs     Pointer to hold active CeedElemRestrictions, or NULL
1423437c7c90SJeremy L Thompson 
1424437c7c90SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1425437c7c90SJeremy L Thompson 
1426437c7c90SJeremy L Thompson   @ref Backend
1427437c7c90SJeremy L Thompson **/
1428437c7c90SJeremy L Thompson int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs,
1429437c7c90SJeremy L Thompson                                                 CeedElemRestriction **active_elem_rstrs) {
1430437c7c90SJeremy L Thompson   if (num_active_elem_rstrs) *num_active_elem_rstrs = data->num_active_bases;
1431437c7c90SJeremy L Thompson   if (active_elem_rstrs) *active_elem_rstrs = data->active_elem_rstrs;
1432ed9e99e6SJeremy L Thompson 
1433ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1434ed9e99e6SJeremy L Thompson }
1435ed9e99e6SJeremy L Thompson 
1436ed9e99e6SJeremy L Thompson /**
1437ed9e99e6SJeremy L Thompson   @brief Destroy CeedOperatorAssemblyData
1438ed9e99e6SJeremy L Thompson 
1439ea61e9acSJeremy L Thompson   @param[in,out] data CeedOperatorAssemblyData to destroy
1440ed9e99e6SJeremy L Thompson 
1441ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1442ed9e99e6SJeremy L Thompson 
1443ed9e99e6SJeremy L Thompson   @ref Backend
1444ed9e99e6SJeremy L Thompson **/
1445ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) {
1446ad6481ceSJeremy L Thompson   if (!*data) {
1447ad6481ceSJeremy L Thompson     *data = NULL;
1448ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1449ad6481ceSJeremy L Thompson   }
14502b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
1451437c7c90SJeremy L Thompson   for (CeedInt b = 0; b < (*data)->num_active_bases; b++) {
1452437c7c90SJeremy L Thompson     CeedCall(CeedBasisDestroy(&(*data)->active_bases[b]));
1453437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs[b]));
1454437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_modes_in[b]));
1455437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_modes_out[b]));
1456437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b]));
1457437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b]));
1458437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_in[b]));
1459437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_out[b]));
1460437c7c90SJeremy L Thompson   }
1461437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->active_bases));
1462437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->active_elem_rstrs));
1463437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_in));
1464437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_out));
1465437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_in));
1466437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_out));
1467437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_in));
1468437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_out));
1469437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_in));
1470437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_out));
1471ed9e99e6SJeremy L Thompson 
14722b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1473ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1474ed9e99e6SJeremy L Thompson }
1475ed9e99e6SJeremy L Thompson 
1476480fae85SJeremy L Thompson /// @}
1477480fae85SJeremy L Thompson 
1478480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1479eaf62fffSJeremy L Thompson /// CeedOperator Public API
1480eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1481eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser
1482eaf62fffSJeremy L Thompson /// @{
1483eaf62fffSJeremy L Thompson 
1484eaf62fffSJeremy L Thompson /**
1485eaf62fffSJeremy L Thompson   @brief Assemble a linear CeedQFunction associated with a CeedOperator
1486eaf62fffSJeremy L Thompson 
1487ea61e9acSJeremy L Thompson   This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator.
1488859c15bbSJames Wright   The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices
1489859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element.
1490859c15bbSJames Wright 
14919fd66db6SSebastian Grimberg   Inputs and outputs are in the order provided by the user when adding CeedOperator fields.
14929fd66db6SSebastian Grimberg   For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction
14939fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v].
1494eaf62fffSJeremy L Thompson 
1495ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1496f04ea552SJeremy L Thompson 
1497ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1498ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1499ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
1500ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1501eaf62fffSJeremy L Thompson 
1502eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1503eaf62fffSJeremy L Thompson 
1504eaf62fffSJeremy L Thompson   @ref User
1505eaf62fffSJeremy L Thompson **/
15062b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
15072b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1508eaf62fffSJeremy L Thompson 
1509eaf62fffSJeremy L Thompson   if (op->LinearAssembleQFunction) {
1510d04bbc78SJeremy L Thompson     // Backend version
15112b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request));
1512eaf62fffSJeremy L Thompson   } else {
1513d04bbc78SJeremy L Thompson     // Operator fallback
1514d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1515d04bbc78SJeremy L Thompson 
15162b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
15176574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request));
15186574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction");
151970a7ffb3SJeremy L Thompson   }
1520eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1521eaf62fffSJeremy L Thompson }
152270a7ffb3SJeremy L Thompson 
152370a7ffb3SJeremy L Thompson /**
1524ea61e9acSJeremy L Thompson   @brief Assemble CeedQFunction and store result internally.
15254385fb7fSSebastian Grimberg 
1526ea61e9acSJeremy L Thompson   Return copied references of stored data to the caller.
1527ea61e9acSJeremy L Thompson   Caller is responsible for ownership and destruction of the copied references.
1528ea61e9acSJeremy L Thompson   See also @ref CeedOperatorLinearAssembleQFunction
152970a7ffb3SJeremy L Thompson 
1530c5f45aeaSJeremy L Thompson   Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers.
1531c5f45aeaSJeremy L Thompson         These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object.
1532c5f45aeaSJeremy L Thompson 
1533ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1534ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1535ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembledCeedQFunction
1536ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
153770a7ffb3SJeremy L Thompson 
153870a7ffb3SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
153970a7ffb3SJeremy L Thompson 
154070a7ffb3SJeremy L Thompson   @ref User
154170a7ffb3SJeremy L Thompson **/
15422b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
1543*b05f7e9fSJeremy L Thompson   int (*LinearAssembleQFunctionUpdate)(CeedOperator, CeedVector, CeedElemRestriction, CeedRequest *) = NULL;
1544*b05f7e9fSJeremy L Thompson   CeedOperator op_assemble                                                                           = NULL;
1545*b05f7e9fSJeremy L Thompson 
15462b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
154770a7ffb3SJeremy L Thompson 
1548*b05f7e9fSJeremy L Thompson   // Determine if fallback parent or operator has implementation
1549*b05f7e9fSJeremy L Thompson   if (op->op_fallback_parent && op->op_fallback_parent->LinearAssembleQFunctionUpdate) {
1550*b05f7e9fSJeremy L Thompson     // -- Backend version for op fallback parent is faster, if it exists
1551*b05f7e9fSJeremy L Thompson     LinearAssembleQFunctionUpdate = op->op_fallback_parent->LinearAssembleQFunctionUpdate;
1552*b05f7e9fSJeremy L Thompson     op_assemble                   = op->op_fallback_parent;
1553*b05f7e9fSJeremy L Thompson   } else if (op->LinearAssembleQFunctionUpdate) {
1554*b05f7e9fSJeremy L Thompson     // -- Backend version for op
1555*b05f7e9fSJeremy L Thompson     LinearAssembleQFunctionUpdate = op->LinearAssembleQFunctionUpdate;
1556*b05f7e9fSJeremy L Thompson     op_assemble                   = op;
1557*b05f7e9fSJeremy L Thompson   }
1558*b05f7e9fSJeremy L Thompson 
1559*b05f7e9fSJeremy L Thompson   // Assemble QFunction
1560*b05f7e9fSJeremy L Thompson   if (LinearAssembleQFunctionUpdate) {
1561*b05f7e9fSJeremy L Thompson     // Backend or fallback parent version
1562480fae85SJeremy L Thompson     bool                qf_assembled_is_setup;
15632efa2d85SJeremy L Thompson     CeedVector          assembled_vec  = NULL;
15642efa2d85SJeremy L Thompson     CeedElemRestriction assembled_rstr = NULL;
1565480fae85SJeremy L Thompson 
15662b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup));
1567480fae85SJeremy L Thompson     if (qf_assembled_is_setup) {
1568d04bbc78SJeremy L Thompson       bool update_needed;
1569d04bbc78SJeremy L Thompson 
15702b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr));
15712b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed));
1572*b05f7e9fSJeremy L Thompson       if (update_needed) CeedCall(LinearAssembleQFunctionUpdate(op_assemble, assembled_vec, assembled_rstr, request));
157370a7ffb3SJeremy L Thompson     } else {
1574*b05f7e9fSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunction(op_assemble, &assembled_vec, &assembled_rstr, request));
15752b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr));
157670a7ffb3SJeremy L Thompson     }
15772b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false));
15782efa2d85SJeremy L Thompson 
1579d04bbc78SJeremy L Thompson     // Copy reference from internally held copy
15802b730f8bSJeremy L Thompson     CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled));
15812b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr));
1582c5f45aeaSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled_vec));
15832b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&assembled_rstr));
158470a7ffb3SJeremy L Thompson   } else {
1585d04bbc78SJeremy L Thompson     // Operator fallback
1586d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1587d04bbc78SJeremy L Thompson 
15882b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
15896574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request));
15906574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate");
159170a7ffb3SJeremy L Thompson   }
159270a7ffb3SJeremy L Thompson 
159370a7ffb3SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1594eaf62fffSJeremy L Thompson }
1595eaf62fffSJeremy L Thompson 
1596eaf62fffSJeremy L Thompson /**
1597eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1598eaf62fffSJeremy L Thompson 
1599eaf62fffSJeremy L Thompson   This overwrites a CeedVector with the diagonal of a linear CeedOperator.
1600eaf62fffSJeremy L Thompson 
1601ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1602eaf62fffSJeremy L Thompson 
1603ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1604f04ea552SJeremy L Thompson 
1605ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1606eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1607ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1608eaf62fffSJeremy L Thompson 
1609eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1610eaf62fffSJeremy L Thompson 
1611eaf62fffSJeremy L Thompson   @ref User
1612eaf62fffSJeremy L Thompson **/
16132b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1614f3d47e36SJeremy L Thompson   bool is_composite;
16152b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1616f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1617eaf62fffSJeremy L Thompson 
1618c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16192b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16206574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1621c9366a6bSJeremy L Thompson 
1622f3d47e36SJeremy L Thompson   // Early exit for empty operator
1623f3d47e36SJeremy L Thompson   if (!is_composite) {
1624f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1625f3d47e36SJeremy L Thompson 
1626f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1627f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1628f3d47e36SJeremy L Thompson   }
1629f3d47e36SJeremy L Thompson 
1630eaf62fffSJeremy L Thompson   if (op->LinearAssembleDiagonal) {
1631d04bbc78SJeremy L Thompson     // Backend version
16322b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleDiagonal(op, assembled, request));
1633eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1634eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddDiagonal) {
1635d04bbc78SJeremy L Thompson     // Backend version with zeroing first
16362b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
16372b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1638eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1639eaf62fffSJeremy L Thompson   } else {
1640d04bbc78SJeremy L Thompson     // Operator fallback
1641d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1642d04bbc78SJeremy L Thompson 
16432b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1644d04bbc78SJeremy L Thompson     if (op_fallback) {
16452b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request));
1646eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1647eaf62fffSJeremy L Thompson     }
1648eaf62fffSJeremy L Thompson   }
1649eaf62fffSJeremy L Thompson   // Default interface implementation
16502b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
16512b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request));
1652d04bbc78SJeremy L Thompson 
1653eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1654eaf62fffSJeremy L Thompson }
1655eaf62fffSJeremy L Thompson 
1656eaf62fffSJeremy L Thompson /**
1657eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1658eaf62fffSJeremy L Thompson 
1659eaf62fffSJeremy L Thompson   This sums into a CeedVector the diagonal of a linear CeedOperator.
1660eaf62fffSJeremy L Thompson 
1661ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1662eaf62fffSJeremy L Thompson 
1663ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1664f04ea552SJeremy L Thompson 
1665ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1666eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1667ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1668eaf62fffSJeremy L Thompson 
1669eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1670eaf62fffSJeremy L Thompson 
1671eaf62fffSJeremy L Thompson   @ref User
1672eaf62fffSJeremy L Thompson **/
16732b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1674f3d47e36SJeremy L Thompson   bool is_composite;
16752b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1676f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1677eaf62fffSJeremy L Thompson 
1678c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16792b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16806574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1681c9366a6bSJeremy L Thompson 
1682f3d47e36SJeremy L Thompson   // Early exit for empty operator
1683f3d47e36SJeremy L Thompson   if (!is_composite) {
1684f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1685f3d47e36SJeremy L Thompson 
1686f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1687f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1688f3d47e36SJeremy L Thompson   }
1689f3d47e36SJeremy L Thompson 
1690eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddDiagonal) {
1691d04bbc78SJeremy L Thompson     // Backend version
16922b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1693eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1694eaf62fffSJeremy L Thompson   } else {
1695d04bbc78SJeremy L Thompson     // Operator fallback
1696d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1697d04bbc78SJeremy L Thompson 
16982b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1699d04bbc78SJeremy L Thompson     if (op_fallback) {
17002b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request));
1701eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1702eaf62fffSJeremy L Thompson     }
1703eaf62fffSJeremy L Thompson   }
1704eaf62fffSJeremy L Thompson   // Default interface implementation
1705eaf62fffSJeremy L Thompson   if (is_composite) {
17062b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled));
1707eaf62fffSJeremy L Thompson   } else {
17082b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled));
1709eaf62fffSJeremy L Thompson   }
1710d04bbc78SJeremy L Thompson 
1711d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1712eaf62fffSJeremy L Thompson }
1713eaf62fffSJeremy L Thompson 
1714eaf62fffSJeremy L Thompson /**
1715eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1716eaf62fffSJeremy L Thompson 
1717ea61e9acSJeremy L Thompson   This overwrites a CeedVector with the point block diagonal of a linear CeedOperator.
1718eaf62fffSJeremy L Thompson 
1719ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1720eaf62fffSJeremy L Thompson 
1721ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1722f04ea552SJeremy L Thompson 
1723ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1724ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1725ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1726ea61e9acSJeremy L Thompson component in].
1727ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1728eaf62fffSJeremy L Thompson 
1729eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1730eaf62fffSJeremy L Thompson 
1731eaf62fffSJeremy L Thompson   @ref User
1732eaf62fffSJeremy L Thompson **/
17332b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1734f3d47e36SJeremy L Thompson   bool is_composite;
17352b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1736f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1737eaf62fffSJeremy L Thompson 
1738c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
17392b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
17406574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1741c9366a6bSJeremy L Thompson 
1742f3d47e36SJeremy L Thompson   // Early exit for empty operator
1743f3d47e36SJeremy L Thompson   if (!is_composite) {
1744f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1745f3d47e36SJeremy L Thompson 
1746f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1747f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1748f3d47e36SJeremy L Thompson   }
1749f3d47e36SJeremy L Thompson 
1750eaf62fffSJeremy L Thompson   if (op->LinearAssemblePointBlockDiagonal) {
1751d04bbc78SJeremy L Thompson     // Backend version
17522b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request));
1753eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1754eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddPointBlockDiagonal) {
1755d04bbc78SJeremy L Thompson     // Backend version with zeroing first
17562b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
17572b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1758eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1759eaf62fffSJeremy L Thompson   } else {
1760d04bbc78SJeremy L Thompson     // Operator fallback
1761d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1762d04bbc78SJeremy L Thompson 
17632b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1764d04bbc78SJeremy L Thompson     if (op_fallback) {
17652b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request));
1766eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1767eaf62fffSJeremy L Thompson     }
1768eaf62fffSJeremy L Thompson   }
1769eaf62fffSJeremy L Thompson   // Default interface implementation
17702b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
17712b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1772d04bbc78SJeremy L Thompson 
1773eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1774eaf62fffSJeremy L Thompson }
1775eaf62fffSJeremy L Thompson 
1776eaf62fffSJeremy L Thompson /**
1777eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1778eaf62fffSJeremy L Thompson 
1779ea61e9acSJeremy L Thompson   This sums into a CeedVector with the point block diagonal of a linear CeedOperator.
1780eaf62fffSJeremy L Thompson 
1781ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1782eaf62fffSJeremy L Thompson 
1783ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1784f04ea552SJeremy L Thompson 
1785ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1786ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1787ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1788ea61e9acSJeremy L Thompson component in].
1789ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1790eaf62fffSJeremy L Thompson 
1791eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1792eaf62fffSJeremy L Thompson 
1793eaf62fffSJeremy L Thompson   @ref User
1794eaf62fffSJeremy L Thompson **/
17952b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1796f3d47e36SJeremy L Thompson   bool is_composite;
17972b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1798f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1799eaf62fffSJeremy L Thompson 
1800c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
18012b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
18026574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1803c9366a6bSJeremy L Thompson 
1804f3d47e36SJeremy L Thompson   // Early exit for empty operator
1805f3d47e36SJeremy L Thompson   if (!is_composite) {
1806f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1807f3d47e36SJeremy L Thompson 
1808f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1809f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1810f3d47e36SJeremy L Thompson   }
1811f3d47e36SJeremy L Thompson 
1812eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddPointBlockDiagonal) {
1813d04bbc78SJeremy L Thompson     // Backend version
18142b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request));
1815eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1816eaf62fffSJeremy L Thompson   } else {
1817d04bbc78SJeremy L Thompson     // Operator fallback
1818d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1819d04bbc78SJeremy L Thompson 
18202b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1821d04bbc78SJeremy L Thompson     if (op_fallback) {
18222b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request));
1823eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1824eaf62fffSJeremy L Thompson     }
1825eaf62fffSJeremy L Thompson   }
1826ea61e9acSJeremy L Thompson   // Default interface implementation
1827eaf62fffSJeremy L Thompson   if (is_composite) {
18282b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled));
1829eaf62fffSJeremy L Thompson   } else {
18302b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled));
1831eaf62fffSJeremy L Thompson   }
1832d04bbc78SJeremy L Thompson 
1833d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1834eaf62fffSJeremy L Thompson }
1835eaf62fffSJeremy L Thompson 
1836eaf62fffSJeremy L Thompson /**
1837eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero pattern of a linear operator.
1838eaf62fffSJeremy L Thompson 
1839ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssemble().
1840eaf62fffSJeremy L Thompson 
1841ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
18429fd66db6SSebastian Grimberg matrix in entry (i, j).
18439fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
18449fd66db6SSebastian Grimberg   This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering.
1845eaf62fffSJeremy L Thompson 
1846eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1847eaf62fffSJeremy L Thompson 
1848ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1849f04ea552SJeremy L Thompson 
1850eaf62fffSJeremy L Thompson    @param[in]  op          CeedOperator to assemble
1851eaf62fffSJeremy L Thompson    @param[out] num_entries Number of entries in coordinate nonzero pattern
1852eaf62fffSJeremy L Thompson    @param[out] rows        Row number for each entry
1853eaf62fffSJeremy L Thompson    @param[out] cols        Column number for each entry
1854eaf62fffSJeremy L Thompson 
1855eaf62fffSJeremy L Thompson    @ref User
1856eaf62fffSJeremy L Thompson **/
18572b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
1858b94338b9SJed Brown   CeedInt       num_suboperators;
1859b94338b9SJed Brown   CeedSize      single_entries;
1860eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1861eaf62fffSJeremy L Thompson   bool          is_composite;
18622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1863f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1864eaf62fffSJeremy L Thompson 
1865eaf62fffSJeremy L Thompson   if (op->LinearAssembleSymbolic) {
1866d04bbc78SJeremy L Thompson     // Backend version
18672b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols));
1868eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1869eaf62fffSJeremy L Thompson   } else {
1870d04bbc78SJeremy L Thompson     // Operator fallback
1871d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1872d04bbc78SJeremy L Thompson 
18732b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1874d04bbc78SJeremy L Thompson     if (op_fallback) {
18752b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols));
1876eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1877eaf62fffSJeremy L Thompson     }
1878eaf62fffSJeremy L Thompson   }
1879eaf62fffSJeremy L Thompson 
1880eaf62fffSJeremy L Thompson   // Default interface implementation
1881eaf62fffSJeremy L Thompson 
1882eaf62fffSJeremy L Thompson   // count entries and allocate rows, cols arrays
1883eaf62fffSJeremy L Thompson   *num_entries = 0;
1884eaf62fffSJeremy L Thompson   if (is_composite) {
1885c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1886c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
188792ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
18882b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1889eaf62fffSJeremy L Thompson       *num_entries += single_entries;
1890eaf62fffSJeremy L Thompson     }
1891eaf62fffSJeremy L Thompson   } else {
18922b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries));
1893eaf62fffSJeremy L Thompson     *num_entries += single_entries;
1894eaf62fffSJeremy L Thompson   }
18952b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, rows));
18962b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, cols));
1897eaf62fffSJeremy L Thompson 
1898eaf62fffSJeremy L Thompson   // assemble nonzero locations
1899eaf62fffSJeremy L Thompson   CeedInt offset = 0;
1900eaf62fffSJeremy L Thompson   if (is_composite) {
1901c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1902c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
190392ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
19042b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols));
19052b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1906eaf62fffSJeremy L Thompson       offset += single_entries;
1907eaf62fffSJeremy L Thompson     }
1908eaf62fffSJeremy L Thompson   } else {
19092b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols));
1910eaf62fffSJeremy L Thompson   }
1911eaf62fffSJeremy L Thompson 
1912eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1913eaf62fffSJeremy L Thompson }
1914eaf62fffSJeremy L Thompson 
1915eaf62fffSJeremy L Thompson /**
1916eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero entries of a linear operator.
1917eaf62fffSJeremy L Thompson 
1918ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic().
1919eaf62fffSJeremy L Thompson 
1920ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
19219fd66db6SSebastian Grimberg matrix in entry (i, j).
19229fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
19239fd66db6SSebastian Grimberg   This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic()
1924eaf62fffSJeremy L Thompson 
1925eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1926eaf62fffSJeremy L Thompson 
1927ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1928f04ea552SJeremy L Thompson 
1929eaf62fffSJeremy L Thompson    @param[in]  op     CeedOperator to assemble
1930eaf62fffSJeremy L Thompson    @param[out] values Values to assemble into matrix
1931eaf62fffSJeremy L Thompson 
1932eaf62fffSJeremy L Thompson    @ref User
1933eaf62fffSJeremy L Thompson **/
1934eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) {
1935b94338b9SJed Brown   CeedInt       num_suboperators;
1936b94338b9SJed Brown   CeedSize      single_entries = 0;
1937eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1938f3d47e36SJeremy L Thompson   bool          is_composite;
19392b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1940f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1941f3d47e36SJeremy L Thompson 
1942f3d47e36SJeremy L Thompson   // Early exit for empty operator
1943f3d47e36SJeremy L Thompson   if (!is_composite) {
1944f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1945f3d47e36SJeremy L Thompson 
1946f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1947f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1948f3d47e36SJeremy L Thompson   }
1949eaf62fffSJeremy L Thompson 
1950eaf62fffSJeremy L Thompson   if (op->LinearAssemble) {
1951d04bbc78SJeremy L Thompson     // Backend version
19522b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemble(op, values));
1953eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1954eaf62fffSJeremy L Thompson   } else {
1955d04bbc78SJeremy L Thompson     // Operator fallback
1956d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1957d04bbc78SJeremy L Thompson 
19582b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1959d04bbc78SJeremy L Thompson     if (op_fallback) {
19602b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemble(op_fallback, values));
1961eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1962eaf62fffSJeremy L Thompson     }
1963eaf62fffSJeremy L Thompson   }
1964eaf62fffSJeremy L Thompson 
1965eaf62fffSJeremy L Thompson   // Default interface implementation
1966eaf62fffSJeremy L Thompson   CeedInt offset = 0;
196728ec399dSJeremy L Thompson   CeedCall(CeedVectorSetValue(values, 0.0));
1968eaf62fffSJeremy L Thompson   if (is_composite) {
1969c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1970c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
1971cefa2673SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; k++) {
19722b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values));
19732b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1974eaf62fffSJeremy L Thompson       offset += single_entries;
1975eaf62fffSJeremy L Thompson     }
1976eaf62fffSJeremy L Thompson   } else {
19772b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemble(op, offset, values));
1978eaf62fffSJeremy L Thompson   }
1979eaf62fffSJeremy L Thompson 
1980eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1981eaf62fffSJeremy L Thompson }
1982eaf62fffSJeremy L Thompson 
1983eaf62fffSJeremy L Thompson /**
198475f0d5a4SJeremy L Thompson   @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator
198575f0d5a4SJeremy L Thompson 
198675f0d5a4SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
198775f0d5a4SJeremy L Thompson 
198875f0d5a4SJeremy L Thompson   @param[in]  op               Composite CeedOperator
198975f0d5a4SJeremy L Thompson   @param[in]  num_skip_indices Number of suboperators to skip
199075f0d5a4SJeremy L Thompson   @param[in]  skip_indices     Array of indices of suboperators to skip
199175f0d5a4SJeremy L Thompson   @param[out] mult             Vector to store multiplicity (of size l_size)
199275f0d5a4SJeremy L Thompson 
199375f0d5a4SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
199475f0d5a4SJeremy L Thompson 
199575f0d5a4SJeremy L Thompson   @ref User
199675f0d5a4SJeremy L Thompson **/
199775f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) {
199875f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
199975f0d5a4SJeremy L Thompson 
200075f0d5a4SJeremy L Thompson   Ceed                ceed;
2001b275c451SJeremy L Thompson   CeedInt             num_suboperators;
200275f0d5a4SJeremy L Thompson   CeedSize            l_vec_len;
200375f0d5a4SJeremy L Thompson   CeedScalar         *mult_array;
200475f0d5a4SJeremy L Thompson   CeedVector          ones_l_vec;
2005437c7c90SJeremy L Thompson   CeedElemRestriction elem_rstr;
2006b275c451SJeremy L Thompson   CeedOperator       *sub_operators;
200775f0d5a4SJeremy L Thompson 
200875f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
200975f0d5a4SJeremy L Thompson 
201075f0d5a4SJeremy L Thompson   // Zero mult vector
201175f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(mult, 0.0));
201275f0d5a4SJeremy L Thompson 
201375f0d5a4SJeremy L Thompson   // Get suboperators
2014b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2015b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
2016b275c451SJeremy L Thompson   if (num_suboperators == 0) return CEED_ERROR_SUCCESS;
201775f0d5a4SJeremy L Thompson 
201875f0d5a4SJeremy L Thompson   // Work vector
201975f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetLength(mult, &l_vec_len));
202075f0d5a4SJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec));
202175f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(ones_l_vec, 1.0));
202275f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array));
202375f0d5a4SJeremy L Thompson 
202475f0d5a4SJeremy L Thompson   // Compute multiplicity across suboperators
2025b275c451SJeremy L Thompson   for (CeedInt i = 0; i < num_suboperators; i++) {
202675f0d5a4SJeremy L Thompson     const CeedScalar *sub_mult_array;
202775f0d5a4SJeremy L Thompson     CeedVector        sub_mult_l_vec, ones_e_vec;
202875f0d5a4SJeremy L Thompson 
202975f0d5a4SJeremy L Thompson     // -- Check for suboperator to skip
203075f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < num_skip_indices; j++) {
203175f0d5a4SJeremy L Thompson       if (skip_indices[j] == i) continue;
203275f0d5a4SJeremy L Thompson     }
203375f0d5a4SJeremy L Thompson 
203475f0d5a4SJeremy L Thompson     // -- Sub operator multiplicity
2035437c7c90SJeremy L Thompson     CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr));
2036437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(elem_rstr, &sub_mult_l_vec, &ones_e_vec));
203775f0d5a4SJeremy L Thompson     CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0));
2038437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE));
2039437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE));
204075f0d5a4SJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array));
204175f0d5a4SJeremy L Thompson     // ---- Flag every node present in the current suboperator
204275f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < l_vec_len; j++) {
204375f0d5a4SJeremy L Thompson       if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0;
204475f0d5a4SJeremy L Thompson     }
204575f0d5a4SJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array));
204675f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&sub_mult_l_vec));
204775f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&ones_e_vec));
204875f0d5a4SJeremy L Thompson   }
204975f0d5a4SJeremy L Thompson   CeedCall(CeedVectorRestoreArray(mult, &mult_array));
2050811d0ccfSJeremy L Thompson   CeedCall(CeedVectorDestroy(&ones_l_vec));
205175f0d5a4SJeremy L Thompson 
205275f0d5a4SJeremy L Thompson   return CEED_ERROR_SUCCESS;
205375f0d5a4SJeremy L Thompson }
205475f0d5a4SJeremy L Thompson 
205575f0d5a4SJeremy L Thompson /**
2056ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse
2057ea61e9acSJeremy L Thompson grid interpolation
2058eaf62fffSJeremy L Thompson 
205958e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2060f04ea552SJeremy L Thompson 
2061eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
206285bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2063eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
2064eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
2065eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
206685bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
206785bb9dcfSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator, or NULL
2068eaf62fffSJeremy L Thompson 
2069eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2070eaf62fffSJeremy L Thompson 
2071eaf62fffSJeremy L Thompson   @ref User
2072eaf62fffSJeremy L Thompson **/
20732b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
20742b730f8bSJeremy L Thompson                                      CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
20752b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2076eaf62fffSJeremy L Thompson 
207783d6adf3SZach Atkins   // Build prolongation matrix, if required
207883d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
207983d6adf3SZach Atkins   if (op_prolong || op_restrict) {
208083d6adf3SZach Atkins     CeedBasis basis_fine;
20812b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
20822b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f));
208383d6adf3SZach Atkins   }
2084eaf62fffSJeremy L Thompson 
2085f113e5dcSJeremy L Thompson   // Core code
20862b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2087f113e5dcSJeremy L Thompson 
2088eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2089eaf62fffSJeremy L Thompson }
2090eaf62fffSJeremy L Thompson 
2091eaf62fffSJeremy L Thompson /**
2092ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis
2093eaf62fffSJeremy L Thompson 
209458e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2095f04ea552SJeremy L Thompson 
2096eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
209785bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2098eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2099eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
210085bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2101eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
210285bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
210385bb9dcfSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator, or NULL
2104eaf62fffSJeremy L Thompson 
2105eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2106eaf62fffSJeremy L Thompson 
2107eaf62fffSJeremy L Thompson   @ref User
2108eaf62fffSJeremy L Thompson **/
21092b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
21102b730f8bSJeremy L Thompson                                              const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
21112b730f8bSJeremy L Thompson                                              CeedOperator *op_restrict) {
21122b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2113eaf62fffSJeremy L Thompson   Ceed ceed;
21142b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2115eaf62fffSJeremy L Thompson 
2116eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
2117eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
21182b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
2119eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
21202b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
21212b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
21226574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2123eaf62fffSJeremy L Thompson 
212483d6adf3SZach Atkins   // Create coarse to fine basis, if required
212583d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
212683d6adf3SZach Atkins   if (op_prolong || op_restrict) {
212783d6adf3SZach Atkins     // Check if interpolation matrix is provided
21286574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
21296574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
2130eaf62fffSJeremy L Thompson     CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c;
21312b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
21322b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
21332b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f));
21342b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
21352b730f8bSJeremy L Thompson     P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c);
2136eaf62fffSJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
21372b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_ref));
21382b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_weight));
21392b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad));
21402b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
21412b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
21422b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
21432b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
214483d6adf3SZach Atkins   }
2145eaf62fffSJeremy L Thompson 
2146eaf62fffSJeremy L Thompson   // Core code
21472b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2148eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2149eaf62fffSJeremy L Thompson }
2150eaf62fffSJeremy L Thompson 
2151eaf62fffSJeremy L Thompson /**
2152ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector
2153eaf62fffSJeremy L Thompson 
215458e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2155f04ea552SJeremy L Thompson 
2156eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
215785bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2158eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2159eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
216085bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2161eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
216285bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
216385bb9dcfSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator, or NULL
2164eaf62fffSJeremy L Thompson 
2165eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2166eaf62fffSJeremy L Thompson 
2167eaf62fffSJeremy L Thompson   @ref User
2168eaf62fffSJeremy L Thompson **/
21692b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
21702b730f8bSJeremy L Thompson                                        const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
2171eaf62fffSJeremy L Thompson                                        CeedOperator *op_restrict) {
21722b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2173eaf62fffSJeremy L Thompson   Ceed ceed;
21742b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2175eaf62fffSJeremy L Thompson 
2176eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
2177eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
21782b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
2179eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
21802b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
21812b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
21826574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2183eaf62fffSJeremy L Thompson 
2184eaf62fffSJeremy L Thompson   // Coarse to fine basis
218583d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
218683d6adf3SZach Atkins   if (op_prolong || op_restrict) {
218783d6adf3SZach Atkins     // Check if interpolation matrix is provided
21886574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
21896574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
2190eaf62fffSJeremy L Thompson     CeedElemTopology topo;
21912b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetTopology(basis_fine, &topo));
2192eaf62fffSJeremy L Thompson     CeedInt dim, num_comp, num_nodes_c, num_nodes_f;
21932b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
21942b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
21952b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f));
21962b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
2197eaf62fffSJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
21982b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref));
21992b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f, &q_weight));
22002b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad));
22012b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
22022b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
22032b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
22042b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
220583d6adf3SZach Atkins   }
2206eaf62fffSJeremy L Thompson 
2207eaf62fffSJeremy L Thompson   // Core code
22082b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2209eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2210eaf62fffSJeremy L Thompson }
2211eaf62fffSJeremy L Thompson 
2212eaf62fffSJeremy L Thompson /**
2213ea61e9acSJeremy L Thompson   @brief Build a FDM based approximate inverse for each element for a CeedOperator
2214eaf62fffSJeremy L Thompson 
2215ea61e9acSJeremy L Thompson   This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse.
2216859c15bbSJames Wright   This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$.
2217859c15bbSJames Wright   The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T
22189fd66db6SSebastian Grimberg \hat S V\f$.
22199fd66db6SSebastian Grimberg   The CeedOperator must be linear and non-composite.
22209fd66db6SSebastian Grimberg   The associated CeedQFunction must therefore also be linear.
2221eaf62fffSJeremy L Thompson 
2222ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2223f04ea552SJeremy L Thompson 
2224ea61e9acSJeremy L Thompson   @param[in]  op      CeedOperator to create element inverses
2225ea61e9acSJeremy L Thompson   @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element
2226ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2227eaf62fffSJeremy L Thompson 
2228eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2229eaf62fffSJeremy L Thompson 
2230480fae85SJeremy L Thompson   @ref User
2231eaf62fffSJeremy L Thompson **/
22322b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) {
22332b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2234eaf62fffSJeremy L Thompson 
2235eaf62fffSJeremy L Thompson   if (op->CreateFDMElementInverse) {
2236d04bbc78SJeremy L Thompson     // Backend version
22372b730f8bSJeremy L Thompson     CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request));
2238eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2239eaf62fffSJeremy L Thompson   } else {
2240d04bbc78SJeremy L Thompson     // Operator fallback
2241d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2242d04bbc78SJeremy L Thompson 
22432b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2244d04bbc78SJeremy L Thompson     if (op_fallback) {
22452b730f8bSJeremy L Thompson       CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request));
2246eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2247eaf62fffSJeremy L Thompson     }
2248eaf62fffSJeremy L Thompson   }
2249eaf62fffSJeremy L Thompson 
2250d04bbc78SJeremy L Thompson   // Default interface implementation
2251eaf62fffSJeremy L Thompson   Ceed ceed, ceed_parent;
22522b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
22532b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent));
2254eaf62fffSJeremy L Thompson   ceed_parent = ceed_parent ? ceed_parent : ceed;
2255eaf62fffSJeremy L Thompson   CeedQFunction qf;
22562b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
2257eaf62fffSJeremy L Thompson 
2258eaf62fffSJeremy L Thompson   // Determine active input basis
2259eaf62fffSJeremy L Thompson   bool                interp = false, grad = false;
2260eaf62fffSJeremy L Thompson   CeedBasis           basis = NULL;
2261eaf62fffSJeremy L Thompson   CeedElemRestriction rstr  = NULL;
2262eaf62fffSJeremy L Thompson   CeedOperatorField  *op_fields;
2263eaf62fffSJeremy L Thompson   CeedQFunctionField *qf_fields;
2264eaf62fffSJeremy L Thompson   CeedInt             num_input_fields;
22652b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL));
22662b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL));
2267eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
2268eaf62fffSJeremy L Thompson     CeedVector vec;
22692b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
2270eaf62fffSJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
2271eaf62fffSJeremy L Thompson       CeedEvalMode eval_mode;
22722b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
2273eaf62fffSJeremy L Thompson       interp = interp || eval_mode == CEED_EVAL_INTERP;
2274eaf62fffSJeremy L Thompson       grad   = grad || eval_mode == CEED_EVAL_GRAD;
22752b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis));
22762b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr));
2277eaf62fffSJeremy L Thompson     }
2278eaf62fffSJeremy L Thompson   }
22796574a04fSJeremy L Thompson   CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set");
2280e79b91d9SJeremy L Thompson   CeedSize l_size = 1;
2281352a5e7cSSebastian Grimberg   CeedInt  P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1;
22822b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d));
2283352a5e7cSSebastian Grimberg   CeedCall(CeedBasisGetNumNodes(basis, &num_nodes));
22842b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d));
22852b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts));
22862b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis, &dim));
22872b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis, &num_comp));
22882b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
22892b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2290eaf62fffSJeremy L Thompson 
2291eaf62fffSJeremy L Thompson   // Build and diagonalize 1D Mass and Laplacian
22926574a04fSJeremy L Thompson   bool is_tensor_basis;
22936574a04fSJeremy L Thompson   CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis));
22946574a04fSJeremy L Thompson   CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases");
2295eaf62fffSJeremy L Thompson   CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda;
22962b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &mass));
22972b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &laplace));
22982b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &x));
22992b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp));
23002b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &lambda));
2301eaf62fffSJeremy L Thompson   // -- Build matrices
2302eaf62fffSJeremy L Thompson   const CeedScalar *interp_1d, *grad_1d, *q_weight_1d;
23032b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp1D(basis, &interp_1d));
23042b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad1D(basis, &grad_1d));
23052b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d));
23062b730f8bSJeremy L Thompson   CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace));
2307eaf62fffSJeremy L Thompson 
2308eaf62fffSJeremy L Thompson   // -- Diagonalize
23092b730f8bSJeremy L Thompson   CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d));
23102b730f8bSJeremy L Thompson   CeedCall(CeedFree(&mass));
23112b730f8bSJeremy L Thompson   CeedCall(CeedFree(&laplace));
23122b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
23132b730f8bSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d];
23142b730f8bSJeremy L Thompson   }
23152b730f8bSJeremy L Thompson   CeedCall(CeedFree(&x));
2316eaf62fffSJeremy L Thompson 
2317eaf62fffSJeremy L Thompson   // Assemble QFunction
2318c5f45aeaSJeremy L Thompson   CeedVector          assembled = NULL;
2319c5f45aeaSJeremy L Thompson   CeedElemRestriction rstr_qf   = NULL;
23202b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request));
2321eaf62fffSJeremy L Thompson   CeedInt layout[3];
23222b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout));
23232b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qf));
2324eaf62fffSJeremy L Thompson   CeedScalar max_norm = 0;
23252b730f8bSJeremy L Thompson   CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm));
2326eaf62fffSJeremy L Thompson 
2327eaf62fffSJeremy L Thompson   // Calculate element averages
2328eaf62fffSJeremy L Thompson   CeedInt           num_modes = (interp ? 1 : 0) + (grad ? dim : 0);
2329eaf62fffSJeremy L Thompson   CeedScalar       *elem_avg;
2330eaf62fffSJeremy L Thompson   const CeedScalar *assembled_array, *q_weight_array;
2331eaf62fffSJeremy L Thompson   CeedVector        q_weight;
23322b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight));
23332b730f8bSJeremy L Thompson   CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight));
23342b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array));
23352b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array));
23362b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem, &elem_avg));
2337eaf62fffSJeremy L Thompson   const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON;
2338eaf62fffSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
2339eaf62fffSJeremy L Thompson     CeedInt count = 0;
23402b730f8bSJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
23412b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) {
23422b730f8bSJeremy L Thompson         if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) {
23432b730f8bSJeremy L Thompson           elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q];
2344eaf62fffSJeremy L Thompson           count++;
2345eaf62fffSJeremy L Thompson         }
23462b730f8bSJeremy L Thompson       }
23472b730f8bSJeremy L Thompson     }
2348eaf62fffSJeremy L Thompson     if (count) {
2349eaf62fffSJeremy L Thompson       elem_avg[e] /= count;
2350eaf62fffSJeremy L Thompson     } else {
2351eaf62fffSJeremy L Thompson       elem_avg[e] = 1.0;
2352eaf62fffSJeremy L Thompson     }
2353eaf62fffSJeremy L Thompson   }
23542b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array));
23552b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled));
23562b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array));
23572b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_weight));
2358eaf62fffSJeremy L Thompson 
2359eaf62fffSJeremy L Thompson   // Build FDM diagonal
2360eaf62fffSJeremy L Thompson   CeedVector  q_data;
2361eaf62fffSJeremy L Thompson   CeedScalar *q_data_array, *fdm_diagonal;
2362352a5e7cSSebastian Grimberg   CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal));
2363352a5e7cSSebastian Grimberg   const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON;
23642b730f8bSJeremy L Thompson   for (CeedInt c = 0; c < num_comp; c++) {
2365352a5e7cSSebastian Grimberg     for (CeedInt n = 0; n < num_nodes; n++) {
2366352a5e7cSSebastian Grimberg       if (interp) fdm_diagonal[c * num_nodes + n] = 1.0;
23672b730f8bSJeremy L Thompson       if (grad) {
2368eaf62fffSJeremy L Thompson         for (CeedInt d = 0; d < dim; d++) {
2369eaf62fffSJeremy L Thompson           CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d;
2370352a5e7cSSebastian Grimberg           fdm_diagonal[c * num_nodes + n] += lambda[i];
2371eaf62fffSJeremy L Thompson         }
2372eaf62fffSJeremy L Thompson       }
2373352a5e7cSSebastian Grimberg       if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound;
23742b730f8bSJeremy L Thompson     }
23752b730f8bSJeremy L Thompson   }
2376352a5e7cSSebastian Grimberg   CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data));
23772b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(q_data, 0.0));
23782b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array));
23792b730f8bSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
23802b730f8bSJeremy L Thompson     for (CeedInt c = 0; c < num_comp; c++) {
2381352a5e7cSSebastian Grimberg       for (CeedInt n = 0; n < num_nodes; n++) q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]);
23822b730f8bSJeremy L Thompson     }
23832b730f8bSJeremy L Thompson   }
23842b730f8bSJeremy L Thompson   CeedCall(CeedFree(&elem_avg));
23852b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_diagonal));
23862b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(q_data, &q_data_array));
2387eaf62fffSJeremy L Thompson 
2388eaf62fffSJeremy L Thompson   // Setup FDM operator
2389eaf62fffSJeremy L Thompson   // -- Basis
2390eaf62fffSJeremy L Thompson   CeedBasis   fdm_basis;
2391eaf62fffSJeremy L Thompson   CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy;
23922b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy));
23932b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_ref_dummy));
23942b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_weight_dummy));
23952b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis));
23962b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_interp));
23972b730f8bSJeremy L Thompson   CeedCall(CeedFree(&grad_dummy));
23982b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_ref_dummy));
23992b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_weight_dummy));
24002b730f8bSJeremy L Thompson   CeedCall(CeedFree(&lambda));
2401eaf62fffSJeremy L Thompson 
2402eaf62fffSJeremy L Thompson   // -- Restriction
2403eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_qd_i;
2404352a5e7cSSebastian Grimberg   CeedInt             strides[3] = {1, num_nodes, num_nodes * num_comp};
2405352a5e7cSSebastian Grimberg   CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i));
2406eaf62fffSJeremy L Thompson   // -- QFunction
2407eaf62fffSJeremy L Thompson   CeedQFunction qf_fdm;
24082b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm));
24092b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP));
24102b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE));
24112b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP));
24122b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp));
2413eaf62fffSJeremy L Thompson   // -- QFunction context
2414eaf62fffSJeremy L Thompson   CeedInt *num_comp_data;
24152b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, &num_comp_data));
2416eaf62fffSJeremy L Thompson   num_comp_data[0] = num_comp;
2417eaf62fffSJeremy L Thompson   CeedQFunctionContext ctx_fdm;
24182b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm));
24192b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data));
24202b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm));
24212b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_fdm));
2422eaf62fffSJeremy L Thompson   // -- Operator
24232b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv));
24242b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
24252b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data));
24262b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2427eaf62fffSJeremy L Thompson 
2428eaf62fffSJeremy L Thompson   // Cleanup
24292b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_data));
24302b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&fdm_basis));
24312b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i));
24322b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_fdm));
2433eaf62fffSJeremy L Thompson 
2434eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2435eaf62fffSJeremy L Thompson }
2436eaf62fffSJeremy L Thompson 
2437eaf62fffSJeremy L Thompson /// @}
2438