xref: /libCEED/rust/libceed-sys/c-src/interface/ceed-preconditioning.c (revision 83d6adf320d467417864810b884f58e4c3cda983)
// Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
// All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
//
// SPDX-License-Identifier: BSD-2-Clause
//
// This file is part of CEED:  http://github.com/ceed
7eaf62fffSJeremy L Thompson 
8ed9e99e6SJeremy L Thompson #include <assert.h>
92b730f8bSJeremy L Thompson #include <ceed-impl.h>
102b730f8bSJeremy L Thompson #include <ceed/backend.h>
112b730f8bSJeremy L Thompson #include <ceed/ceed.h>
122b730f8bSJeremy L Thompson #include <math.h>
13eaf62fffSJeremy L Thompson #include <stdbool.h>
14eaf62fffSJeremy L Thompson #include <stdio.h>
15eaf62fffSJeremy L Thompson #include <string.h>
16eaf62fffSJeremy L Thompson 
/// @file
/// Implementation of CeedOperator preconditioning interfaces

/// ----------------------------------------------------------------------------
/// CeedOperator Library Internal Preconditioning Functions
/// ----------------------------------------------------------------------------
/// @addtogroup CeedOperatorDeveloper
/// @{
25eaf62fffSJeremy L Thompson 
26eaf62fffSJeremy L Thompson /**
27ea61e9acSJeremy L Thompson   @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality
289e77b9c8SJeremy L Thompson 
2901ea9c81SJed Brown   @param[in]  fallback_ceed Ceed on which to create fallback CeedQFunction
309e77b9c8SJeremy L Thompson   @param[in]  qf            CeedQFunction to create fallback for
3101ea9c81SJed Brown   @param[out] qf_fallback   fallback CeedQFunction
329e77b9c8SJeremy L Thompson 
339e77b9c8SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
349e77b9c8SJeremy L Thompson 
359e77b9c8SJeremy L Thompson   @ref Developer
369e77b9c8SJeremy L Thompson **/
372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) {
389e77b9c8SJeremy L Thompson   // Check if NULL qf passed in
399e77b9c8SJeremy L Thompson   if (!qf) return CEED_ERROR_SUCCESS;
409e77b9c8SJeremy L Thompson 
41d04bbc78SJeremy L Thompson   CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n");
4213f886e9SJeremy L Thompson   CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n");
43d04bbc78SJeremy L Thompson 
449e77b9c8SJeremy L Thompson   char *source_path_with_name = "";
459e77b9c8SJeremy L Thompson   if (qf->source_path) {
462b730f8bSJeremy L Thompson     size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name);
472b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name));
489e77b9c8SJeremy L Thompson     memcpy(source_path_with_name, qf->source_path, path_len);
499e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len], ":", 1);
509e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len);
519e77b9c8SJeremy L Thompson   } else {
522b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &source_path_with_name));
539e77b9c8SJeremy L Thompson   }
549e77b9c8SJeremy L Thompson 
552b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback));
569e77b9c8SJeremy L Thompson   {
579e77b9c8SJeremy L Thompson     CeedQFunctionContext ctx;
589e77b9c8SJeremy L Thompson 
592b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionGetContext(qf, &ctx));
602b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx));
619e77b9c8SJeremy L Thompson   }
629e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_input_fields; i++) {
632b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode));
649e77b9c8SJeremy L Thompson   }
659e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_output_fields; i++) {
662b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode));
679e77b9c8SJeremy L Thompson   }
682b730f8bSJeremy L Thompson   CeedCall(CeedFree(&source_path_with_name));
699e77b9c8SJeremy L Thompson 
709e77b9c8SJeremy L Thompson   return CEED_ERROR_SUCCESS;
719e77b9c8SJeremy L Thompson }
729e77b9c8SJeremy L Thompson 
739e77b9c8SJeremy L Thompson /**
74ea61e9acSJeremy L Thompson   @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality
75eaf62fffSJeremy L Thompson 
76ea61e9acSJeremy L Thompson   @param[in,out] op CeedOperator to create fallback for
77eaf62fffSJeremy L Thompson 
78eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
79eaf62fffSJeremy L Thompson 
80eaf62fffSJeremy L Thompson   @ref Developer
81eaf62fffSJeremy L Thompson **/
82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) {
83b275c451SJeremy L Thompson   bool is_composite;
849e77b9c8SJeremy L Thompson   Ceed ceed_fallback;
85eaf62fffSJeremy L Thompson 
86805fe78eSJeremy L Thompson   // Check not already created
87805fe78eSJeremy L Thompson   if (op->op_fallback) return CEED_ERROR_SUCCESS;
88805fe78eSJeremy L Thompson 
89eaf62fffSJeremy L Thompson   // Fallback Ceed
902b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
91d04bbc78SJeremy L Thompson   if (!ceed_fallback) return CEED_ERROR_SUCCESS;
92d04bbc78SJeremy L Thompson 
93d04bbc78SJeremy L Thompson   CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
9413f886e9SJeremy L Thompson   CeedDebug(op->ceed, "Creating fallback CeedOperator\n");
95eaf62fffSJeremy L Thompson 
96eaf62fffSJeremy L Thompson   // Clone Op
97805fe78eSJeremy L Thompson   CeedOperator op_fallback;
98b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
99b275c451SJeremy L Thompson   if (is_composite) {
100b275c451SJeremy L Thompson     CeedInt       num_suboperators;
101b275c451SJeremy L Thompson     CeedOperator *sub_operators;
102b275c451SJeremy L Thompson 
1032b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback));
104b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
105b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
106b275c451SJeremy L Thompson     for (CeedInt i = 0; i < num_suboperators; i++) {
107d04bbc78SJeremy L Thompson       CeedOperator op_sub_fallback;
108d04bbc78SJeremy L Thompson 
109b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback));
1102b730f8bSJeremy L Thompson       CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback));
111805fe78eSJeremy L Thompson     }
112805fe78eSJeremy L Thompson   } else {
1139e77b9c8SJeremy L Thompson     CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL;
1142b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback));
1152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback));
1162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback));
1172b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback));
118805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_input_fields; i++) {
1192b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_restr, op->input_fields[i]->basis,
1202b730f8bSJeremy L Thompson                                     op->input_fields[i]->vec));
121805fe78eSJeremy L Thompson     }
122805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_output_fields; i++) {
1232b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_restr, op->output_fields[i]->basis,
1242b730f8bSJeremy L Thompson                                     op->output_fields[i]->vec));
125805fe78eSJeremy L Thompson     }
1262b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled));
127805fe78eSJeremy L Thompson     if (op_fallback->num_qpts == 0) {
1282b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts));
129805fe78eSJeremy L Thompson     }
1309e77b9c8SJeremy L Thompson     // Cleanup
1312b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&qf_fallback));
1322b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqf_fallback));
1332b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqfT_fallback));
134805fe78eSJeremy L Thompson   }
1352b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(op_fallback, op->name));
1362b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fallback));
137805fe78eSJeremy L Thompson   op->op_fallback = op_fallback;
138eaf62fffSJeremy L Thompson 
139eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
140eaf62fffSJeremy L Thompson }
141eaf62fffSJeremy L Thompson 
142eaf62fffSJeremy L Thompson /**
143ea61e9acSJeremy L Thompson   @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality
144d04bbc78SJeremy L Thompson 
145d04bbc78SJeremy L Thompson   @param[in]  op          CeedOperator to retrieve fallback for
146d04bbc78SJeremy L Thompson   @param[out] op_fallback Fallback CeedOperator
147d04bbc78SJeremy L Thompson 
148d04bbc78SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
149d04bbc78SJeremy L Thompson 
150d04bbc78SJeremy L Thompson   @ref Developer
151d04bbc78SJeremy L Thompson **/
152d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) {
153d04bbc78SJeremy L Thompson   // Create if needed
154d04bbc78SJeremy L Thompson   if (!op->op_fallback) {
1552b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreateFallback(op));
156d04bbc78SJeremy L Thompson   }
157d04bbc78SJeremy L Thompson   if (op->op_fallback) {
158d04bbc78SJeremy L Thompson     bool is_debug;
159d04bbc78SJeremy L Thompson 
1602b730f8bSJeremy L Thompson     CeedCall(CeedIsDebug(op->ceed, &is_debug));
161d04bbc78SJeremy L Thompson     if (is_debug) {
162b275c451SJeremy L Thompson       Ceed        ceed, ceed_fallback;
163d04bbc78SJeremy L Thompson       const char *resource, *resource_fallback;
164d04bbc78SJeremy L Thompson 
165b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetCeed(op, &ceed));
166b275c451SJeremy L Thompson       CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback));
167b275c451SJeremy L Thompson       CeedCall(CeedGetResource(ceed, &resource));
1682b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(ceed_fallback, &resource_fallback));
169d04bbc78SJeremy L Thompson 
170b275c451SJeremy L Thompson       CeedDebug256(ceed, 1, "---------- CeedOperator Fallback ----------\n");
171b275c451SJeremy L Thompson       CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback,
1722b730f8bSJeremy L Thompson                 op->op_fallback);
173d04bbc78SJeremy L Thompson     }
174d04bbc78SJeremy L Thompson   }
175d04bbc78SJeremy L Thompson   *op_fallback = op->op_fallback;
176d04bbc78SJeremy L Thompson 
177d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
178d04bbc78SJeremy L Thompson }
179d04bbc78SJeremy L Thompson 
180d04bbc78SJeremy L Thompson /**
181eaf62fffSJeremy L Thompson   @brief Select correct basis matrix pointer based on CeedEvalMode
182eaf62fffSJeremy L Thompson 
183eaf62fffSJeremy L Thompson   @param[in]  eval_mode Current basis evaluation mode
184eaf62fffSJeremy L Thompson   @param[in]  identity  Pointer to identity matrix
185eaf62fffSJeremy L Thompson   @param[in]  interp    Pointer to interpolation matrix
186eaf62fffSJeremy L Thompson   @param[in]  grad      Pointer to gradient matrix
187eaf62fffSJeremy L Thompson   @param[out] basis_ptr Basis pointer to set
188eaf62fffSJeremy L Thompson 
189eaf62fffSJeremy L Thompson   @ref Developer
190eaf62fffSJeremy L Thompson **/
1912b730f8bSJeremy L Thompson static inline void CeedOperatorGetBasisPointer(CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar *interp, const CeedScalar *grad,
1922b730f8bSJeremy L Thompson                                                const CeedScalar **basis_ptr) {
193eaf62fffSJeremy L Thompson   switch (eval_mode) {
194eaf62fffSJeremy L Thompson     case CEED_EVAL_NONE:
195eaf62fffSJeremy L Thompson       *basis_ptr = identity;
196eaf62fffSJeremy L Thompson       break;
197eaf62fffSJeremy L Thompson     case CEED_EVAL_INTERP:
198eaf62fffSJeremy L Thompson       *basis_ptr = interp;
199eaf62fffSJeremy L Thompson       break;
200eaf62fffSJeremy L Thompson     case CEED_EVAL_GRAD:
201eaf62fffSJeremy L Thompson       *basis_ptr = grad;
202eaf62fffSJeremy L Thompson       break;
203eaf62fffSJeremy L Thompson     case CEED_EVAL_WEIGHT:
204eaf62fffSJeremy L Thompson     case CEED_EVAL_DIV:
205eaf62fffSJeremy L Thompson     case CEED_EVAL_CURL:
206eaf62fffSJeremy L Thompson       break;  // Caught by QF Assembly
207eaf62fffSJeremy L Thompson   }
208ed9e99e6SJeremy L Thompson   assert(*basis_ptr != NULL);
209eaf62fffSJeremy L Thompson }
210eaf62fffSJeremy L Thompson 
211eaf62fffSJeremy L Thompson /**
212eaf62fffSJeremy L Thompson   @brief Create point block restriction for active operator field
213eaf62fffSJeremy L Thompson 
214eaf62fffSJeremy L Thompson   @param[in]  rstr            Original CeedElemRestriction for active field
215ea61e9acSJeremy L Thompson   @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored
216eaf62fffSJeremy L Thompson 
217eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
218eaf62fffSJeremy L Thompson 
219eaf62fffSJeremy L Thompson   @ref Developer
220eaf62fffSJeremy L Thompson **/
2212b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) {
222eaf62fffSJeremy L Thompson   Ceed ceed;
2232b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed));
224eaf62fffSJeremy L Thompson   const CeedInt *offsets;
2252b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets));
226eaf62fffSJeremy L Thompson 
227eaf62fffSJeremy L Thompson   // Expand offsets
2287b63f5c6SJed Brown   CeedInt  num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets;
2297b63f5c6SJed Brown   CeedSize l_size;
2302b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
2312b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
2322b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
2332b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride));
2342b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
235eaf62fffSJeremy L Thompson   CeedInt shift = num_comp;
2362b730f8bSJeremy L Thompson   if (comp_stride != 1) shift *= num_comp;
2372b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets));
238eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_elem * elem_size; i++) {
239eaf62fffSJeremy L Thompson     pointblock_offsets[i] = offsets[i] * shift;
240eaf62fffSJeremy L Thompson   }
241eaf62fffSJeremy L Thompson 
242eaf62fffSJeremy L Thompson   // Create new restriction
2432b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER,
2442b730f8bSJeremy L Thompson                                      pointblock_offsets, pointblock_rstr));
245eaf62fffSJeremy L Thompson 
246eaf62fffSJeremy L Thompson   // Cleanup
2472b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets));
248eaf62fffSJeremy L Thompson 
249eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
250eaf62fffSJeremy L Thompson }
251eaf62fffSJeremy L Thompson 
252eaf62fffSJeremy L Thompson /**
253eaf62fffSJeremy L Thompson   @brief Core logic for assembling operator diagonal or point block diagonal
254eaf62fffSJeremy L Thompson 
255eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
256ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
257eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
258eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
259eaf62fffSJeremy L Thompson 
260eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
261eaf62fffSJeremy L Thompson 
262eaf62fffSJeremy L Thompson   @ref Developer
263eaf62fffSJeremy L Thompson **/
2642b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) {
265eaf62fffSJeremy L Thompson   Ceed ceed;
2662b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
267eaf62fffSJeremy L Thompson 
268eaf62fffSJeremy L Thompson   // Assemble QFunction
269eaf62fffSJeremy L Thompson   CeedQFunction qf;
2702b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
271eaf62fffSJeremy L Thompson   CeedInt num_input_fields, num_output_fields;
2722b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
273eaf62fffSJeremy L Thompson   CeedVector          assembled_qf;
274eaf62fffSJeremy L Thompson   CeedElemRestriction rstr;
2752b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr, request));
276eaf62fffSJeremy L Thompson   CeedInt layout[3];
2772b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr, &layout));
2782b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr));
279eaf62fffSJeremy L Thompson 
280ed9e99e6SJeremy L Thompson   // Get assembly data
281ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
2822b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
283ed9e99e6SJeremy L Thompson   const CeedEvalMode *eval_mode_in, *eval_mode_out;
284ed9e99e6SJeremy L Thompson   CeedInt             num_eval_mode_in, num_eval_mode_out;
2852b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out));
286ed9e99e6SJeremy L Thompson   CeedBasis basis_in, basis_out;
2872b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL));
288ed9e99e6SJeremy L Thompson   CeedInt num_comp;
2892b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp));
290eaf62fffSJeremy L Thompson 
291eaf62fffSJeremy L Thompson   // Assemble point block diagonal restriction, if needed
292ed9e99e6SJeremy L Thompson   CeedElemRestriction diag_rstr;
2932b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &diag_rstr));
294eaf62fffSJeremy L Thompson   if (is_pointblock) {
295ed9e99e6SJeremy L Thompson     CeedElemRestriction point_block_rstr;
2962b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_rstr, &point_block_rstr));
297ed9e99e6SJeremy L Thompson     diag_rstr = point_block_rstr;
298eaf62fffSJeremy L Thompson   }
299eaf62fffSJeremy L Thompson 
300eaf62fffSJeremy L Thompson   // Create diagonal vector
301eaf62fffSJeremy L Thompson   CeedVector elem_diag;
3022b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateVector(diag_rstr, NULL, &elem_diag));
303eaf62fffSJeremy L Thompson 
304eaf62fffSJeremy L Thompson   // Assemble element operator diagonals
3059c774eddSJeremy L Thompson   CeedScalar       *elem_diag_array;
3069c774eddSJeremy L Thompson   const CeedScalar *assembled_qf_array;
3072b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_diag, 0.0));
3082b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array));
3092b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
310eaf62fffSJeremy L Thompson   CeedInt num_elem, num_nodes, num_qpts;
3112b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(diag_rstr, &num_elem));
3122b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes(basis_in, &num_nodes));
3132b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
314ed9e99e6SJeremy L Thompson 
315eaf62fffSJeremy L Thompson   // Basis matrices
316eaf62fffSJeremy L Thompson   const CeedScalar *interp_in, *interp_out, *grad_in, *grad_out;
317eaf62fffSJeremy L Thompson   CeedScalar       *identity      = NULL;
318ed9e99e6SJeremy L Thompson   bool              has_eval_none = false;
319ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_eval_mode_in; i++) {
320ed9e99e6SJeremy L Thompson     has_eval_none = has_eval_none || (eval_mode_in[i] == CEED_EVAL_NONE);
321ed9e99e6SJeremy L Thompson   }
322ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_eval_mode_out; i++) {
323ed9e99e6SJeremy L Thompson     has_eval_none = has_eval_none || (eval_mode_out[i] == CEED_EVAL_NONE);
324ed9e99e6SJeremy L Thompson   }
325ed9e99e6SJeremy L Thompson   if (has_eval_none) {
3262b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
3272b730f8bSJeremy L Thompson     for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0;
328eaf62fffSJeremy L Thompson   }
3292b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_in, &interp_in));
3302b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_out, &interp_out));
3312b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_in, &grad_in));
3322b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_out, &grad_out));
333eaf62fffSJeremy L Thompson   // Compute the diagonal of B^T D B
334eaf62fffSJeremy L Thompson   // Each element
335eaf62fffSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
336eaf62fffSJeremy L Thompson     CeedInt d_out = -1;
337eaf62fffSJeremy L Thompson     // Each basis eval mode pair
338eaf62fffSJeremy L Thompson     for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) {
339eaf62fffSJeremy L Thompson       const CeedScalar *bt = NULL;
3402b730f8bSJeremy L Thompson       if (eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out += 1;
3412b730f8bSJeremy L Thompson       CeedOperatorGetBasisPointer(eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * num_nodes], &bt);
342eaf62fffSJeremy L Thompson       CeedInt d_in = -1;
343eaf62fffSJeremy L Thompson       for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) {
344eaf62fffSJeremy L Thompson         const CeedScalar *b = NULL;
3452b730f8bSJeremy L Thompson         if (eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in += 1;
3462b730f8bSJeremy L Thompson         CeedOperatorGetBasisPointer(eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * num_nodes], &b);
347eaf62fffSJeremy L Thompson         // Each component
3482b730f8bSJeremy L Thompson         for (CeedInt c_out = 0; c_out < num_comp; c_out++) {
349eaf62fffSJeremy L Thompson           // Each qpoint/node pair
3502b730f8bSJeremy L Thompson           for (CeedInt q = 0; q < num_qpts; q++) {
351eaf62fffSJeremy L Thompson             if (is_pointblock) {
352eaf62fffSJeremy L Thompson               // Point Block Diagonal
353eaf62fffSJeremy L Thompson               for (CeedInt c_in = 0; c_in < num_comp; c_in++) {
354eaf62fffSJeremy L Thompson                 const CeedScalar qf_value =
3552b730f8bSJeremy L Thompson                     assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_in) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] +
3562b730f8bSJeremy L Thompson                                        e * layout[2]];
3572b730f8bSJeremy L Thompson                 for (CeedInt n = 0; n < num_nodes; n++) {
358eaf62fffSJeremy L Thompson                   elem_diag_array[((e * num_comp + c_out) * num_comp + c_in) * num_nodes + n] +=
359eaf62fffSJeremy L Thompson                       bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n];
360eaf62fffSJeremy L Thompson                 }
3612b730f8bSJeremy L Thompson               }
362eaf62fffSJeremy L Thompson             } else {
363eaf62fffSJeremy L Thompson               // Diagonal Only
364eaf62fffSJeremy L Thompson               const CeedScalar qf_value =
3652b730f8bSJeremy L Thompson                   assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_out) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] +
3662b730f8bSJeremy L Thompson                                      e * layout[2]];
3672b730f8bSJeremy L Thompson               for (CeedInt n = 0; n < num_nodes; n++) {
3682b730f8bSJeremy L Thompson                 elem_diag_array[(e * num_comp + c_out) * num_nodes + n] += bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n];
369eaf62fffSJeremy L Thompson               }
370eaf62fffSJeremy L Thompson             }
371eaf62fffSJeremy L Thompson           }
372eaf62fffSJeremy L Thompson         }
3732b730f8bSJeremy L Thompson       }
3742b730f8bSJeremy L Thompson     }
3752b730f8bSJeremy L Thompson   }
3762b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array));
3772b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
378eaf62fffSJeremy L Thompson 
379eaf62fffSJeremy L Thompson   // Assemble local operator diagonal
3802b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(diag_rstr, CEED_TRANSPOSE, elem_diag, assembled, request));
381eaf62fffSJeremy L Thompson 
382eaf62fffSJeremy L Thompson   // Cleanup
383eaf62fffSJeremy L Thompson   if (is_pointblock) {
3842b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&diag_rstr));
385eaf62fffSJeremy L Thompson   }
3862b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
3872b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_diag));
3882b730f8bSJeremy L Thompson   CeedCall(CeedFree(&identity));
389eaf62fffSJeremy L Thompson 
390eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
391eaf62fffSJeremy L Thompson }
392eaf62fffSJeremy L Thompson 
393eaf62fffSJeremy L Thompson /**
394eaf62fffSJeremy L Thompson   @brief Core logic for assembling composite operator diagonal
395eaf62fffSJeremy L Thompson 
396eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
397ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
398eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
399eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
400eaf62fffSJeremy L Thompson 
401eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
402eaf62fffSJeremy L Thompson 
403eaf62fffSJeremy L Thompson   @ref Developer
404eaf62fffSJeremy L Thompson **/
4052b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock,
406eaf62fffSJeremy L Thompson                                                                  CeedVector assembled) {
407eaf62fffSJeremy L Thompson   CeedInt       num_sub;
408eaf62fffSJeremy L Thompson   CeedOperator *suboperators;
409c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub));
410c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators));
411eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_sub; i++) {
4126aa95790SJeremy L Thompson     if (is_pointblock) {
4132b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request));
4146aa95790SJeremy L Thompson     } else {
4152b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request));
4166aa95790SJeremy L Thompson     }
417eaf62fffSJeremy L Thompson   }
418eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
419eaf62fffSJeremy L Thompson }
420eaf62fffSJeremy L Thompson 
421eaf62fffSJeremy L Thompson /**
422eaf62fffSJeremy L Thompson   @brief Build nonzero pattern for non-composite operator
423eaf62fffSJeremy L Thompson 
424eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssembleSymbolic()
425eaf62fffSJeremy L Thompson 
426eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble nonzero pattern
427eaf62fffSJeremy L Thompson   @param[in]  offset Offset for number of entries
428eaf62fffSJeremy L Thompson   @param[out] rows   Row number for each entry
429eaf62fffSJeremy L Thompson   @param[out] cols   Column number for each entry
430eaf62fffSJeremy L Thompson 
431eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
432eaf62fffSJeremy L Thompson 
433eaf62fffSJeremy L Thompson   @ref Developer
434eaf62fffSJeremy L Thompson **/
4352b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) {
436f3d47e36SJeremy L Thompson   Ceed ceed;
437f3d47e36SJeremy L Thompson   bool is_composite;
438f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
439f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
440f3d47e36SJeremy L Thompson 
441b275c451SJeremy L Thompson   if (is_composite) {
442eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
4432b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
444eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
4452b730f8bSJeremy L Thompson   }
446eaf62fffSJeremy L Thompson 
447c9366a6bSJeremy L Thompson   CeedSize num_nodes;
4482b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL));
449eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_in;
4502b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in));
451e79b91d9SJeremy L Thompson   CeedInt num_elem, elem_size, num_comp;
4522b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem));
4532b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size));
4542b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp));
455eaf62fffSJeremy L Thompson   CeedInt layout_er[3];
4562b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er));
457eaf62fffSJeremy L Thompson 
458eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
459eaf62fffSJeremy L Thompson 
460eaf62fffSJeremy L Thompson   // Determine elem_dof relation
461eaf62fffSJeremy L Thompson   CeedVector index_vec;
4622b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec));
463eaf62fffSJeremy L Thompson   CeedScalar *array;
4642b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array));
465ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_nodes; i++) array[i] = i;
4662b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(index_vec, &array));
467eaf62fffSJeremy L Thompson   CeedVector elem_dof;
4682b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof));
4692b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_dof, 0.0));
4702b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE));
471eaf62fffSJeremy L Thompson   const CeedScalar *elem_dof_a;
4722b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a));
4732b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&index_vec));
474eaf62fffSJeremy L Thompson 
475eaf62fffSJeremy L Thompson   // Determine i, j locations for element matrices
476eaf62fffSJeremy L Thompson   CeedInt count = 0;
477ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
478ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
479ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
480ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
481ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
4822b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2];
4832b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2];
484eaf62fffSJeremy L Thompson 
485eaf62fffSJeremy L Thompson             const CeedInt row = elem_dof_a[elem_dof_index_row];
486eaf62fffSJeremy L Thompson             const CeedInt col = elem_dof_a[elem_dof_index_col];
487eaf62fffSJeremy L Thompson 
488eaf62fffSJeremy L Thompson             rows[offset + count] = row;
489eaf62fffSJeremy L Thompson             cols[offset + count] = col;
490eaf62fffSJeremy L Thompson             count++;
491eaf62fffSJeremy L Thompson           }
492eaf62fffSJeremy L Thompson         }
493eaf62fffSJeremy L Thompson       }
494eaf62fffSJeremy L Thompson     }
495eaf62fffSJeremy L Thompson   }
4962b730f8bSJeremy L Thompson   if (count != local_num_entries) {
497eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
498eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing assembled entries");
499eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
5002b730f8bSJeremy L Thompson   }
5012b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a));
5022b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_dof));
503eaf62fffSJeremy L Thompson 
504eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
505eaf62fffSJeremy L Thompson }
506eaf62fffSJeremy L Thompson 
507eaf62fffSJeremy L Thompson /**
508eaf62fffSJeremy L Thompson   @brief Assemble nonzero entries for non-composite operator
509eaf62fffSJeremy L Thompson 
510eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssemble()
511eaf62fffSJeremy L Thompson 
512eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble
513ea61e9acSJeremy L Thompson   @param[in]  offset Offset for number of entries
514eaf62fffSJeremy L Thompson   @param[out] values Values to assemble into matrix
515eaf62fffSJeremy L Thompson 
516eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
517eaf62fffSJeremy L Thompson 
518eaf62fffSJeremy L Thompson   @ref Developer
519eaf62fffSJeremy L Thompson **/
5202b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) {
521f3d47e36SJeremy L Thompson   Ceed ceed;
522f3d47e36SJeremy L Thompson   bool is_composite;
523f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
524f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
525f3d47e36SJeremy L Thompson 
526f3d47e36SJeremy L Thompson   if (is_composite) {
527eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
5282b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
529eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
5302b730f8bSJeremy L Thompson   }
531f3d47e36SJeremy L Thompson 
532f3d47e36SJeremy L Thompson   // Early exit for empty operator
533f3d47e36SJeremy L Thompson   {
534f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
535f3d47e36SJeremy L Thompson 
536f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
537f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
538f3d47e36SJeremy L Thompson   }
539eaf62fffSJeremy L Thompson 
540cefa2673SJeremy L Thompson   if (op->LinearAssembleSingle) {
541cefa2673SJeremy L Thompson     // Backend version
5422b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSingle(op, offset, values));
543cefa2673SJeremy L Thompson     return CEED_ERROR_SUCCESS;
544cefa2673SJeremy L Thompson   } else {
545cefa2673SJeremy L Thompson     // Operator fallback
546cefa2673SJeremy L Thompson     CeedOperator op_fallback;
547cefa2673SJeremy L Thompson 
5482b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
549cefa2673SJeremy L Thompson     if (op_fallback) {
5502b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values));
551cefa2673SJeremy L Thompson       return CEED_ERROR_SUCCESS;
552cefa2673SJeremy L Thompson     }
553cefa2673SJeremy L Thompson   }
554cefa2673SJeremy L Thompson 
555eaf62fffSJeremy L Thompson   // Assemble QFunction
556eaf62fffSJeremy L Thompson   CeedQFunction qf;
5572b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
558eaf62fffSJeremy L Thompson   CeedVector          assembled_qf;
559eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_q;
5602b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE));
5611f9221feSJeremy L Thompson   CeedSize qf_length;
5622b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetLength(assembled_qf, &qf_length));
563eaf62fffSJeremy L Thompson 
5647e7773b5SJeremy L Thompson   CeedInt            num_input_fields, num_output_fields;
565eaf62fffSJeremy L Thompson   CeedOperatorField *input_fields;
566eaf62fffSJeremy L Thompson   CeedOperatorField *output_fields;
5672b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields));
568eaf62fffSJeremy L Thompson 
569ed9e99e6SJeremy L Thompson   // Get assembly data
570ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
5712b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
572ed9e99e6SJeremy L Thompson   const CeedEvalMode *eval_mode_in, *eval_mode_out;
573ed9e99e6SJeremy L Thompson   CeedInt             num_eval_mode_in, num_eval_mode_out;
5742b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out));
575ed9e99e6SJeremy L Thompson   CeedBasis basis_in, basis_out;
5762b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL));
577eaf62fffSJeremy L Thompson 
5782b730f8bSJeremy L Thompson   if (num_eval_mode_in == 0 || num_eval_mode_out == 0) {
579eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
5802b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs");
581eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
5822b730f8bSJeremy L Thompson   }
583eaf62fffSJeremy L Thompson 
584ed9e99e6SJeremy L Thompson   CeedElemRestriction active_rstr;
585eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_qpts, num_comp;
5862b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr));
5872b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem));
5882b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size));
5892b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp));
5902b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
591eaf62fffSJeremy L Thompson 
592eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
593eaf62fffSJeremy L Thompson 
594eaf62fffSJeremy L Thompson   // loop over elements and put in data structure
595eaf62fffSJeremy L Thompson   const CeedScalar *interp_in, *grad_in;
5962b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_in, &interp_in));
5972b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_in, &grad_in));
598eaf62fffSJeremy L Thompson 
599eaf62fffSJeremy L Thompson   const CeedScalar *assembled_qf_array;
6002b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
601eaf62fffSJeremy L Thompson 
602eaf62fffSJeremy L Thompson   CeedInt layout_qf[3];
6032b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf));
6042b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_q));
605eaf62fffSJeremy L Thompson 
606eaf62fffSJeremy L Thompson   // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order
607ed9e99e6SJeremy L Thompson   const CeedScalar *B_mat_in, *B_mat_out;
6082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &B_mat_in, NULL, &B_mat_out));
609ed9e99e6SJeremy L Thompson   CeedScalar  BTD_mat[elem_size * num_qpts * num_eval_mode_in];
610eaf62fffSJeremy L Thompson   CeedScalar  elem_mat[elem_size * elem_size];
61192ae7e47SJeremy L Thompson   CeedInt     count = 0;
612eaf62fffSJeremy L Thompson   CeedScalar *vals;
6132b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(values, CEED_MEM_HOST, &vals));
614ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
615ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
616ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
617ed9e99e6SJeremy L Thompson         // Compute B^T*D
618ed9e99e6SJeremy L Thompson         for (CeedInt n = 0; n < elem_size; n++) {
619ed9e99e6SJeremy L Thompson           for (CeedInt q = 0; q < num_qpts; q++) {
620ed9e99e6SJeremy L Thompson             for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) {
6212b730f8bSJeremy L Thompson               const CeedInt btd_index = n * (num_qpts * num_eval_mode_in) + (num_eval_mode_in * q + e_in);
622067fd99fSJeremy L Thompson               CeedScalar    sum       = 0.0;
623067fd99fSJeremy L Thompson               for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) {
624ed9e99e6SJeremy L Thompson                 const CeedInt b_out_index     = (num_eval_mode_out * q + e_out) * elem_size + n;
6252b730f8bSJeremy L Thompson                 const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_mode_out + e_out) * num_comp + comp_out;
6262b730f8bSJeremy L Thompson                 const CeedInt qf_index        = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2];
627067fd99fSJeremy L Thompson                 sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index];
628eaf62fffSJeremy L Thompson               }
629067fd99fSJeremy L Thompson               BTD_mat[btd_index] = sum;
630ed9e99e6SJeremy L Thompson             }
631ed9e99e6SJeremy L Thompson           }
632eaf62fffSJeremy L Thompson         }
633eaf62fffSJeremy L Thompson         // form element matrix itself (for each block component)
6342b730f8bSJeremy L Thompson         CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_mode_in));
635eaf62fffSJeremy L Thompson 
636eaf62fffSJeremy L Thompson         // put element matrix in coordinate data structure
637ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
638ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
639eaf62fffSJeremy L Thompson             vals[offset + count] = elem_mat[i * elem_size + j];
640eaf62fffSJeremy L Thompson             count++;
641eaf62fffSJeremy L Thompson           }
642eaf62fffSJeremy L Thompson         }
643eaf62fffSJeremy L Thompson       }
644eaf62fffSJeremy L Thompson     }
645eaf62fffSJeremy L Thompson   }
6462b730f8bSJeremy L Thompson   if (count != local_num_entries) {
647eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
648eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing entries");
649eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
6502b730f8bSJeremy L Thompson   }
6512b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(values, &vals));
652eaf62fffSJeremy L Thompson 
6532b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
6542b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
655eaf62fffSJeremy L Thompson 
656eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
657eaf62fffSJeremy L Thompson }
658eaf62fffSJeremy L Thompson 
659eaf62fffSJeremy L Thompson /**
660eaf62fffSJeremy L Thompson   @brief Count number of entries for assembled CeedOperator
661eaf62fffSJeremy L Thompson 
662eaf62fffSJeremy L Thompson   @param[in]  op          CeedOperator to assemble
663eaf62fffSJeremy L Thompson   @param[out] num_entries Number of entries in assembled representation
664eaf62fffSJeremy L Thompson 
665eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
666eaf62fffSJeremy L Thompson 
667eaf62fffSJeremy L Thompson   @ref Utility
668eaf62fffSJeremy L Thompson **/
6692b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) {
670b275c451SJeremy L Thompson   bool                is_composite;
671eaf62fffSJeremy L Thompson   CeedElemRestriction rstr;
672eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_comp;
673eaf62fffSJeremy L Thompson 
674b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
675b275c451SJeremy L Thompson   if (is_composite) {
676eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
6772b730f8bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
678eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
6792b730f8bSJeremy L Thompson   }
6802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr));
6812b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
6822b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
6832b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
684eaf62fffSJeremy L Thompson   *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
685eaf62fffSJeremy L Thompson 
686eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
687eaf62fffSJeremy L Thompson }
688eaf62fffSJeremy L Thompson 
689eaf62fffSJeremy L Thompson /**
690ea61e9acSJeremy L Thompson   @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator
691eaf62fffSJeremy L Thompson 
692eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
693eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter
694eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
695eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
696eaf62fffSJeremy L Thompson   @param[in]  basis_c_to_f Basis for coarse to fine interpolation
697eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
698eaf62fffSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator
699eaf62fffSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator
700eaf62fffSJeremy L Thompson 
701eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
702eaf62fffSJeremy L Thompson 
703eaf62fffSJeremy L Thompson   @ref Developer
704eaf62fffSJeremy L Thompson **/
7052b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
7062b730f8bSJeremy L Thompson                                             CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
707eaf62fffSJeremy L Thompson   Ceed ceed;
7082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
709eaf62fffSJeremy L Thompson 
710eaf62fffSJeremy L Thompson   // Check for composite operator
711eaf62fffSJeremy L Thompson   bool is_composite;
7122b730f8bSJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op_fine, &is_composite));
7132b730f8bSJeremy L Thompson   if (is_composite) {
714eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
7152b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported");
716eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
7172b730f8bSJeremy L Thompson   }
718eaf62fffSJeremy L Thompson 
719eaf62fffSJeremy L Thompson   // Coarse Grid
7202b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse));
721eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_fine = NULL;
722eaf62fffSJeremy L Thompson   // -- Clone input fields
72392ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) {
724eaf62fffSJeremy L Thompson     if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) {
725eaf62fffSJeremy L Thompson       rstr_fine = op_fine->input_fields[i]->elem_restr;
7262b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
727eaf62fffSJeremy L Thompson     } else {
7282b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_restr,
7292b730f8bSJeremy L Thompson                                     op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec));
730eaf62fffSJeremy L Thompson     }
731eaf62fffSJeremy L Thompson   }
732eaf62fffSJeremy L Thompson   // -- Clone output fields
73392ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) {
734eaf62fffSJeremy L Thompson     if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) {
7352b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
736eaf62fffSJeremy L Thompson     } else {
7372b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_restr,
7382b730f8bSJeremy L Thompson                                     op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec));
739eaf62fffSJeremy L Thompson     }
740eaf62fffSJeremy L Thompson   }
741af99e877SJeremy L Thompson   // -- Clone QFunctionAssemblyData
7422b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled));
743eaf62fffSJeremy L Thompson 
744eaf62fffSJeremy L Thompson   // Multiplicity vector
745eaf62fffSJeremy L Thompson   CeedVector mult_vec, mult_e_vec;
7462b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec));
7472b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(mult_e_vec, 0.0));
7482b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE));
7492b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(mult_vec, 0.0));
7502b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE));
7512b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_e_vec));
7522b730f8bSJeremy L Thompson   CeedCall(CeedVectorReciprocal(mult_vec));
753eaf62fffSJeremy L Thompson 
754addd79feSZach Atkins   // Clone name
755addd79feSZach Atkins   bool   has_name = op_fine->name;
756addd79feSZach Atkins   size_t name_len = op_fine->name ? strlen(op_fine->name) : 0;
757addd79feSZach Atkins   CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name));
758addd79feSZach Atkins 
759addd79feSZach Atkins   // Restriction/Prolongation Operators
760*83d6adf3SZach Atkins 
761*83d6adf3SZach Atkins   // Check that coarse to fine basis is provided if prolong/restrict operators are requested
762*83d6adf3SZach Atkins   if ((op_restrict || op_prolong) && !basis_c_to_f) {
763*83d6adf3SZach Atkins     // LCOV_EXCL_START
764*83d6adf3SZach Atkins     return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine basis");
765*83d6adf3SZach Atkins     // LCOV_EXCL_STOP
766*83d6adf3SZach Atkins   }
767*83d6adf3SZach Atkins 
768eaf62fffSJeremy L Thompson   CeedInt num_comp;
7692b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp));
770addd79feSZach Atkins 
771addd79feSZach Atkins   // Restriction
772addd79feSZach Atkins   if (op_restrict) {
773eaf62fffSJeremy L Thompson     CeedQFunction qf_restrict;
7742b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict));
775eaf62fffSJeremy L Thompson     CeedInt *num_comp_r_data;
7762b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_r_data));
777eaf62fffSJeremy L Thompson     num_comp_r_data[0] = num_comp;
778eaf62fffSJeremy L Thompson     CeedQFunctionContext ctx_r;
7792b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r));
7802b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data));
7812b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r));
7822b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_r));
7832b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE));
7842b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE));
7852b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP));
7862b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp));
787eaf62fffSJeremy L Thompson 
7882b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict));
7892b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
7902b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec));
7912b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
792eaf62fffSJeremy L Thompson 
793addd79feSZach Atkins     // Set name
794addd79feSZach Atkins     char *restriction_name;
795addd79feSZach Atkins     CeedCall(CeedCalloc(17 + name_len, &restriction_name));
796addd79feSZach Atkins     sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
797addd79feSZach Atkins     CeedCall(CeedOperatorSetName(*op_restrict, restriction_name));
798addd79feSZach Atkins     CeedCall(CeedFree(&restriction_name));
799addd79feSZach Atkins 
800addd79feSZach Atkins     // Check
801addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_restrict));
802addd79feSZach Atkins 
803addd79feSZach Atkins     // Cleanup
804addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_restrict));
805addd79feSZach Atkins   }
806addd79feSZach Atkins 
807eaf62fffSJeremy L Thompson   // Prolongation
808addd79feSZach Atkins   if (op_prolong) {
809eaf62fffSJeremy L Thompson     CeedQFunction qf_prolong;
8102b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong));
811eaf62fffSJeremy L Thompson     CeedInt *num_comp_p_data;
8122b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_p_data));
813eaf62fffSJeremy L Thompson     num_comp_p_data[0] = num_comp;
814eaf62fffSJeremy L Thompson     CeedQFunctionContext ctx_p;
8152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p));
8162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data));
8172b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p));
8182b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_p));
8192b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP));
8202b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE));
8212b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE));
8222b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp));
823eaf62fffSJeremy L Thompson 
8242b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong));
8252b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
8262b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec));
8272b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
828eaf62fffSJeremy L Thompson 
829addd79feSZach Atkins     // Set name
830ea6b5821SJeremy L Thompson     char *prolongation_name;
8312b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(18 + name_len, &prolongation_name));
8322b730f8bSJeremy L Thompson     sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
8332b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name));
8342b730f8bSJeremy L Thompson     CeedCall(CeedFree(&prolongation_name));
835addd79feSZach Atkins 
836addd79feSZach Atkins     // Check
837addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_prolong));
838addd79feSZach Atkins 
839addd79feSZach Atkins     // Cleanup
840addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_prolong));
841ea6b5821SJeremy L Thompson   }
842ea6b5821SJeremy L Thompson 
84358e4b056SJeremy L Thompson   // Check
84458e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_coarse));
84558e4b056SJeremy L Thompson 
846eaf62fffSJeremy L Thompson   // Cleanup
8472b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_vec));
8482b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&basis_c_to_f));
849805fe78eSJeremy L Thompson 
850eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
851eaf62fffSJeremy L Thompson }
852eaf62fffSJeremy L Thompson 
853eaf62fffSJeremy L Thompson /**
854eaf62fffSJeremy L Thompson   @brief Build 1D mass matrix and Laplacian with perturbation
855eaf62fffSJeremy L Thompson 
856eaf62fffSJeremy L Thompson   @param[in]  interp_1d   Interpolation matrix in one dimension
857eaf62fffSJeremy L Thompson   @param[in]  grad_1d     Gradient matrix in one dimension
858eaf62fffSJeremy L Thompson   @param[in]  q_weight_1d Quadrature weights in one dimension
859eaf62fffSJeremy L Thompson   @param[in]  P_1d        Number of basis nodes in one dimension
860eaf62fffSJeremy L Thompson   @param[in]  Q_1d        Number of quadrature points in one dimension
861eaf62fffSJeremy L Thompson   @param[in]  dim         Dimension of basis
862eaf62fffSJeremy L Thompson   @param[out] mass        Assembled mass matrix in one dimension
863eaf62fffSJeremy L Thompson   @param[out] laplace     Assembled perturbed Laplacian in one dimension
864eaf62fffSJeremy L Thompson 
865eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
866eaf62fffSJeremy L Thompson 
867eaf62fffSJeremy L Thompson   @ref Developer
868eaf62fffSJeremy L Thompson **/
8692b730f8bSJeremy L Thompson CeedPragmaOptimizeOff static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d,
8702b730f8bSJeremy L Thompson                                                       CeedInt P_1d, CeedInt Q_1d, CeedInt dim, CeedScalar *mass, CeedScalar *laplace) {
8712b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
872eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
873eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8742b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j];
875eaf62fffSJeremy L Thompson       mass[i + j * P_1d] = sum;
876eaf62fffSJeremy L Thompson     }
8772b730f8bSJeremy L Thompson   }
878eaf62fffSJeremy L Thompson   // -- Laplacian
8792b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
880eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
881eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8822b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j];
883eaf62fffSJeremy L Thompson       laplace[i + j * P_1d] = sum;
884eaf62fffSJeremy L Thompson     }
8852b730f8bSJeremy L Thompson   }
886eaf62fffSJeremy L Thompson   CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4;
8872b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation;
888eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
889eaf62fffSJeremy L Thompson }
890ea61e9acSJeremy L Thompson CeedPragmaOptimizeOn;
891eaf62fffSJeremy L Thompson 
892eaf62fffSJeremy L Thompson /// @}
893eaf62fffSJeremy L Thompson 
894eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
895480fae85SJeremy L Thompson /// CeedOperator Backend API
896480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
897480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend
898480fae85SJeremy L Thompson /// @{
899480fae85SJeremy L Thompson 
900480fae85SJeremy L Thompson /**
901480fae85SJeremy L Thompson   @brief Create object holding CeedQFunction assembly data for CeedOperator
902480fae85SJeremy L Thompson 
903480fae85SJeremy L Thompson   @param[in]  ceed A Ceed object where the CeedQFunctionAssemblyData will be created
904ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored
905480fae85SJeremy L Thompson 
906480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
907480fae85SJeremy L Thompson 
908480fae85SJeremy L Thompson   @ref Backend
909480fae85SJeremy L Thompson **/
910ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) {
9112b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
912480fae85SJeremy L Thompson   (*data)->ref_count = 1;
913480fae85SJeremy L Thompson   (*data)->ceed      = ceed;
9142b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
915480fae85SJeremy L Thompson 
916480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
917480fae85SJeremy L Thompson }
918480fae85SJeremy L Thompson 
919480fae85SJeremy L Thompson /**
920480fae85SJeremy L Thompson   @brief Increment the reference counter for a CeedQFunctionAssemblyData
921480fae85SJeremy L Thompson 
922ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter
923480fae85SJeremy L Thompson 
924480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
925480fae85SJeremy L Thompson 
926480fae85SJeremy L Thompson   @ref Backend
927480fae85SJeremy L Thompson **/
928480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) {
929480fae85SJeremy L Thompson   data->ref_count++;
930480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
931480fae85SJeremy L Thompson }
932480fae85SJeremy L Thompson 
933480fae85SJeremy L Thompson /**
934beecbf24SJeremy L Thompson   @brief Set re-use of CeedQFunctionAssemblyData
9358b919e6bSJeremy L Thompson 
936ea61e9acSJeremy L Thompson   @param[in,out] data       CeedQFunctionAssemblyData to mark for reuse
937ea61e9acSJeremy L Thompson   @param[in]     reuse_data Boolean flag indicating data re-use
9388b919e6bSJeremy L Thompson 
9398b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9408b919e6bSJeremy L Thompson 
9418b919e6bSJeremy L Thompson   @ref Backend
9428b919e6bSJeremy L Thompson **/
9432b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) {
944beecbf24SJeremy L Thompson   data->reuse_data        = reuse_data;
945beecbf24SJeremy L Thompson   data->needs_data_update = true;
946beecbf24SJeremy L Thompson   return CEED_ERROR_SUCCESS;
947beecbf24SJeremy L Thompson }
948beecbf24SJeremy L Thompson 
949beecbf24SJeremy L Thompson /**
950beecbf24SJeremy L Thompson   @brief Mark QFunctionAssemblyData as stale
951beecbf24SJeremy L Thompson 
952ea61e9acSJeremy L Thompson   @param[in,out] data              CeedQFunctionAssemblyData to mark as stale
953ea61e9acSJeremy L Thompson   @param[in]     needs_data_update Boolean flag indicating if update is needed or completed
954beecbf24SJeremy L Thompson 
955beecbf24SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
956beecbf24SJeremy L Thompson 
957beecbf24SJeremy L Thompson   @ref Backend
958beecbf24SJeremy L Thompson **/
9592b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) {
960beecbf24SJeremy L Thompson   data->needs_data_update = needs_data_update;
9618b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9628b919e6bSJeremy L Thompson }
9638b919e6bSJeremy L Thompson 
9648b919e6bSJeremy L Thompson /**
9658b919e6bSJeremy L Thompson   @brief Determine if QFunctionAssemblyData needs update
9668b919e6bSJeremy L Thompson 
9678b919e6bSJeremy L Thompson   @param[in]  data             CeedQFunctionAssemblyData to mark as stale
9688b919e6bSJeremy L Thompson   @param[out] is_update_needed Boolean flag indicating if re-assembly is required
9698b919e6bSJeremy L Thompson 
9708b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9718b919e6bSJeremy L Thompson 
9728b919e6bSJeremy L Thompson   @ref Backend
9738b919e6bSJeremy L Thompson **/
9742b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) {
975beecbf24SJeremy L Thompson   *is_update_needed = !data->reuse_data || data->needs_data_update;
9768b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9778b919e6bSJeremy L Thompson }
9788b919e6bSJeremy L Thompson 
9798b919e6bSJeremy L Thompson /**
980ea61e9acSJeremy L Thompson   @brief Copy the pointer to a CeedQFunctionAssemblyData.
981ea61e9acSJeremy L Thompson            Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`.
982ea61e9acSJeremy L Thompson            Note: If `*data_copy` is non-NULL, then it is assumed that `*data_copy` is a pointer to a CeedQFunctionAssemblyData.
983ea61e9acSJeremy L Thompson              This CeedQFunctionAssemblyData will be destroyed if `*data_copy` is the only reference to this CeedQFunctionAssemblyData.
984480fae85SJeremy L Thompson 
985ea61e9acSJeremy L Thompson   @param[in]     data      CeedQFunctionAssemblyData to copy reference to
986ea61e9acSJeremy L Thompson   @param[in,out] data_copy Variable to store copied reference
987480fae85SJeremy L Thompson 
988480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
989480fae85SJeremy L Thompson 
990480fae85SJeremy L Thompson   @ref Backend
991480fae85SJeremy L Thompson **/
9922b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) {
9932b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReference(data));
9942b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy));
995480fae85SJeremy L Thompson   *data_copy = data;
996480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
997480fae85SJeremy L Thompson }
998480fae85SJeremy L Thompson 
999480fae85SJeremy L Thompson /**
1000480fae85SJeremy L Thompson   @brief Get setup status for internal objects for CeedQFunctionAssemblyData
1001480fae85SJeremy L Thompson 
1002ea61e9acSJeremy L Thompson   @param[in]  data     CeedQFunctionAssemblyData to retrieve status
1003480fae85SJeremy L Thompson   @param[out] is_setup Boolean flag for setup status
1004480fae85SJeremy L Thompson 
1005480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1006480fae85SJeremy L Thompson 
1007480fae85SJeremy L Thompson   @ref Backend
1008480fae85SJeremy L Thompson **/
10092b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) {
1010480fae85SJeremy L Thompson   *is_setup = data->is_setup;
1011480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1012480fae85SJeremy L Thompson }
1013480fae85SJeremy L Thompson 
1014480fae85SJeremy L Thompson /**
1015480fae85SJeremy L Thompson   @brief Set internal objects for CeedQFunctionAssemblyData
1016480fae85SJeremy L Thompson 
1017ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to set objects
1018480fae85SJeremy L Thompson   @param[in]     vec  CeedVector to store assembled CeedQFunction at quadrature points
1019480fae85SJeremy L Thompson   @param[in]     rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction
1020480fae85SJeremy L Thompson 
1021480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1022480fae85SJeremy L Thompson 
1023480fae85SJeremy L Thompson   @ref Backend
1024480fae85SJeremy L Thompson **/
10252b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) {
10262b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(vec, &data->vec));
10272b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr));
1028480fae85SJeremy L Thompson 
1029480fae85SJeremy L Thompson   data->is_setup = true;
1030480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1031480fae85SJeremy L Thompson }
1032480fae85SJeremy L Thompson 
10332b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) {
10342b730f8bSJeremy L Thompson   if (!data->is_setup) {
1035480fae85SJeremy L Thompson     // LCOV_EXCL_START
10362b730f8bSJeremy L Thompson     return CeedError(data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first.");
1037480fae85SJeremy L Thompson     // LCOV_EXCL_STOP
10382b730f8bSJeremy L Thompson   }
1039480fae85SJeremy L Thompson 
10402b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(data->vec, vec));
10412b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr));
1042480fae85SJeremy L Thompson 
1043480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1044480fae85SJeremy L Thompson }
1045480fae85SJeremy L Thompson 
1046480fae85SJeremy L Thompson /**
1047480fae85SJeremy L Thompson   @brief Destroy CeedQFunctionAssemblyData
1048480fae85SJeremy L Thompson 
1049ea61e9acSJeremy L Thompson   @param[in,out] data  CeedQFunctionAssemblyData to destroy
1050480fae85SJeremy L Thompson 
1051480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1052480fae85SJeremy L Thompson 
1053480fae85SJeremy L Thompson   @ref Backend
1054480fae85SJeremy L Thompson **/
1055480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) {
1056480fae85SJeremy L Thompson   if (!*data || --(*data)->ref_count > 0) return CEED_ERROR_SUCCESS;
1057480fae85SJeremy L Thompson 
10582b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
10592b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&(*data)->vec));
10602b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr));
1061480fae85SJeremy L Thompson 
10622b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1063480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1064480fae85SJeremy L Thompson }
1065480fae85SJeremy L Thompson 
1066ed9e99e6SJeremy L Thompson /**
1067ed9e99e6SJeremy L Thompson   @brief Get CeedOperatorAssemblyData
1068ed9e99e6SJeremy L Thompson 
1069ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to assemble
1070ed9e99e6SJeremy L Thompson   @param[out] data CeedQFunctionAssemblyData
1071ed9e99e6SJeremy L Thompson 
1072ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1073ed9e99e6SJeremy L Thompson 
1074ed9e99e6SJeremy L Thompson   @ref Backend
1075ed9e99e6SJeremy L Thompson **/
10762b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) {
1077ed9e99e6SJeremy L Thompson   if (!op->op_assembled) {
1078ed9e99e6SJeremy L Thompson     CeedOperatorAssemblyData data;
1079ed9e99e6SJeremy L Thompson 
10802b730f8bSJeremy L Thompson     CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data));
1081ed9e99e6SJeremy L Thompson     op->op_assembled = data;
1082ed9e99e6SJeremy L Thompson   }
1083ed9e99e6SJeremy L Thompson   *data = op->op_assembled;
1084ed9e99e6SJeremy L Thompson 
1085ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1086ed9e99e6SJeremy L Thompson }
1087ed9e99e6SJeremy L Thompson 
1088ed9e99e6SJeremy L Thompson /**
1089ed9e99e6SJeremy L Thompson   @brief Create object holding CeedOperator assembly data
1090ed9e99e6SJeremy L Thompson 
1091ea61e9acSJeremy L Thompson   @param[in]  ceed Ceed object where the CeedOperatorAssemblyData will be created
1092ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to be assembled
1093ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored
1094ed9e99e6SJeremy L Thompson 
1095ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1096ed9e99e6SJeremy L Thompson 
1097ed9e99e6SJeremy L Thompson   @ref Backend
1098ed9e99e6SJeremy L Thompson **/
10992b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) {
11002b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1101ed9e99e6SJeremy L Thompson   (*data)->ceed = ceed;
11022b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1103ed9e99e6SJeremy L Thompson 
1104ed9e99e6SJeremy L Thompson   // Build OperatorAssembly data
1105ed9e99e6SJeremy L Thompson   CeedQFunction       qf;
1106ed9e99e6SJeremy L Thompson   CeedQFunctionField *qf_fields;
1107ed9e99e6SJeremy L Thompson   CeedOperatorField  *op_fields;
1108ed9e99e6SJeremy L Thompson   CeedInt             num_input_fields;
11092b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
11102b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL));
11112b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL));
1112ed9e99e6SJeremy L Thompson 
1113ed9e99e6SJeremy L Thompson   // Determine active input basis
1114ed9e99e6SJeremy L Thompson   CeedInt       num_eval_mode_in = 0, dim = 1;
1115ed9e99e6SJeremy L Thompson   CeedEvalMode *eval_mode_in = NULL;
1116ed9e99e6SJeremy L Thompson   CeedBasis     basis_in     = NULL;
1117ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
1118ed9e99e6SJeremy L Thompson     CeedVector vec;
11192b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1120ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
11212b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in));
11222b730f8bSJeremy L Thompson       CeedCall(CeedBasisGetDimension(basis_in, &dim));
1123ed9e99e6SJeremy L Thompson       CeedEvalMode eval_mode;
11242b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1125ed9e99e6SJeremy L Thompson       switch (eval_mode) {
1126ed9e99e6SJeremy L Thompson         case CEED_EVAL_NONE:
1127ed9e99e6SJeremy L Thompson         case CEED_EVAL_INTERP:
11282b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_in + 1, &eval_mode_in));
1129ed9e99e6SJeremy L Thompson           eval_mode_in[num_eval_mode_in] = eval_mode;
1130ed9e99e6SJeremy L Thompson           num_eval_mode_in += 1;
1131ed9e99e6SJeremy L Thompson           break;
1132ed9e99e6SJeremy L Thompson         case CEED_EVAL_GRAD:
11332b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_in + dim, &eval_mode_in));
1134ed9e99e6SJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
1135ed9e99e6SJeremy L Thompson             eval_mode_in[num_eval_mode_in + d] = eval_mode;
1136ed9e99e6SJeremy L Thompson           }
1137ed9e99e6SJeremy L Thompson           num_eval_mode_in += dim;
1138ed9e99e6SJeremy L Thompson           break;
1139ed9e99e6SJeremy L Thompson         case CEED_EVAL_WEIGHT:
1140ed9e99e6SJeremy L Thompson         case CEED_EVAL_DIV:
1141ed9e99e6SJeremy L Thompson         case CEED_EVAL_CURL:
1142ed9e99e6SJeremy L Thompson           break;  // Caught by QF Assembly
1143ed9e99e6SJeremy L Thompson       }
1144ed9e99e6SJeremy L Thompson     }
1145ed9e99e6SJeremy L Thompson   }
1146ed9e99e6SJeremy L Thompson   (*data)->num_eval_mode_in = num_eval_mode_in;
1147ed9e99e6SJeremy L Thompson   (*data)->eval_mode_in     = eval_mode_in;
11482b730f8bSJeremy L Thompson   CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->basis_in));
1149ed9e99e6SJeremy L Thompson 
1150ed9e99e6SJeremy L Thompson   // Determine active output basis
1151ed9e99e6SJeremy L Thompson   CeedInt num_output_fields;
11522b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields));
11532b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields));
1154ed9e99e6SJeremy L Thompson   CeedInt       num_eval_mode_out = 0;
1155ed9e99e6SJeremy L Thompson   CeedEvalMode *eval_mode_out     = NULL;
1156ed9e99e6SJeremy L Thompson   CeedBasis     basis_out         = NULL;
1157ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_output_fields; i++) {
1158ed9e99e6SJeremy L Thompson     CeedVector vec;
11592b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1160ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
11612b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out));
1162ed9e99e6SJeremy L Thompson       CeedEvalMode eval_mode;
11632b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1164ed9e99e6SJeremy L Thompson       switch (eval_mode) {
1165ed9e99e6SJeremy L Thompson         case CEED_EVAL_NONE:
1166ed9e99e6SJeremy L Thompson         case CEED_EVAL_INTERP:
11672b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_out + 1, &eval_mode_out));
1168ed9e99e6SJeremy L Thompson           eval_mode_out[num_eval_mode_out] = eval_mode;
1169ed9e99e6SJeremy L Thompson           num_eval_mode_out += 1;
1170ed9e99e6SJeremy L Thompson           break;
1171ed9e99e6SJeremy L Thompson         case CEED_EVAL_GRAD:
11722b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_out + dim, &eval_mode_out));
1173ed9e99e6SJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
1174ed9e99e6SJeremy L Thompson             eval_mode_out[num_eval_mode_out + d] = eval_mode;
1175ed9e99e6SJeremy L Thompson           }
1176ed9e99e6SJeremy L Thompson           num_eval_mode_out += dim;
1177ed9e99e6SJeremy L Thompson           break;
1178ed9e99e6SJeremy L Thompson         case CEED_EVAL_WEIGHT:
1179ed9e99e6SJeremy L Thompson         case CEED_EVAL_DIV:
1180ed9e99e6SJeremy L Thompson         case CEED_EVAL_CURL:
1181ed9e99e6SJeremy L Thompson           break;  // Caught by QF Assembly
1182ed9e99e6SJeremy L Thompson       }
1183ed9e99e6SJeremy L Thompson     }
1184ed9e99e6SJeremy L Thompson   }
1185ed9e99e6SJeremy L Thompson   (*data)->num_eval_mode_out = num_eval_mode_out;
1186ed9e99e6SJeremy L Thompson   (*data)->eval_mode_out     = eval_mode_out;
11872b730f8bSJeremy L Thompson   CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->basis_out));
1188ed9e99e6SJeremy L Thompson 
1189ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1190ed9e99e6SJeremy L Thompson }
1191ed9e99e6SJeremy L Thompson 
1192ed9e99e6SJeremy L Thompson /**
1193ed9e99e6SJeremy L Thompson   @brief Get CeedOperator CeedEvalModes for assembly
1194ed9e99e6SJeremy L Thompson 
1195ed9e99e6SJeremy L Thompson   @param[in]  data              CeedOperatorAssemblyData
1196ed9e99e6SJeremy L Thompson   @param[out] num_eval_mode_in  Pointer to hold number of input CeedEvalModes, or NULL
1197ed9e99e6SJeremy L Thompson   @param[out] eval_mode_in      Pointer to hold input CeedEvalModes, or NULL
1198ed9e99e6SJeremy L Thompson   @param[out] num_eval_mode_out Pointer to hold number of output CeedEvalModes, or NULL
1199ed9e99e6SJeremy L Thompson   @param[out] eval_mode_out     Pointer to hold output CeedEvalModes, or NULL
1200ed9e99e6SJeremy L Thompson 
1201ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1202ed9e99e6SJeremy L Thompson 
1203ed9e99e6SJeremy L Thompson   @ref Backend
1204ed9e99e6SJeremy L Thompson **/
12052b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_eval_mode_in, const CeedEvalMode **eval_mode_in,
1206ed9e99e6SJeremy L Thompson                                          CeedInt *num_eval_mode_out, const CeedEvalMode **eval_mode_out) {
1207ed9e99e6SJeremy L Thompson   if (num_eval_mode_in) *num_eval_mode_in = data->num_eval_mode_in;
1208ed9e99e6SJeremy L Thompson   if (eval_mode_in) *eval_mode_in = data->eval_mode_in;
1209ed9e99e6SJeremy L Thompson   if (num_eval_mode_out) *num_eval_mode_out = data->num_eval_mode_out;
1210ed9e99e6SJeremy L Thompson   if (eval_mode_out) *eval_mode_out = data->eval_mode_out;
1211ed9e99e6SJeremy L Thompson 
1212ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1213ed9e99e6SJeremy L Thompson }
1214ed9e99e6SJeremy L Thompson 
1215ed9e99e6SJeremy L Thompson /**
1216ed9e99e6SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly
1217ed9e99e6SJeremy L Thompson 
1218ed9e99e6SJeremy L Thompson   @param[in]  data      CeedOperatorAssemblyData
1219ed9e99e6SJeremy L Thompson   @param[out] basis_in  Pointer to hold active input CeedBasis, or NULL
1220ed9e99e6SJeremy L Thompson   @param[out] B_in      Pointer to hold assembled active input B, or NULL
1221ed9e99e6SJeremy L Thompson   @param[out] basis_out Pointer to hold active output CeedBasis, or NULL
1222ed9e99e6SJeremy L Thompson   @param[out] B_out     Pointer to hold assembled active output B, or NULL
1223ed9e99e6SJeremy L Thompson 
1224ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1225ed9e99e6SJeremy L Thompson 
1226ed9e99e6SJeremy L Thompson   @ref Backend
1227ed9e99e6SJeremy L Thompson **/
12282b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedBasis *basis_in, const CeedScalar **B_in, CeedBasis *basis_out,
1229ed9e99e6SJeremy L Thompson                                      const CeedScalar **B_out) {
1230ed9e99e6SJeremy L Thompson   // Assemble B_in, B_out if needed
1231ed9e99e6SJeremy L Thompson   if (B_in && !data->B_in) {
1232ed9e99e6SJeremy L Thompson     CeedInt           num_qpts, elem_size;
1233ed9e99e6SJeremy L Thompson     CeedScalar       *B_in, *identity = NULL;
1234ed9e99e6SJeremy L Thompson     const CeedScalar *interp_in, *grad_in;
1235ed9e99e6SJeremy L Thompson     bool              has_eval_none = false;
1236ed9e99e6SJeremy L Thompson 
12372b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_in, &num_qpts));
12382b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(data->basis_in, &elem_size));
12392b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_in, &B_in));
1240ed9e99e6SJeremy L Thompson 
1241ed9e99e6SJeremy L Thompson     for (CeedInt i = 0; i < data->num_eval_mode_in; i++) {
1242ed9e99e6SJeremy L Thompson       has_eval_none = has_eval_none || (data->eval_mode_in[i] == CEED_EVAL_NONE);
1243ed9e99e6SJeremy L Thompson     }
1244ed9e99e6SJeremy L Thompson     if (has_eval_none) {
12452b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * elem_size, &identity));
1246ed9e99e6SJeremy L Thompson       for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) {
1247ed9e99e6SJeremy L Thompson         identity[i * elem_size + i] = 1.0;
1248ed9e99e6SJeremy L Thompson       }
1249ed9e99e6SJeremy L Thompson     }
12502b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetInterp(data->basis_in, &interp_in));
12512b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetGrad(data->basis_in, &grad_in));
1252ed9e99e6SJeremy L Thompson 
1253ed9e99e6SJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
1254ed9e99e6SJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) {
1255ed9e99e6SJeremy L Thompson         CeedInt d_in = -1;
1256ed9e99e6SJeremy L Thompson         for (CeedInt e_in = 0; e_in < data->num_eval_mode_in; e_in++) {
1257ed9e99e6SJeremy L Thompson           const CeedInt     qq = data->num_eval_mode_in * q;
1258ed9e99e6SJeremy L Thompson           const CeedScalar *b  = NULL;
1259ed9e99e6SJeremy L Thompson 
1260ed9e99e6SJeremy L Thompson           if (data->eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in++;
12612b730f8bSJeremy L Thompson           CeedOperatorGetBasisPointer(data->eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * elem_size], &b);
1262ed9e99e6SJeremy L Thompson           B_in[(qq + e_in) * elem_size + n] = b[q * elem_size + n];
1263ed9e99e6SJeremy L Thompson         }
1264ed9e99e6SJeremy L Thompson       }
1265ed9e99e6SJeremy L Thompson     }
1266ed9e99e6SJeremy L Thompson     data->B_in = B_in;
1267ed9e99e6SJeremy L Thompson   }
1268ed9e99e6SJeremy L Thompson 
1269ed9e99e6SJeremy L Thompson   if (B_out && !data->B_out) {
1270ed9e99e6SJeremy L Thompson     CeedInt           num_qpts, elem_size;
1271ed9e99e6SJeremy L Thompson     CeedScalar       *B_out, *identity = NULL;
1272ed9e99e6SJeremy L Thompson     const CeedScalar *interp_out, *grad_out;
1273ed9e99e6SJeremy L Thompson     bool              has_eval_none = false;
1274ed9e99e6SJeremy L Thompson 
12752b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_out, &num_qpts));
12762b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(data->basis_out, &elem_size));
12772b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_out, &B_out));
1278ed9e99e6SJeremy L Thompson 
1279ed9e99e6SJeremy L Thompson     for (CeedInt i = 0; i < data->num_eval_mode_out; i++) {
1280ed9e99e6SJeremy L Thompson       has_eval_none = has_eval_none || (data->eval_mode_out[i] == CEED_EVAL_NONE);
1281ed9e99e6SJeremy L Thompson     }
1282ed9e99e6SJeremy L Thompson     if (has_eval_none) {
12832b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * elem_size, &identity));
1284ed9e99e6SJeremy L Thompson       for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) {
1285ed9e99e6SJeremy L Thompson         identity[i * elem_size + i] = 1.0;
1286ed9e99e6SJeremy L Thompson       }
1287ed9e99e6SJeremy L Thompson     }
12882b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetInterp(data->basis_out, &interp_out));
12892b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetGrad(data->basis_out, &grad_out));
1290ed9e99e6SJeremy L Thompson 
1291ed9e99e6SJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
1292ed9e99e6SJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) {
1293ed9e99e6SJeremy L Thompson         CeedInt d_out = -1;
1294ed9e99e6SJeremy L Thompson         for (CeedInt e_out = 0; e_out < data->num_eval_mode_out; e_out++) {
1295ed9e99e6SJeremy L Thompson           const CeedInt     qq = data->num_eval_mode_out * q;
1296ed9e99e6SJeremy L Thompson           const CeedScalar *b  = NULL;
1297ed9e99e6SJeremy L Thompson 
1298ed9e99e6SJeremy L Thompson           if (data->eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out++;
12992b730f8bSJeremy L Thompson           CeedOperatorGetBasisPointer(data->eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * elem_size], &b);
1300ed9e99e6SJeremy L Thompson           B_out[(qq + e_out) * elem_size + n] = b[q * elem_size + n];
1301ed9e99e6SJeremy L Thompson         }
1302ed9e99e6SJeremy L Thompson       }
1303ed9e99e6SJeremy L Thompson     }
1304ed9e99e6SJeremy L Thompson     data->B_out = B_out;
1305ed9e99e6SJeremy L Thompson   }
1306ed9e99e6SJeremy L Thompson 
1307ed9e99e6SJeremy L Thompson   if (basis_in) *basis_in = data->basis_in;
1308ed9e99e6SJeremy L Thompson   if (B_in) *B_in = data->B_in;
1309ed9e99e6SJeremy L Thompson   if (basis_out) *basis_out = data->basis_out;
1310ed9e99e6SJeremy L Thompson   if (B_out) *B_out = data->B_out;
1311ed9e99e6SJeremy L Thompson 
1312ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1313ed9e99e6SJeremy L Thompson }
1314ed9e99e6SJeremy L Thompson 
1315ed9e99e6SJeremy L Thompson /**
1316ed9e99e6SJeremy L Thompson   @brief Destroy CeedOperatorAssemblyData
1317ed9e99e6SJeremy L Thompson 
1318ea61e9acSJeremy L Thompson   @param[in,out] data CeedOperatorAssemblyData to destroy
1319ed9e99e6SJeremy L Thompson 
1320ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1321ed9e99e6SJeremy L Thompson 
1322ed9e99e6SJeremy L Thompson   @ref Backend
1323ed9e99e6SJeremy L Thompson **/
1324ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) {
1325ed9e99e6SJeremy L Thompson   if (!*data) return CEED_ERROR_SUCCESS;
1326ed9e99e6SJeremy L Thompson 
13272b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
13282b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&(*data)->basis_in));
13292b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&(*data)->basis_out));
13302b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_in));
13312b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_out));
13322b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->B_in));
13332b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->B_out));
1334ed9e99e6SJeremy L Thompson 
13352b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1336ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1337ed9e99e6SJeremy L Thompson }
1338ed9e99e6SJeremy L Thompson 
1339480fae85SJeremy L Thompson /// @}
1340480fae85SJeremy L Thompson 
1341480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1342eaf62fffSJeremy L Thompson /// CeedOperator Public API
1343eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1344eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser
1345eaf62fffSJeremy L Thompson /// @{
1346eaf62fffSJeremy L Thompson 
1347eaf62fffSJeremy L Thompson /**
1348eaf62fffSJeremy L Thompson   @brief Assemble a linear CeedQFunction associated with a CeedOperator
1349eaf62fffSJeremy L Thompson 
1350ea61e9acSJeremy L Thompson   This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator.
1351ea61e9acSJeremy L Thompson     The vector 'assembled' is of shape [num_elements, num_input_fields, num_output_fields, num_quad_points] and contains column-major matrices
1352ea61e9acSJeremy L Thompson representing the action of the CeedQFunction for a corresponding quadrature point on an element. Inputs and outputs are in the order provided by the
1353ea61e9acSJeremy L Thompson user when adding CeedOperator fields. For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order,
1354ea61e9acSJeremy L Thompson would result in an assembled QFunction that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1]
1355ea61e9acSJeremy L Thompson and producing the output [dv_0, dv_1, v].
1356eaf62fffSJeremy L Thompson 
1357ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1358f04ea552SJeremy L Thompson 
1359ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1360ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1361ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
1362ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1363eaf62fffSJeremy L Thompson 
1364eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1365eaf62fffSJeremy L Thompson 
1366eaf62fffSJeremy L Thompson   @ref User
1367eaf62fffSJeremy L Thompson **/
13682b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
13692b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1370eaf62fffSJeremy L Thompson 
1371eaf62fffSJeremy L Thompson   if (op->LinearAssembleQFunction) {
1372d04bbc78SJeremy L Thompson     // Backend version
13732b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request));
1374eaf62fffSJeremy L Thompson   } else {
1375d04bbc78SJeremy L Thompson     // Operator fallback
1376d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1377d04bbc78SJeremy L Thompson 
13782b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1379d04bbc78SJeremy L Thompson     if (op_fallback) {
13802b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request));
1381d04bbc78SJeremy L Thompson     } else {
1382d04bbc78SJeremy L Thompson       // LCOV_EXCL_START
13832b730f8bSJeremy L Thompson       return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction");
1384d04bbc78SJeremy L Thompson       // LCOV_EXCL_STOP
1385d04bbc78SJeremy L Thompson     }
138670a7ffb3SJeremy L Thompson   }
1387eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1388eaf62fffSJeremy L Thompson }
138970a7ffb3SJeremy L Thompson 
139070a7ffb3SJeremy L Thompson /**
1391ea61e9acSJeremy L Thompson   @brief Assemble CeedQFunction and store result internally.
1392ea61e9acSJeremy L Thompson            Return copied references of stored data to the caller.
1393ea61e9acSJeremy L Thompson            Caller is responsible for ownership and destruction of the copied references.
1394ea61e9acSJeremy L Thompson            See also @ref CeedOperatorLinearAssembleQFunction
139570a7ffb3SJeremy L Thompson 
1396ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1397ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1398ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembledCeedQFunction
1399ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
140070a7ffb3SJeremy L Thompson 
140170a7ffb3SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
140270a7ffb3SJeremy L Thompson 
140370a7ffb3SJeremy L Thompson   @ref User
140470a7ffb3SJeremy L Thompson **/
14052b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
14062b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
140770a7ffb3SJeremy L Thompson 
140870a7ffb3SJeremy L Thompson   if (op->LinearAssembleQFunctionUpdate) {
1409d04bbc78SJeremy L Thompson     // Backend version
1410480fae85SJeremy L Thompson     bool                qf_assembled_is_setup;
14112efa2d85SJeremy L Thompson     CeedVector          assembled_vec  = NULL;
14122efa2d85SJeremy L Thompson     CeedElemRestriction assembled_rstr = NULL;
1413480fae85SJeremy L Thompson 
14142b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup));
1415480fae85SJeremy L Thompson     if (qf_assembled_is_setup) {
1416d04bbc78SJeremy L Thompson       bool update_needed;
1417d04bbc78SJeremy L Thompson 
14182b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr));
14192b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed));
14208b919e6bSJeremy L Thompson       if (update_needed) {
14212b730f8bSJeremy L Thompson         CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request));
14228b919e6bSJeremy L Thompson       }
142370a7ffb3SJeremy L Thompson     } else {
14242b730f8bSJeremy L Thompson       CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request));
14252b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr));
142670a7ffb3SJeremy L Thompson     }
14272b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false));
14282efa2d85SJeremy L Thompson 
1429d04bbc78SJeremy L Thompson     // Copy reference from internally held copy
143070a7ffb3SJeremy L Thompson     *assembled = NULL;
143170a7ffb3SJeremy L Thompson     *rstr      = NULL;
14322b730f8bSJeremy L Thompson     CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled));
14332b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled_vec));
14342b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr));
14352b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&assembled_rstr));
143670a7ffb3SJeremy L Thompson   } else {
1437d04bbc78SJeremy L Thompson     // Operator fallback
1438d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1439d04bbc78SJeremy L Thompson 
14402b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1441d04bbc78SJeremy L Thompson     if (op_fallback) {
14422b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request));
1443d04bbc78SJeremy L Thompson     } else {
1444d04bbc78SJeremy L Thompson       // LCOV_EXCL_START
14452b730f8bSJeremy L Thompson       return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate");
1446d04bbc78SJeremy L Thompson       // LCOV_EXCL_STOP
144770a7ffb3SJeremy L Thompson     }
144870a7ffb3SJeremy L Thompson   }
144970a7ffb3SJeremy L Thompson 
145070a7ffb3SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1451eaf62fffSJeremy L Thompson }
1452eaf62fffSJeremy L Thompson 
1453eaf62fffSJeremy L Thompson /**
1454eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1455eaf62fffSJeremy L Thompson 
1456eaf62fffSJeremy L Thompson   This overwrites a CeedVector with the diagonal of a linear CeedOperator.
1457eaf62fffSJeremy L Thompson 
1458ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1459eaf62fffSJeremy L Thompson 
1460ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1461f04ea552SJeremy L Thompson 
1462ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1463eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1464ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1465eaf62fffSJeremy L Thompson 
1466eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1467eaf62fffSJeremy L Thompson 
1468eaf62fffSJeremy L Thompson   @ref User
1469eaf62fffSJeremy L Thompson **/
14702b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1471f3d47e36SJeremy L Thompson   bool is_composite;
14722b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1473f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1474eaf62fffSJeremy L Thompson 
1475c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
14762b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
14772b730f8bSJeremy L Thompson   if (input_size != output_size) {
1478c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1479c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1480c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
14812b730f8bSJeremy L Thompson   }
1482c9366a6bSJeremy L Thompson 
1483f3d47e36SJeremy L Thompson   // Early exit for empty operator
1484f3d47e36SJeremy L Thompson   if (!is_composite) {
1485f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1486f3d47e36SJeremy L Thompson 
1487f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1488f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1489f3d47e36SJeremy L Thompson   }
1490f3d47e36SJeremy L Thompson 
1491eaf62fffSJeremy L Thompson   if (op->LinearAssembleDiagonal) {
1492d04bbc78SJeremy L Thompson     // Backend version
14932b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleDiagonal(op, assembled, request));
1494eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1495eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddDiagonal) {
1496d04bbc78SJeremy L Thompson     // Backend version with zeroing first
14972b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
14982b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1499eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1500eaf62fffSJeremy L Thompson   } else {
1501d04bbc78SJeremy L Thompson     // Operator fallback
1502d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1503d04bbc78SJeremy L Thompson 
15042b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1505d04bbc78SJeremy L Thompson     if (op_fallback) {
15062b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request));
1507eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1508eaf62fffSJeremy L Thompson     }
1509eaf62fffSJeremy L Thompson   }
1510eaf62fffSJeremy L Thompson   // Default interface implementation
15112b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
15122b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request));
1513d04bbc78SJeremy L Thompson 
1514eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1515eaf62fffSJeremy L Thompson }
1516eaf62fffSJeremy L Thompson 
1517eaf62fffSJeremy L Thompson /**
1518eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1519eaf62fffSJeremy L Thompson 
1520eaf62fffSJeremy L Thompson   This sums into a CeedVector the diagonal of a linear CeedOperator.
1521eaf62fffSJeremy L Thompson 
1522ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1523eaf62fffSJeremy L Thompson 
1524ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1525f04ea552SJeremy L Thompson 
1526ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1527eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1528ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1529eaf62fffSJeremy L Thompson 
1530eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1531eaf62fffSJeremy L Thompson 
1532eaf62fffSJeremy L Thompson   @ref User
1533eaf62fffSJeremy L Thompson **/
15342b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1535f3d47e36SJeremy L Thompson   bool is_composite;
15362b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1537f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1538eaf62fffSJeremy L Thompson 
1539c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
15402b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
15412b730f8bSJeremy L Thompson   if (input_size != output_size) {
1542c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1543c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1544c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
15452b730f8bSJeremy L Thompson   }
1546c9366a6bSJeremy L Thompson 
1547f3d47e36SJeremy L Thompson   // Early exit for empty operator
1548f3d47e36SJeremy L Thompson   if (!is_composite) {
1549f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1550f3d47e36SJeremy L Thompson 
1551f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1552f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1553f3d47e36SJeremy L Thompson   }
1554f3d47e36SJeremy L Thompson 
1555eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddDiagonal) {
1556d04bbc78SJeremy L Thompson     // Backend version
15572b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1558eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1559eaf62fffSJeremy L Thompson   } else {
1560d04bbc78SJeremy L Thompson     // Operator fallback
1561d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1562d04bbc78SJeremy L Thompson 
15632b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1564d04bbc78SJeremy L Thompson     if (op_fallback) {
15652b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request));
1566eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1567eaf62fffSJeremy L Thompson     }
1568eaf62fffSJeremy L Thompson   }
1569eaf62fffSJeremy L Thompson   // Default interface implementation
1570eaf62fffSJeremy L Thompson   if (is_composite) {
15712b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled));
1572eaf62fffSJeremy L Thompson   } else {
15732b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled));
1574eaf62fffSJeremy L Thompson   }
1575d04bbc78SJeremy L Thompson 
1576d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1577eaf62fffSJeremy L Thompson }
1578eaf62fffSJeremy L Thompson 
1579eaf62fffSJeremy L Thompson /**
1580eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1581eaf62fffSJeremy L Thompson 
1582ea61e9acSJeremy L Thompson   This overwrites a CeedVector with the point block diagonal of a linear CeedOperator.
1583eaf62fffSJeremy L Thompson 
1584ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1585eaf62fffSJeremy L Thompson 
1586ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1587f04ea552SJeremy L Thompson 
1588ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1589ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1590ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1591ea61e9acSJeremy L Thompson component in].
1592ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1593eaf62fffSJeremy L Thompson 
1594eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1595eaf62fffSJeremy L Thompson 
1596eaf62fffSJeremy L Thompson   @ref User
1597eaf62fffSJeremy L Thompson **/
15982b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1599f3d47e36SJeremy L Thompson   bool is_composite;
16002b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1601f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1602eaf62fffSJeremy L Thompson 
1603c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16042b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16052b730f8bSJeremy L Thompson   if (input_size != output_size) {
1606c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1607c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1608c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
16092b730f8bSJeremy L Thompson   }
1610c9366a6bSJeremy L Thompson 
1611f3d47e36SJeremy L Thompson   // Early exit for empty operator
1612f3d47e36SJeremy L Thompson   if (!is_composite) {
1613f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1614f3d47e36SJeremy L Thompson 
1615f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1616f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1617f3d47e36SJeremy L Thompson   }
1618f3d47e36SJeremy L Thompson 
1619eaf62fffSJeremy L Thompson   if (op->LinearAssemblePointBlockDiagonal) {
1620d04bbc78SJeremy L Thompson     // Backend version
16212b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request));
1622eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1623eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddPointBlockDiagonal) {
1624d04bbc78SJeremy L Thompson     // Backend version with zeroing first
16252b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
16262b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1627eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1628eaf62fffSJeremy L Thompson   } else {
1629d04bbc78SJeremy L Thompson     // Operator fallback
1630d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1631d04bbc78SJeremy L Thompson 
16322b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1633d04bbc78SJeremy L Thompson     if (op_fallback) {
16342b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request));
1635eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1636eaf62fffSJeremy L Thompson     }
1637eaf62fffSJeremy L Thompson   }
1638eaf62fffSJeremy L Thompson   // Default interface implementation
16392b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
16402b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1641d04bbc78SJeremy L Thompson 
1642eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1643eaf62fffSJeremy L Thompson }
1644eaf62fffSJeremy L Thompson 
1645eaf62fffSJeremy L Thompson /**
1646eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1647eaf62fffSJeremy L Thompson 
1648ea61e9acSJeremy L Thompson   This sums into a CeedVector with the point block diagonal of a linear CeedOperator.
1649eaf62fffSJeremy L Thompson 
1650ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1651eaf62fffSJeremy L Thompson 
1652ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1653f04ea552SJeremy L Thompson 
1654ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1655ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1656ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1657ea61e9acSJeremy L Thompson component in].
1658ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1659eaf62fffSJeremy L Thompson 
1660eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1661eaf62fffSJeremy L Thompson 
1662eaf62fffSJeremy L Thompson   @ref User
1663eaf62fffSJeremy L Thompson **/
16642b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1665f3d47e36SJeremy L Thompson   bool is_composite;
16662b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1667f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1668eaf62fffSJeremy L Thompson 
1669c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16702b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16712b730f8bSJeremy L Thompson   if (input_size != output_size) {
1672c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1673c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1674c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
16752b730f8bSJeremy L Thompson   }
1676c9366a6bSJeremy L Thompson 
1677f3d47e36SJeremy L Thompson   // Early exit for empty operator
1678f3d47e36SJeremy L Thompson   if (!is_composite) {
1679f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1680f3d47e36SJeremy L Thompson 
1681f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1682f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1683f3d47e36SJeremy L Thompson   }
1684f3d47e36SJeremy L Thompson 
1685eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddPointBlockDiagonal) {
1686d04bbc78SJeremy L Thompson     // Backend version
16872b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request));
1688eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1689eaf62fffSJeremy L Thompson   } else {
1690d04bbc78SJeremy L Thompson     // Operator fallback
1691d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1692d04bbc78SJeremy L Thompson 
16932b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1694d04bbc78SJeremy L Thompson     if (op_fallback) {
16952b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request));
1696eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1697eaf62fffSJeremy L Thompson     }
1698eaf62fffSJeremy L Thompson   }
1699ea61e9acSJeremy L Thompson   // Default interface implementation
1700eaf62fffSJeremy L Thompson   if (is_composite) {
17012b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled));
1702eaf62fffSJeremy L Thompson   } else {
17032b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled));
1704eaf62fffSJeremy L Thompson   }
1705d04bbc78SJeremy L Thompson 
1706d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1707eaf62fffSJeremy L Thompson }
1708eaf62fffSJeremy L Thompson 
1709eaf62fffSJeremy L Thompson /**
1710eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero pattern of a linear operator.
1711eaf62fffSJeremy L Thompson 
1712ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssemble().
1713eaf62fffSJeremy L Thompson 
1714ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
1715ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the number of entries and their (i, j)
1716ea61e9acSJeremy L Thompson locations, while CeedOperatorLinearAssemble() provides the values in the same ordering.
1717eaf62fffSJeremy L Thompson 
1718eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1719eaf62fffSJeremy L Thompson 
1720ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1721f04ea552SJeremy L Thompson 
1722eaf62fffSJeremy L Thompson    @param[in]  op          CeedOperator to assemble
1723eaf62fffSJeremy L Thompson    @param[out] num_entries Number of entries in coordinate nonzero pattern
1724eaf62fffSJeremy L Thompson    @param[out] rows        Row number for each entry
1725eaf62fffSJeremy L Thompson    @param[out] cols        Column number for each entry
1726eaf62fffSJeremy L Thompson 
1727eaf62fffSJeremy L Thompson    @ref User
1728eaf62fffSJeremy L Thompson **/
17292b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
1730eaf62fffSJeremy L Thompson   CeedInt       num_suboperators, single_entries;
1731eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1732eaf62fffSJeremy L Thompson   bool          is_composite;
17332b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1734f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1735eaf62fffSJeremy L Thompson 
1736eaf62fffSJeremy L Thompson   if (op->LinearAssembleSymbolic) {
1737d04bbc78SJeremy L Thompson     // Backend version
17382b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols));
1739eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1740eaf62fffSJeremy L Thompson   } else {
1741d04bbc78SJeremy L Thompson     // Operator fallback
1742d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1743d04bbc78SJeremy L Thompson 
17442b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1745d04bbc78SJeremy L Thompson     if (op_fallback) {
17462b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols));
1747eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1748eaf62fffSJeremy L Thompson     }
1749eaf62fffSJeremy L Thompson   }
1750eaf62fffSJeremy L Thompson 
1751eaf62fffSJeremy L Thompson   // Default interface implementation
1752eaf62fffSJeremy L Thompson 
1753eaf62fffSJeremy L Thompson   // count entries and allocate rows, cols arrays
1754eaf62fffSJeremy L Thompson   *num_entries = 0;
1755eaf62fffSJeremy L Thompson   if (is_composite) {
1756c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1757c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
175892ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
17592b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1760eaf62fffSJeremy L Thompson       *num_entries += single_entries;
1761eaf62fffSJeremy L Thompson     }
1762eaf62fffSJeremy L Thompson   } else {
17632b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries));
1764eaf62fffSJeremy L Thompson     *num_entries += single_entries;
1765eaf62fffSJeremy L Thompson   }
17662b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, rows));
17672b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, cols));
1768eaf62fffSJeremy L Thompson 
1769eaf62fffSJeremy L Thompson   // assemble nonzero locations
1770eaf62fffSJeremy L Thompson   CeedInt offset = 0;
1771eaf62fffSJeremy L Thompson   if (is_composite) {
1772c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1773c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
177492ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
17752b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols));
17762b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1777eaf62fffSJeremy L Thompson       offset += single_entries;
1778eaf62fffSJeremy L Thompson     }
1779eaf62fffSJeremy L Thompson   } else {
17802b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols));
1781eaf62fffSJeremy L Thompson   }
1782eaf62fffSJeremy L Thompson 
1783eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1784eaf62fffSJeremy L Thompson }
1785eaf62fffSJeremy L Thompson 
1786eaf62fffSJeremy L Thompson /**
1787eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero entries of a linear operator.
1788eaf62fffSJeremy L Thompson 
1789ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic().
1790eaf62fffSJeremy L Thompson 
1791ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
1792ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the values of the nonzero entries to be added,
1793ea61e9acSJeremy L Thompson their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic()
1794eaf62fffSJeremy L Thompson 
1795eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1796eaf62fffSJeremy L Thompson 
1797ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1798f04ea552SJeremy L Thompson 
1799eaf62fffSJeremy L Thompson    @param[in]  op     CeedOperator to assemble
1800eaf62fffSJeremy L Thompson    @param[out] values Values to assemble into matrix
1801eaf62fffSJeremy L Thompson 
1802eaf62fffSJeremy L Thompson    @ref User
1803eaf62fffSJeremy L Thompson **/
1804eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) {
1805eaf62fffSJeremy L Thompson   CeedInt       num_suboperators, single_entries = 0;
1806eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1807f3d47e36SJeremy L Thompson   bool          is_composite;
18082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1809f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1810f3d47e36SJeremy L Thompson 
1811f3d47e36SJeremy L Thompson   // Early exit for empty operator
1812f3d47e36SJeremy L Thompson   if (!is_composite) {
1813f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1814f3d47e36SJeremy L Thompson 
1815f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1816f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1817f3d47e36SJeremy L Thompson   }
1818eaf62fffSJeremy L Thompson 
1819eaf62fffSJeremy L Thompson   if (op->LinearAssemble) {
1820d04bbc78SJeremy L Thompson     // Backend version
18212b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemble(op, values));
1822eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1823eaf62fffSJeremy L Thompson   } else {
1824d04bbc78SJeremy L Thompson     // Operator fallback
1825d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1826d04bbc78SJeremy L Thompson 
18272b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1828d04bbc78SJeremy L Thompson     if (op_fallback) {
18292b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemble(op_fallback, values));
1830eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1831eaf62fffSJeremy L Thompson     }
1832eaf62fffSJeremy L Thompson   }
1833eaf62fffSJeremy L Thompson 
1834eaf62fffSJeremy L Thompson   // Default interface implementation
1835eaf62fffSJeremy L Thompson   CeedInt offset = 0;
1836eaf62fffSJeremy L Thompson   if (is_composite) {
1837c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1838c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
1839cefa2673SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; k++) {
18402b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values));
18412b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1842eaf62fffSJeremy L Thompson       offset += single_entries;
1843eaf62fffSJeremy L Thompson     }
1844eaf62fffSJeremy L Thompson   } else {
18452b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemble(op, offset, values));
1846eaf62fffSJeremy L Thompson   }
1847eaf62fffSJeremy L Thompson 
1848eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1849eaf62fffSJeremy L Thompson }
1850eaf62fffSJeremy L Thompson 
1851eaf62fffSJeremy L Thompson /**
185275f0d5a4SJeremy L Thompson   @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator
185375f0d5a4SJeremy L Thompson 
185475f0d5a4SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
185575f0d5a4SJeremy L Thompson 
185675f0d5a4SJeremy L Thompson   @param[in]  op               Composite CeedOperator
185775f0d5a4SJeremy L Thompson   @param[in]  num_skip_indices Number of suboperators to skip
185875f0d5a4SJeremy L Thompson   @param[in]  skip_indices     Array of indices of suboperators to skip
185975f0d5a4SJeremy L Thompson   @param[out] mult             Vector to store multiplicity (of size l_size)
186075f0d5a4SJeremy L Thompson 
186175f0d5a4SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
186275f0d5a4SJeremy L Thompson 
186375f0d5a4SJeremy L Thompson   @ref User
186475f0d5a4SJeremy L Thompson **/
186575f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) {
186675f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
186775f0d5a4SJeremy L Thompson 
186875f0d5a4SJeremy L Thompson   Ceed                ceed;
1869b275c451SJeremy L Thompson   CeedInt             num_suboperators;
187075f0d5a4SJeremy L Thompson   CeedSize            l_vec_len;
187175f0d5a4SJeremy L Thompson   CeedScalar         *mult_array;
187275f0d5a4SJeremy L Thompson   CeedVector          ones_l_vec;
187375f0d5a4SJeremy L Thompson   CeedElemRestriction elem_restr;
1874b275c451SJeremy L Thompson   CeedOperator       *sub_operators;
187575f0d5a4SJeremy L Thompson 
187675f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
187775f0d5a4SJeremy L Thompson 
187875f0d5a4SJeremy L Thompson   // Zero mult vector
187975f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(mult, 0.0));
188075f0d5a4SJeremy L Thompson 
188175f0d5a4SJeremy L Thompson   // Get suboperators
1882b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1883b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
1884b275c451SJeremy L Thompson   if (num_suboperators == 0) return CEED_ERROR_SUCCESS;
188575f0d5a4SJeremy L Thompson 
188675f0d5a4SJeremy L Thompson   // Work vector
188775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetLength(mult, &l_vec_len));
188875f0d5a4SJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec));
188975f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(ones_l_vec, 1.0));
189075f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array));
189175f0d5a4SJeremy L Thompson 
189275f0d5a4SJeremy L Thompson   // Compute multiplicity across suboperators
1893b275c451SJeremy L Thompson   for (CeedInt i = 0; i < num_suboperators; i++) {
189475f0d5a4SJeremy L Thompson     const CeedScalar *sub_mult_array;
189575f0d5a4SJeremy L Thompson     CeedVector        sub_mult_l_vec, ones_e_vec;
189675f0d5a4SJeremy L Thompson 
189775f0d5a4SJeremy L Thompson     // -- Check for suboperator to skip
189875f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < num_skip_indices; j++) {
189975f0d5a4SJeremy L Thompson       if (skip_indices[j] == i) continue;
190075f0d5a4SJeremy L Thompson     }
190175f0d5a4SJeremy L Thompson 
190275f0d5a4SJeremy L Thompson     // -- Sub operator multiplicity
1903b275c451SJeremy L Thompson     CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_restr));
190475f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(elem_restr, &sub_mult_l_vec, &ones_e_vec));
190575f0d5a4SJeremy L Thompson     CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0));
190675f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_restr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE));
190775f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_restr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE));
190875f0d5a4SJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array));
190975f0d5a4SJeremy L Thompson     // ---- Flag every node present in the current suboperator
191075f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < l_vec_len; j++) {
191175f0d5a4SJeremy L Thompson       if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0;
191275f0d5a4SJeremy L Thompson     }
191375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array));
191475f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&sub_mult_l_vec));
191575f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&ones_e_vec));
191675f0d5a4SJeremy L Thompson   }
191775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorRestoreArray(mult, &mult_array));
1918811d0ccfSJeremy L Thompson   CeedCall(CeedVectorDestroy(&ones_l_vec));
191975f0d5a4SJeremy L Thompson 
192075f0d5a4SJeremy L Thompson   return CEED_ERROR_SUCCESS;
192175f0d5a4SJeremy L Thompson }
192275f0d5a4SJeremy L Thompson 
192375f0d5a4SJeremy L Thompson /**
1924ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse
1925ea61e9acSJeremy L Thompson grid interpolation
1926eaf62fffSJeremy L Thompson 
192758e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
1928f04ea552SJeremy L Thompson 
1929eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
1930eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter
1931eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
1932eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
1933eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
1934eaf62fffSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator
1935eaf62fffSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator
1936eaf62fffSJeremy L Thompson 
1937eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1938eaf62fffSJeremy L Thompson 
1939eaf62fffSJeremy L Thompson   @ref User
1940eaf62fffSJeremy L Thompson **/
19412b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
19422b730f8bSJeremy L Thompson                                      CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
19432b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
1944eaf62fffSJeremy L Thompson 
1945*83d6adf3SZach Atkins   // Build prolongation matrix, if required
1946*83d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
1947*83d6adf3SZach Atkins   if (op_prolong || op_restrict) {
1948*83d6adf3SZach Atkins     CeedBasis basis_fine;
19492b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
19502b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f));
1951*83d6adf3SZach Atkins   }
1952eaf62fffSJeremy L Thompson 
1953f113e5dcSJeremy L Thompson   // Core code
19542b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
1955f113e5dcSJeremy L Thompson 
1956eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1957eaf62fffSJeremy L Thompson }
1958eaf62fffSJeremy L Thompson 
1959eaf62fffSJeremy L Thompson /**
1960ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis
1961eaf62fffSJeremy L Thompson 
196258e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
1963f04ea552SJeremy L Thompson 
1964eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
1965eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter
1966eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
1967eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
1968eaf62fffSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation
1969eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
1970eaf62fffSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator
1971eaf62fffSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator
1972eaf62fffSJeremy L Thompson 
1973eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1974eaf62fffSJeremy L Thompson 
1975eaf62fffSJeremy L Thompson   @ref User
1976eaf62fffSJeremy L Thompson **/
19772b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
19782b730f8bSJeremy L Thompson                                              const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
19792b730f8bSJeremy L Thompson                                              CeedOperator *op_restrict) {
19802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
1981eaf62fffSJeremy L Thompson   Ceed ceed;
19822b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
1983eaf62fffSJeremy L Thompson 
1984eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
1985eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
19862b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
1987eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
19882b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
19892b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
19902b730f8bSJeremy L Thompson   if (Q_f != Q_c) {
1991eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
19922b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
1993eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
19942b730f8bSJeremy L Thompson   }
1995eaf62fffSJeremy L Thompson 
1996*83d6adf3SZach Atkins   // Create coarse to fine basis, if required
1997*83d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
1998*83d6adf3SZach Atkins   if (op_prolong || op_restrict) {
1999*83d6adf3SZach Atkins     // Check if interpolation matrix is provided
2000*83d6adf3SZach Atkins     if (!interp_c_to_f) {
2001*83d6adf3SZach Atkins       // LCOV_EXCL_START
2002*83d6adf3SZach Atkins       return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
2003*83d6adf3SZach Atkins       // LCOV_EXCL_STOP
2004*83d6adf3SZach Atkins     }
2005eaf62fffSJeremy L Thompson     CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c;
20062b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
20072b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
20082b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f));
20092b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
20102b730f8bSJeremy L Thompson     P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c);
2011eaf62fffSJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
20122b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_ref));
20132b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_weight));
20142b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad));
20152b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
20162b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
20172b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
20182b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
2019*83d6adf3SZach Atkins   }
2020eaf62fffSJeremy L Thompson 
2021eaf62fffSJeremy L Thompson   // Core code
20222b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2023eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2024eaf62fffSJeremy L Thompson }
2025eaf62fffSJeremy L Thompson 
2026eaf62fffSJeremy L Thompson /**
2027ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector
2028eaf62fffSJeremy L Thompson 
202958e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2030f04ea552SJeremy L Thompson 
2031eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
2032eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter
2033eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2034eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
2035eaf62fffSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation
2036eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
2037eaf62fffSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator
2038eaf62fffSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator
2039eaf62fffSJeremy L Thompson 
2040eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2041eaf62fffSJeremy L Thompson 
2042eaf62fffSJeremy L Thompson   @ref User
2043eaf62fffSJeremy L Thompson **/
20442b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
20452b730f8bSJeremy L Thompson                                        const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
2046eaf62fffSJeremy L Thompson                                        CeedOperator *op_restrict) {
20472b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2048eaf62fffSJeremy L Thompson   Ceed ceed;
20492b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2050eaf62fffSJeremy L Thompson 
2051eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
2052eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
20532b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
2054eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
20552b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
20562b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
20572b730f8bSJeremy L Thompson   if (Q_f != Q_c) {
2058eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
20592b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2060eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
20612b730f8bSJeremy L Thompson   }
2062eaf62fffSJeremy L Thompson 
2063eaf62fffSJeremy L Thompson   // Coarse to fine basis
2064*83d6adf3SZach Atkins   CeedBasis basis_c_to_f = NULL;
2065*83d6adf3SZach Atkins   if (op_prolong || op_restrict) {
2066*83d6adf3SZach Atkins     // Check if interpolation matrix is provided
2067*83d6adf3SZach Atkins     if (!interp_c_to_f) {
2068*83d6adf3SZach Atkins       // LCOV_EXCL_START
2069*83d6adf3SZach Atkins       return CeedError(ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
2070*83d6adf3SZach Atkins       // LCOV_EXCL_STOP
2071*83d6adf3SZach Atkins     }
2072eaf62fffSJeremy L Thompson     CeedElemTopology topo;
20732b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetTopology(basis_fine, &topo));
2074eaf62fffSJeremy L Thompson     CeedInt dim, num_comp, num_nodes_c, num_nodes_f;
20752b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
20762b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
20772b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f));
20782b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
2079eaf62fffSJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
20802b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref));
20812b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f, &q_weight));
20822b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad));
20832b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
20842b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
20852b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
20862b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
2087*83d6adf3SZach Atkins   }
2088eaf62fffSJeremy L Thompson 
2089eaf62fffSJeremy L Thompson   // Core code
20902b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2091eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2092eaf62fffSJeremy L Thompson }
2093eaf62fffSJeremy L Thompson 
2094eaf62fffSJeremy L Thompson /**
2095ea61e9acSJeremy L Thompson   @brief Build a FDM based approximate inverse for each element for a CeedOperator
2096eaf62fffSJeremy L Thompson 
2097ea61e9acSJeremy L Thompson   This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse.
2098ea61e9acSJeremy L Thompson     This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, M = V^T V, K = V^T S V.
2099ea61e9acSJeremy L Thompson     The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form V^T
2100ea61e9acSJeremy L Thompson S^hat V. The CeedOperator must be linear and non-composite. The associated CeedQFunction must therefore also be linear.
2101eaf62fffSJeremy L Thompson 
2102ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2103f04ea552SJeremy L Thompson 
2104ea61e9acSJeremy L Thompson   @param[in]  op      CeedOperator to create element inverses
2105ea61e9acSJeremy L Thompson   @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element
2106ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2107eaf62fffSJeremy L Thompson 
2108eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2109eaf62fffSJeremy L Thompson 
2110480fae85SJeremy L Thompson   @ref User
2111eaf62fffSJeremy L Thompson **/
21122b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) {
21132b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2114eaf62fffSJeremy L Thompson 
2115eaf62fffSJeremy L Thompson   if (op->CreateFDMElementInverse) {
2116d04bbc78SJeremy L Thompson     // Backend version
21172b730f8bSJeremy L Thompson     CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request));
2118eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2119eaf62fffSJeremy L Thompson   } else {
2120d04bbc78SJeremy L Thompson     // Operator fallback
2121d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2122d04bbc78SJeremy L Thompson 
21232b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2124d04bbc78SJeremy L Thompson     if (op_fallback) {
21252b730f8bSJeremy L Thompson       CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request));
2126eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2127eaf62fffSJeremy L Thompson     }
2128eaf62fffSJeremy L Thompson   }
2129eaf62fffSJeremy L Thompson 
2130d04bbc78SJeremy L Thompson   // Default interface implementation
2131eaf62fffSJeremy L Thompson   Ceed ceed, ceed_parent;
21322b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
21332b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent));
2134eaf62fffSJeremy L Thompson   ceed_parent = ceed_parent ? ceed_parent : ceed;
2135eaf62fffSJeremy L Thompson   CeedQFunction qf;
21362b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
2137eaf62fffSJeremy L Thompson 
2138eaf62fffSJeremy L Thompson   // Determine active input basis
2139eaf62fffSJeremy L Thompson   bool                interp = false, grad = false;
2140eaf62fffSJeremy L Thompson   CeedBasis           basis = NULL;
2141eaf62fffSJeremy L Thompson   CeedElemRestriction rstr  = NULL;
2142eaf62fffSJeremy L Thompson   CeedOperatorField  *op_fields;
2143eaf62fffSJeremy L Thompson   CeedQFunctionField *qf_fields;
2144eaf62fffSJeremy L Thompson   CeedInt             num_input_fields;
21452b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL));
21462b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL));
2147eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
2148eaf62fffSJeremy L Thompson     CeedVector vec;
21492b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
2150eaf62fffSJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
2151eaf62fffSJeremy L Thompson       CeedEvalMode eval_mode;
21522b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
2153eaf62fffSJeremy L Thompson       interp = interp || eval_mode == CEED_EVAL_INTERP;
2154eaf62fffSJeremy L Thompson       grad   = grad || eval_mode == CEED_EVAL_GRAD;
21552b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis));
21562b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr));
2157eaf62fffSJeremy L Thompson     }
2158eaf62fffSJeremy L Thompson   }
21592b730f8bSJeremy L Thompson   if (!basis) {
2160eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
2161eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_BACKEND, "No active field set");
2162eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
21632b730f8bSJeremy L Thompson   }
2164e79b91d9SJeremy L Thompson   CeedSize l_size = 1;
2165e79b91d9SJeremy L Thompson   CeedInt  P_1d, Q_1d, elem_size, num_qpts, dim, num_comp = 1, num_elem = 1;
21662b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d));
21672b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes(basis, &elem_size));
21682b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d));
21692b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts));
21702b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis, &dim));
21712b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis, &num_comp));
21722b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
21732b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2174eaf62fffSJeremy L Thompson 
2175eaf62fffSJeremy L Thompson   // Build and diagonalize 1D Mass and Laplacian
2176eaf62fffSJeremy L Thompson   bool tensor_basis;
21772b730f8bSJeremy L Thompson   CeedCall(CeedBasisIsTensor(basis, &tensor_basis));
21782b730f8bSJeremy L Thompson   if (!tensor_basis) {
2179eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
21802b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases");
2181eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
21822b730f8bSJeremy L Thompson   }
2183eaf62fffSJeremy L Thompson   CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda;
21842b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &mass));
21852b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &laplace));
21862b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &x));
21872b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp));
21882b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &lambda));
2189eaf62fffSJeremy L Thompson   // -- Build matrices
2190eaf62fffSJeremy L Thompson   const CeedScalar *interp_1d, *grad_1d, *q_weight_1d;
21912b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp1D(basis, &interp_1d));
21922b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad1D(basis, &grad_1d));
21932b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d));
21942b730f8bSJeremy L Thompson   CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace));
2195eaf62fffSJeremy L Thompson 
2196eaf62fffSJeremy L Thompson   // -- Diagonalize
21972b730f8bSJeremy L Thompson   CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d));
21982b730f8bSJeremy L Thompson   CeedCall(CeedFree(&mass));
21992b730f8bSJeremy L Thompson   CeedCall(CeedFree(&laplace));
22002b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
22012b730f8bSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d];
22022b730f8bSJeremy L Thompson   }
22032b730f8bSJeremy L Thompson   CeedCall(CeedFree(&x));
2204eaf62fffSJeremy L Thompson 
2205eaf62fffSJeremy L Thompson   // Assemble QFunction
2206eaf62fffSJeremy L Thompson   CeedVector          assembled;
2207eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_qf;
22082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request));
2209eaf62fffSJeremy L Thompson   CeedInt layout[3];
22102b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout));
22112b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qf));
2212eaf62fffSJeremy L Thompson   CeedScalar max_norm = 0;
22132b730f8bSJeremy L Thompson   CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm));
2214eaf62fffSJeremy L Thompson 
2215eaf62fffSJeremy L Thompson   // Calculate element averages
2216eaf62fffSJeremy L Thompson   CeedInt           num_modes = (interp ? 1 : 0) + (grad ? dim : 0);
2217eaf62fffSJeremy L Thompson   CeedScalar       *elem_avg;
2218eaf62fffSJeremy L Thompson   const CeedScalar *assembled_array, *q_weight_array;
2219eaf62fffSJeremy L Thompson   CeedVector        q_weight;
22202b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight));
22212b730f8bSJeremy L Thompson   CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight));
22222b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array));
22232b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array));
22242b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem, &elem_avg));
2225eaf62fffSJeremy L Thompson   const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON;
2226eaf62fffSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
2227eaf62fffSJeremy L Thompson     CeedInt count = 0;
22282b730f8bSJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
22292b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) {
22302b730f8bSJeremy L Thompson         if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) {
22312b730f8bSJeremy L Thompson           elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q];
2232eaf62fffSJeremy L Thompson           count++;
2233eaf62fffSJeremy L Thompson         }
22342b730f8bSJeremy L Thompson       }
22352b730f8bSJeremy L Thompson     }
2236eaf62fffSJeremy L Thompson     if (count) {
2237eaf62fffSJeremy L Thompson       elem_avg[e] /= count;
2238eaf62fffSJeremy L Thompson     } else {
2239eaf62fffSJeremy L Thompson       elem_avg[e] = 1.0;
2240eaf62fffSJeremy L Thompson     }
2241eaf62fffSJeremy L Thompson   }
22422b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array));
22432b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled));
22442b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array));
22452b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_weight));
2246eaf62fffSJeremy L Thompson 
2247eaf62fffSJeremy L Thompson   // Build FDM diagonal
2248eaf62fffSJeremy L Thompson   CeedVector  q_data;
2249eaf62fffSJeremy L Thompson   CeedScalar *q_data_array, *fdm_diagonal;
22502b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_comp * elem_size, &fdm_diagonal));
2251eaf62fffSJeremy L Thompson   const CeedScalar fdm_diagonal_bound = elem_size * CEED_EPSILON;
22522b730f8bSJeremy L Thompson   for (CeedInt c = 0; c < num_comp; c++) {
2253eaf62fffSJeremy L Thompson     for (CeedInt n = 0; n < elem_size; n++) {
22542b730f8bSJeremy L Thompson       if (interp) fdm_diagonal[c * elem_size + n] = 1.0;
22552b730f8bSJeremy L Thompson       if (grad) {
2256eaf62fffSJeremy L Thompson         for (CeedInt d = 0; d < dim; d++) {
2257eaf62fffSJeremy L Thompson           CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d;
2258eaf62fffSJeremy L Thompson           fdm_diagonal[c * elem_size + n] += lambda[i];
2259eaf62fffSJeremy L Thompson         }
2260eaf62fffSJeremy L Thompson       }
22612b730f8bSJeremy L Thompson       if (fabs(fdm_diagonal[c * elem_size + n]) < fdm_diagonal_bound) fdm_diagonal[c * elem_size + n] = fdm_diagonal_bound;
22622b730f8bSJeremy L Thompson     }
22632b730f8bSJeremy L Thompson   }
22642b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * elem_size, &q_data));
22652b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(q_data, 0.0));
22662b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array));
22672b730f8bSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
22682b730f8bSJeremy L Thompson     for (CeedInt c = 0; c < num_comp; c++) {
22692b730f8bSJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) q_data_array[(e * num_comp + c) * elem_size + n] = 1. / (elem_avg[e] * fdm_diagonal[c * elem_size + n]);
22702b730f8bSJeremy L Thompson     }
22712b730f8bSJeremy L Thompson   }
22722b730f8bSJeremy L Thompson   CeedCall(CeedFree(&elem_avg));
22732b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_diagonal));
22742b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(q_data, &q_data_array));
2275eaf62fffSJeremy L Thompson 
2276eaf62fffSJeremy L Thompson   // Setup FDM operator
2277eaf62fffSJeremy L Thompson   // -- Basis
2278eaf62fffSJeremy L Thompson   CeedBasis   fdm_basis;
2279eaf62fffSJeremy L Thompson   CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy;
22802b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy));
22812b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_ref_dummy));
22822b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_weight_dummy));
22832b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis));
22842b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_interp));
22852b730f8bSJeremy L Thompson   CeedCall(CeedFree(&grad_dummy));
22862b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_ref_dummy));
22872b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_weight_dummy));
22882b730f8bSJeremy L Thompson   CeedCall(CeedFree(&lambda));
2289eaf62fffSJeremy L Thompson 
2290eaf62fffSJeremy L Thompson   // -- Restriction
2291eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_qd_i;
2292eaf62fffSJeremy L Thompson   CeedInt             strides[3] = {1, elem_size, elem_size * num_comp};
22932b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, elem_size, num_comp, num_elem * num_comp * elem_size, strides, &rstr_qd_i));
2294eaf62fffSJeremy L Thompson   // -- QFunction
2295eaf62fffSJeremy L Thompson   CeedQFunction qf_fdm;
22962b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm));
22972b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP));
22982b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE));
22992b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP));
23002b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp));
2301eaf62fffSJeremy L Thompson   // -- QFunction context
2302eaf62fffSJeremy L Thompson   CeedInt *num_comp_data;
23032b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, &num_comp_data));
2304eaf62fffSJeremy L Thompson   num_comp_data[0] = num_comp;
2305eaf62fffSJeremy L Thompson   CeedQFunctionContext ctx_fdm;
23062b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm));
23072b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data));
23082b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm));
23092b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_fdm));
2310eaf62fffSJeremy L Thompson   // -- Operator
23112b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv));
23122b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
23132b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data));
23142b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2315eaf62fffSJeremy L Thompson 
2316eaf62fffSJeremy L Thompson   // Cleanup
23172b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_data));
23182b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&fdm_basis));
23192b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i));
23202b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_fdm));
2321eaf62fffSJeremy L Thompson 
2322eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2323eaf62fffSJeremy L Thompson }
2324eaf62fffSJeremy L Thompson 
2325eaf62fffSJeremy L Thompson /// @}
2326