xref: /libCEED/rust/libceed-sys/c-src/interface/ceed-preconditioning.c (revision 123d890ddf70fcda52aa403ec2d78adc317a115c)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3eaf62fffSJeremy L Thompson //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5eaf62fffSJeremy L Thompson //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7eaf62fffSJeremy L Thompson 
82b730f8bSJeremy L Thompson #include <ceed-impl.h>
949aac155SJeremy L Thompson #include <ceed.h>
102b730f8bSJeremy L Thompson #include <ceed/backend.h>
11c85e8640SSebastian Grimberg #include <assert.h>
122b730f8bSJeremy L Thompson #include <math.h>
13eaf62fffSJeremy L Thompson #include <stdbool.h>
14eaf62fffSJeremy L Thompson #include <stdio.h>
15eaf62fffSJeremy L Thompson #include <string.h>
16eaf62fffSJeremy L Thompson 
17eaf62fffSJeremy L Thompson /// @file
18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces
19eaf62fffSJeremy L Thompson 
20eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions
22eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper
24eaf62fffSJeremy L Thompson /// @{
25eaf62fffSJeremy L Thompson 
26eaf62fffSJeremy L Thompson /**
27ea61e9acSJeremy L Thompson   @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality
289e77b9c8SJeremy L Thompson 
2901ea9c81SJed Brown   @param[in]  fallback_ceed Ceed on which to create fallback CeedQFunction
309e77b9c8SJeremy L Thompson   @param[in]  qf            CeedQFunction to create fallback for
3101ea9c81SJed Brown   @param[out] qf_fallback   fallback CeedQFunction
329e77b9c8SJeremy L Thompson 
339e77b9c8SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
349e77b9c8SJeremy L Thompson 
359e77b9c8SJeremy L Thompson   @ref Developer
369e77b9c8SJeremy L Thompson **/
372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) {
381c66c397SJeremy L Thompson   char *source_path_with_name = NULL;
391c66c397SJeremy L Thompson 
409e77b9c8SJeremy L Thompson   // Check if NULL qf passed in
419e77b9c8SJeremy L Thompson   if (!qf) return CEED_ERROR_SUCCESS;
429e77b9c8SJeremy L Thompson 
43d04bbc78SJeremy L Thompson   CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n");
4413f886e9SJeremy L Thompson   CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n");
45d04bbc78SJeremy L Thompson 
469e77b9c8SJeremy L Thompson   if (qf->source_path) {
472b730f8bSJeremy L Thompson     size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name);
482b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name));
499e77b9c8SJeremy L Thompson     memcpy(source_path_with_name, qf->source_path, path_len);
509e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len], ":", 1);
519e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len);
529e77b9c8SJeremy L Thompson   } else {
532b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &source_path_with_name));
549e77b9c8SJeremy L Thompson   }
559e77b9c8SJeremy L Thompson 
562b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback));
579e77b9c8SJeremy L Thompson   {
589e77b9c8SJeremy L Thompson     CeedQFunctionContext ctx;
599e77b9c8SJeremy L Thompson 
602b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionGetContext(qf, &ctx));
612b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx));
629e77b9c8SJeremy L Thompson   }
639e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_input_fields; i++) {
642b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode));
659e77b9c8SJeremy L Thompson   }
669e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_output_fields; i++) {
672b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode));
689e77b9c8SJeremy L Thompson   }
692b730f8bSJeremy L Thompson   CeedCall(CeedFree(&source_path_with_name));
709e77b9c8SJeremy L Thompson   return CEED_ERROR_SUCCESS;
719e77b9c8SJeremy L Thompson }
729e77b9c8SJeremy L Thompson 
739e77b9c8SJeremy L Thompson /**
74ea61e9acSJeremy L Thompson   @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality
75eaf62fffSJeremy L Thompson 
76ea61e9acSJeremy L Thompson   @param[in,out] op CeedOperator to create fallback for
77eaf62fffSJeremy L Thompson 
78eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
79eaf62fffSJeremy L Thompson 
80eaf62fffSJeremy L Thompson   @ref Developer
81eaf62fffSJeremy L Thompson **/
82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) {
839e77b9c8SJeremy L Thompson   Ceed         ceed_fallback;
841c66c397SJeremy L Thompson   bool         is_composite;
851c66c397SJeremy L Thompson   CeedOperator op_fallback;
86eaf62fffSJeremy L Thompson 
87805fe78eSJeremy L Thompson   // Check not already created
88805fe78eSJeremy L Thompson   if (op->op_fallback) return CEED_ERROR_SUCCESS;
89805fe78eSJeremy L Thompson 
90eaf62fffSJeremy L Thompson   // Fallback Ceed
912b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
92d04bbc78SJeremy L Thompson   if (!ceed_fallback) return CEED_ERROR_SUCCESS;
93d04bbc78SJeremy L Thompson 
94d04bbc78SJeremy L Thompson   CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
9513f886e9SJeremy L Thompson   CeedDebug(op->ceed, "Creating fallback CeedOperator\n");
96eaf62fffSJeremy L Thompson 
97eaf62fffSJeremy L Thompson   // Clone Op
98b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
99b275c451SJeremy L Thompson   if (is_composite) {
100b275c451SJeremy L Thompson     CeedInt       num_suboperators;
101b275c451SJeremy L Thompson     CeedOperator *sub_operators;
102b275c451SJeremy L Thompson 
1032b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback));
104b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
105b275c451SJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
106b275c451SJeremy L Thompson     for (CeedInt i = 0; i < num_suboperators; i++) {
107d04bbc78SJeremy L Thompson       CeedOperator op_sub_fallback;
108d04bbc78SJeremy L Thompson 
109b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetFallback(sub_operators[i], &op_sub_fallback));
1102b730f8bSJeremy L Thompson       CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback));
111805fe78eSJeremy L Thompson     }
112805fe78eSJeremy L Thompson   } else {
1139e77b9c8SJeremy L Thompson     CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL;
1141c66c397SJeremy L Thompson 
1152b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback));
1162b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback));
1172b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback));
1182b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback));
119805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_input_fields; i++) {
120437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_rstr, op->input_fields[i]->basis,
1212b730f8bSJeremy L Thompson                                     op->input_fields[i]->vec));
122805fe78eSJeremy L Thompson     }
123805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_output_fields; i++) {
124437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_rstr, op->output_fields[i]->basis,
1252b730f8bSJeremy L Thompson                                     op->output_fields[i]->vec));
126805fe78eSJeremy L Thompson     }
1272b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled));
128febe2972SJeremy L Thompson     if (op_fallback->num_qpts == 0) CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts));
1299e77b9c8SJeremy L Thompson     // Cleanup
1302b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&qf_fallback));
1312b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqf_fallback));
1322b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqfT_fallback));
133805fe78eSJeremy L Thompson   }
1342b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(op_fallback, op->name));
1352b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fallback));
136b05f7e9fSJeremy L Thompson   // Note: No ref-counting here so we don't get caught in a reference loop.
137b05f7e9fSJeremy L Thompson   //       The op holds the only reference to op_fallback and is responsible for deleting itself and op_fallback.
138805fe78eSJeremy L Thompson   op->op_fallback                 = op_fallback;
139b05f7e9fSJeremy L Thompson   op_fallback->op_fallback_parent = op;
140eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
141eaf62fffSJeremy L Thompson }
142eaf62fffSJeremy L Thompson 
143eaf62fffSJeremy L Thompson /**
144ea61e9acSJeremy L Thompson   @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality
145d04bbc78SJeremy L Thompson 
146d04bbc78SJeremy L Thompson   @param[in]  op          CeedOperator to retrieve fallback for
147d04bbc78SJeremy L Thompson   @param[out] op_fallback Fallback CeedOperator
148d04bbc78SJeremy L Thompson 
149d04bbc78SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
150d04bbc78SJeremy L Thompson 
151d04bbc78SJeremy L Thompson   @ref Developer
152d04bbc78SJeremy L Thompson **/
153d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) {
154d04bbc78SJeremy L Thompson   // Create if needed
1551c66c397SJeremy L Thompson   if (!op->op_fallback) CeedCall(CeedOperatorCreateFallback(op));
156d04bbc78SJeremy L Thompson   if (op->op_fallback) {
157d04bbc78SJeremy L Thompson     bool is_debug;
158d04bbc78SJeremy L Thompson 
1592b730f8bSJeremy L Thompson     CeedCall(CeedIsDebug(op->ceed, &is_debug));
160d04bbc78SJeremy L Thompson     if (is_debug) {
161b275c451SJeremy L Thompson       Ceed        ceed, ceed_fallback;
162d04bbc78SJeremy L Thompson       const char *resource, *resource_fallback;
163d04bbc78SJeremy L Thompson 
164b275c451SJeremy L Thompson       CeedCall(CeedOperatorGetCeed(op, &ceed));
165b275c451SJeremy L Thompson       CeedCall(CeedGetOperatorFallbackCeed(ceed, &ceed_fallback));
166b275c451SJeremy L Thompson       CeedCall(CeedGetResource(ceed, &resource));
1672b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(ceed_fallback, &resource_fallback));
168d04bbc78SJeremy L Thompson 
16923d4529eSJeremy L Thompson       CeedDebug256(ceed, CEED_DEBUG_COLOR_SUCCESS, "---------- CeedOperator Fallback ----------\n");
170b275c451SJeremy L Thompson       CeedDebug(ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback,
1712b730f8bSJeremy L Thompson                 op->op_fallback);
172d04bbc78SJeremy L Thompson     }
173d04bbc78SJeremy L Thompson   }
174d04bbc78SJeremy L Thompson   *op_fallback = op->op_fallback;
175d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
176d04bbc78SJeremy L Thompson }
177d04bbc78SJeremy L Thompson 
178d04bbc78SJeremy L Thompson /**
1792e8f5c67SJeremy L Thompson   @brief Get the parent CeedOperator for a fallback CeedOperator
180bb229da9SJeremy L Thompson 
181bb229da9SJeremy L Thompson   @param[in]  op     CeedOperator context
182bb229da9SJeremy L Thompson   @param[out] parent Variable to store parent CeedOperator context
183bb229da9SJeremy L Thompson 
184bb229da9SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
185bb229da9SJeremy L Thompson 
186bb229da9SJeremy L Thompson   @ref Developer
187bb229da9SJeremy L Thompson **/
188bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParent(CeedOperator op, CeedOperator *parent) {
189bb229da9SJeremy L Thompson   *parent = op->op_fallback_parent ? op->op_fallback_parent : NULL;
190bb229da9SJeremy L Thompson   return CEED_ERROR_SUCCESS;
191bb229da9SJeremy L Thompson }
192bb229da9SJeremy L Thompson 
193bb229da9SJeremy L Thompson /**
1942e8f5c67SJeremy L Thompson   @brief Get the Ceed context of the parent CeedOperator for a fallback CeedOperator
195bb229da9SJeremy L Thompson 
196bb229da9SJeremy L Thompson   @param[in]  op     CeedOperator context
197bb229da9SJeremy L Thompson   @param[out] parent Variable to store parent Ceed context
198bb229da9SJeremy L Thompson 
199bb229da9SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
200bb229da9SJeremy L Thompson 
201bb229da9SJeremy L Thompson   @ref Developer
202bb229da9SJeremy L Thompson **/
203bb229da9SJeremy L Thompson int CeedOperatorGetFallbackParentCeed(CeedOperator op, Ceed *parent) {
204e984cf9aSJeremy L Thompson   *parent = op->op_fallback_parent ? op->op_fallback_parent->ceed : op->ceed;
205bb229da9SJeremy L Thompson   return CEED_ERROR_SUCCESS;
206bb229da9SJeremy L Thompson }
207bb229da9SJeremy L Thompson 
208bb229da9SJeremy L Thompson /**
209eaf62fffSJeremy L Thompson   @brief Select correct basis matrix pointer based on CeedEvalMode
210eaf62fffSJeremy L Thompson 
211352a5e7cSSebastian Grimberg   @param[in]  basis     CeedBasis from which to get the basis matrix
212eaf62fffSJeremy L Thompson   @param[in]  eval_mode Current basis evaluation mode
213eaf62fffSJeremy L Thompson   @param[in]  identity  Pointer to identity matrix
214eaf62fffSJeremy L Thompson   @param[out] basis_ptr Basis pointer to set
215eaf62fffSJeremy L Thompson 
216eaf62fffSJeremy L Thompson   @ref Developer
217eaf62fffSJeremy L Thompson **/
218352a5e7cSSebastian Grimberg static inline int CeedOperatorGetBasisPointer(CeedBasis basis, CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar **basis_ptr) {
219eaf62fffSJeremy L Thompson   switch (eval_mode) {
220eaf62fffSJeremy L Thompson     case CEED_EVAL_NONE:
221eaf62fffSJeremy L Thompson       *basis_ptr = identity;
222eaf62fffSJeremy L Thompson       break;
223eaf62fffSJeremy L Thompson     case CEED_EVAL_INTERP:
224352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetInterp(basis, basis_ptr));
225eaf62fffSJeremy L Thompson       break;
226eaf62fffSJeremy L Thompson     case CEED_EVAL_GRAD:
227352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetGrad(basis, basis_ptr));
228352a5e7cSSebastian Grimberg       break;
229352a5e7cSSebastian Grimberg     case CEED_EVAL_DIV:
230352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetDiv(basis, basis_ptr));
231352a5e7cSSebastian Grimberg       break;
232352a5e7cSSebastian Grimberg     case CEED_EVAL_CURL:
233352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetCurl(basis, basis_ptr));
234eaf62fffSJeremy L Thompson       break;
235eaf62fffSJeremy L Thompson     case CEED_EVAL_WEIGHT:
236eaf62fffSJeremy L Thompson       break;  // Caught by QF Assembly
237eaf62fffSJeremy L Thompson   }
238ed9e99e6SJeremy L Thompson   assert(*basis_ptr != NULL);
239352a5e7cSSebastian Grimberg   return CEED_ERROR_SUCCESS;
240eaf62fffSJeremy L Thompson }
241eaf62fffSJeremy L Thompson 
242eaf62fffSJeremy L Thompson /**
243eaf62fffSJeremy L Thompson   @brief Core logic for assembling operator diagonal or point block diagonal
244eaf62fffSJeremy L Thompson 
245eaf62fffSJeremy L Thompson   @param[in]  op             CeedOperator to assemble point block diagonal
246ea61e9acSJeremy L Thompson   @param[in]  request        Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
247bd83916cSSebastian Grimberg   @param[in]  is_point_block Boolean flag to assemble diagonal or point block diagonal
248eaf62fffSJeremy L Thompson   @param[out] assembled      CeedVector to store assembled diagonal
249eaf62fffSJeremy L Thompson 
250eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
251eaf62fffSJeremy L Thompson 
252eaf62fffSJeremy L Thompson   @ref Developer
253eaf62fffSJeremy L Thompson **/
254bd83916cSSebastian Grimberg static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_point_block, CeedVector assembled) {
255eaf62fffSJeremy L Thompson   Ceed ceed;
256506b1a0cSSebastian Grimberg   bool is_composite;
257506b1a0cSSebastian Grimberg 
258506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetCeed(op, &ceed));
259506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorIsComposite(op, &is_composite));
260506b1a0cSSebastian Grimberg   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
261506b1a0cSSebastian Grimberg 
262506b1a0cSSebastian Grimberg   // Assemble QFunction
263506b1a0cSSebastian Grimberg   CeedInt             layout_qf[3];
264437c7c90SJeremy L Thompson   const CeedScalar   *assembled_qf_array;
265c5f45aeaSJeremy L Thompson   CeedVector          assembled_qf        = NULL;
266c5f45aeaSJeremy L Thompson   CeedElemRestriction assembled_elem_rstr = NULL;
267437c7c90SJeremy L Thompson 
268437c7c90SJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, request));
269506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout_qf));
270437c7c90SJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr));
271437c7c90SJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
272eaf62fffSJeremy L Thompson 
273ed9e99e6SJeremy L Thompson   // Get assembly data
274437c7c90SJeremy L Thompson   const CeedEvalMode     **eval_modes_in, **eval_modes_out;
275506b1a0cSSebastian Grimberg   CeedInt                  num_active_bases_in, *num_eval_modes_in, num_active_bases_out, *num_eval_modes_out;
276437c7c90SJeremy L Thompson   CeedSize               **eval_mode_offsets_in, **eval_mode_offsets_out, num_output_components;
277506b1a0cSSebastian Grimberg   CeedBasis               *active_bases_in, *active_bases_out;
278506b1a0cSSebastian Grimberg   CeedElemRestriction     *active_elem_rstrs_in, *active_elem_rstrs_out;
2791c66c397SJeremy L Thompson   CeedOperatorAssemblyData data;
2801c66c397SJeremy L Thompson 
281437c7c90SJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
282506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases_in, &num_eval_modes_in, &eval_modes_in, &eval_mode_offsets_in,
283506b1a0cSSebastian Grimberg                                                 &num_active_bases_out, &num_eval_modes_out, &eval_modes_out, &eval_mode_offsets_out,
284506b1a0cSSebastian Grimberg                                                 &num_output_components));
285506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases_in, NULL, NULL, &active_bases_out, NULL));
286506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, NULL, &active_elem_rstrs_in, NULL, &active_elem_rstrs_out));
287506b1a0cSSebastian Grimberg 
288506b1a0cSSebastian Grimberg   CeedCheck(num_active_bases_in == num_active_bases_out, ceed, CEED_ERROR_UNSUPPORTED,
289506b1a0cSSebastian Grimberg             "Cannot assemble operator diagonal with different numbers of input and output active bases");
290437c7c90SJeremy L Thompson 
291437c7c90SJeremy L Thompson   // Loop over all active bases
292506b1a0cSSebastian Grimberg   for (CeedInt b = 0; b < num_active_bases_in; b++) {
2931c66c397SJeremy L Thompson     bool                has_eval_none = false;
294506b1a0cSSebastian Grimberg     CeedInt             num_elem, num_nodes, num_qpts, num_comp;
2951c66c397SJeremy L Thompson     CeedScalar         *elem_diag_array, *identity = NULL;
2961c66c397SJeremy L Thompson     CeedVector          elem_diag;
2977c1dbaffSSebastian Grimberg     CeedElemRestriction diag_elem_rstr;
2981c66c397SJeremy L Thompson 
299506b1a0cSSebastian Grimberg     CeedCheck(active_elem_rstrs_in[b] == active_elem_rstrs_out[b], ceed, CEED_ERROR_UNSUPPORTED,
300506b1a0cSSebastian Grimberg               "Cannot assemble operator diagonal with different input and output active element restrictions");
301506b1a0cSSebastian Grimberg 
3021c66c397SJeremy L Thompson     // Assemble point block diagonal restriction, if needed
303bd83916cSSebastian Grimberg     if (is_point_block) {
304506b1a0cSSebastian Grimberg       CeedCall(CeedOperatorCreateActivePointBlockRestriction(active_elem_rstrs_in[b], &diag_elem_rstr));
3057c1dbaffSSebastian Grimberg     } else {
306506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionCreateUnsignedCopy(active_elem_rstrs_in[b], &diag_elem_rstr));
307eaf62fffSJeremy L Thompson     }
308eaf62fffSJeremy L Thompson 
309eaf62fffSJeremy L Thompson     // Create diagonal vector
310437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(diag_elem_rstr, NULL, &elem_diag));
311eaf62fffSJeremy L Thompson 
312eaf62fffSJeremy L Thompson     // Assemble element operator diagonals
3132b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(elem_diag, 0.0));
3142b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array));
315437c7c90SJeremy L Thompson     CeedCall(CeedElemRestrictionGetNumElements(diag_elem_rstr, &num_elem));
316506b1a0cSSebastian Grimberg     CeedCall(CeedBasisGetNumNodes(active_bases_in[b], &num_nodes));
317506b1a0cSSebastian Grimberg     CeedCall(CeedBasisGetNumComponents(active_bases_in[b], &num_comp));
318506b1a0cSSebastian Grimberg     if (active_bases_in[b] == CEED_BASIS_NONE) num_qpts = num_nodes;
319506b1a0cSSebastian Grimberg     else CeedCall(CeedBasisGetNumQuadraturePoints(active_bases_in[b], &num_qpts));
320506b1a0cSSebastian Grimberg 
321506b1a0cSSebastian Grimberg     if (active_bases_in[b] != active_bases_out[b]) {
322506b1a0cSSebastian Grimberg       CeedInt num_nodes_out, num_qpts_out, num_comp_out;
323506b1a0cSSebastian Grimberg 
324506b1a0cSSebastian Grimberg       CeedCall(CeedBasisGetNumNodes(active_bases_out[b], &num_nodes_out));
325506b1a0cSSebastian Grimberg       CeedCheck(num_nodes == num_nodes_out, ceed, CEED_ERROR_UNSUPPORTED, "Active input and output bases must have the same number of nodes");
326506b1a0cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(active_bases_out[b], &num_comp_out));
327506b1a0cSSebastian Grimberg       CeedCheck(num_comp == num_comp_out, ceed, CEED_ERROR_UNSUPPORTED, "Active input and output bases must have the same number of components");
328506b1a0cSSebastian Grimberg       if (active_bases_out[b] == CEED_BASIS_NONE) num_qpts_out = num_nodes_out;
329506b1a0cSSebastian Grimberg       else CeedCall(CeedBasisGetNumQuadraturePoints(active_bases_out[b], &num_qpts_out));
330506b1a0cSSebastian Grimberg       CeedCheck(num_qpts == num_qpts_out, ceed, CEED_ERROR_UNSUPPORTED,
331506b1a0cSSebastian Grimberg                 "Active input and output bases must have the same number of quadrature points");
332506b1a0cSSebastian Grimberg     }
333ed9e99e6SJeremy L Thompson 
334352a5e7cSSebastian Grimberg     // Construct identity matrix for basis if required
335437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_in[b]; i++) {
336437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_in[b][i] == CEED_EVAL_NONE);
337ed9e99e6SJeremy L Thompson     }
338437c7c90SJeremy L Thompson     for (CeedInt i = 0; i < num_eval_modes_out[b]; i++) {
339437c7c90SJeremy L Thompson       has_eval_none = has_eval_none || (eval_modes_out[b][i] == CEED_EVAL_NONE);
340ed9e99e6SJeremy L Thompson     }
341ed9e99e6SJeremy L Thompson     if (has_eval_none) {
3422b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
3432b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0;
344eaf62fffSJeremy L Thompson     }
345352a5e7cSSebastian Grimberg 
346eaf62fffSJeremy L Thompson     // Compute the diagonal of B^T D B
347eaf62fffSJeremy L Thompson     // Each element
348b94338b9SJed Brown     for (CeedSize e = 0; e < num_elem; e++) {
349eaf62fffSJeremy L Thompson       // Each basis eval mode pair
350352a5e7cSSebastian Grimberg       CeedInt      d_out              = 0, q_comp_out;
351352a5e7cSSebastian Grimberg       CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
3521c66c397SJeremy L Thompson 
353437c7c90SJeremy L Thompson       for (CeedInt e_out = 0; e_out < num_eval_modes_out[b]; e_out++) {
3541c66c397SJeremy L Thompson         CeedInt           d_in              = 0, q_comp_in;
355437c7c90SJeremy L Thompson         const CeedScalar *B_t               = NULL;
3561c66c397SJeremy L Thompson         CeedEvalMode      eval_mode_in_prev = CEED_EVAL_NONE;
3571c66c397SJeremy L Thompson 
358506b1a0cSSebastian Grimberg         CeedCall(CeedOperatorGetBasisPointer(active_bases_out[b], eval_modes_out[b][e_out], identity, &B_t));
359506b1a0cSSebastian Grimberg         CeedCall(CeedBasisGetNumQuadratureComponents(active_bases_out[b], eval_modes_out[b][e_out], &q_comp_out));
360352a5e7cSSebastian Grimberg         if (q_comp_out > 1) {
361352a5e7cSSebastian Grimberg           if (e_out == 0 || eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
362352a5e7cSSebastian Grimberg           else B_t = &B_t[(++d_out) * num_qpts * num_nodes];
363352a5e7cSSebastian Grimberg         }
364352a5e7cSSebastian Grimberg         eval_mode_out_prev = eval_modes_out[b][e_out];
365352a5e7cSSebastian Grimberg 
366437c7c90SJeremy L Thompson         for (CeedInt e_in = 0; e_in < num_eval_modes_in[b]; e_in++) {
367437c7c90SJeremy L Thompson           const CeedScalar *B = NULL;
3681c66c397SJeremy L Thompson 
369506b1a0cSSebastian Grimberg           CeedCall(CeedOperatorGetBasisPointer(active_bases_in[b], eval_modes_in[b][e_in], identity, &B));
370506b1a0cSSebastian Grimberg           CeedCall(CeedBasisGetNumQuadratureComponents(active_bases_in[b], eval_modes_in[b][e_in], &q_comp_in));
371352a5e7cSSebastian Grimberg           if (q_comp_in > 1) {
372352a5e7cSSebastian Grimberg             if (e_in == 0 || eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
373352a5e7cSSebastian Grimberg             else B = &B[(++d_in) * num_qpts * num_nodes];
374352a5e7cSSebastian Grimberg           }
375352a5e7cSSebastian Grimberg           eval_mode_in_prev = eval_modes_in[b][e_in];
376352a5e7cSSebastian Grimberg 
377eaf62fffSJeremy L Thompson           // Each component
378506b1a0cSSebastian Grimberg           for (CeedInt c_out = 0; c_out < num_comp; c_out++) {
379437c7c90SJeremy L Thompson             // Each qpt/node pair
3802b730f8bSJeremy L Thompson             for (CeedInt q = 0; q < num_qpts; q++) {
381bd83916cSSebastian Grimberg               if (is_point_block) {
382eaf62fffSJeremy L Thompson                 // Point Block Diagonal
383506b1a0cSSebastian Grimberg                 for (CeedInt c_in = 0; c_in < num_comp; c_in++) {
384b94338b9SJed Brown                   const CeedSize c_offset = (eval_mode_offsets_in[b][e_in] + c_in) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
385506b1a0cSSebastian Grimberg                   const CeedScalar qf_value = assembled_qf_array[q * layout_qf[0] + c_offset * layout_qf[1] + e * layout_qf[2]];
3861c66c397SJeremy L Thompson 
3872b730f8bSJeremy L Thompson                   for (CeedInt n = 0; n < num_nodes; n++) {
388506b1a0cSSebastian Grimberg                     elem_diag_array[((e * num_comp + c_out) * num_comp + c_in) * num_nodes + n] +=
389437c7c90SJeremy L Thompson                         B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
390eaf62fffSJeremy L Thompson                   }
3912b730f8bSJeremy L Thompson                 }
392eaf62fffSJeremy L Thompson               } else {
393eaf62fffSJeremy L Thompson                 // Diagonal Only
394437c7c90SJeremy L Thompson                 const CeedInt    c_offset = (eval_mode_offsets_in[b][e_in] + c_out) * num_output_components + eval_mode_offsets_out[b][e_out] + c_out;
395506b1a0cSSebastian Grimberg                 const CeedScalar qf_value = assembled_qf_array[q * layout_qf[0] + c_offset * layout_qf[1] + e * layout_qf[2]];
3961c66c397SJeremy L Thompson 
3972b730f8bSJeremy L Thompson                 for (CeedInt n = 0; n < num_nodes; n++) {
398506b1a0cSSebastian Grimberg                   elem_diag_array[(e * num_comp + c_out) * num_nodes + n] += B_t[q * num_nodes + n] * qf_value * B[q * num_nodes + n];
399eaf62fffSJeremy L Thompson                 }
400eaf62fffSJeremy L Thompson               }
401eaf62fffSJeremy L Thompson             }
402eaf62fffSJeremy L Thompson           }
4032b730f8bSJeremy L Thompson         }
4042b730f8bSJeremy L Thompson       }
4052b730f8bSJeremy L Thompson     }
4062b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array));
407eaf62fffSJeremy L Thompson 
408eaf62fffSJeremy L Thompson     // Assemble local operator diagonal
4097c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(diag_elem_rstr, CEED_TRANSPOSE, elem_diag, assembled, request));
410eaf62fffSJeremy L Thompson 
411eaf62fffSJeremy L Thompson     // Cleanup
4127c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&diag_elem_rstr));
4132b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&elem_diag));
4142b730f8bSJeremy L Thompson     CeedCall(CeedFree(&identity));
415437c7c90SJeremy L Thompson   }
416437c7c90SJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
417437c7c90SJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
418eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
419eaf62fffSJeremy L Thompson }
420eaf62fffSJeremy L Thompson 
421eaf62fffSJeremy L Thompson /**
422eaf62fffSJeremy L Thompson   @brief Core logic for assembling composite operator diagonal
423eaf62fffSJeremy L Thompson 
424eaf62fffSJeremy L Thompson   @param[in]  op             CeedOperator to assemble point block diagonal
425ea61e9acSJeremy L Thompson   @param[in]  request        Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
426bd83916cSSebastian Grimberg   @param[in]  is_point_block Boolean flag to assemble diagonal or point block diagonal
427eaf62fffSJeremy L Thompson   @param[out] assembled      CeedVector to store assembled diagonal
428eaf62fffSJeremy L Thompson 
429eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
430eaf62fffSJeremy L Thompson 
431eaf62fffSJeremy L Thompson   @ref Developer
432eaf62fffSJeremy L Thompson **/
433bd83916cSSebastian Grimberg static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_point_block,
434eaf62fffSJeremy L Thompson                                                                  CeedVector assembled) {
435eaf62fffSJeremy L Thompson   CeedInt       num_sub;
436eaf62fffSJeremy L Thompson   CeedOperator *suboperators;
4371c66c397SJeremy L Thompson 
438c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub));
439c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators));
440eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_sub; i++) {
441bd83916cSSebastian Grimberg     if (is_point_block) {
4422b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request));
4436aa95790SJeremy L Thompson     } else {
4442b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request));
4456aa95790SJeremy L Thompson     }
446eaf62fffSJeremy L Thompson   }
447eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
448eaf62fffSJeremy L Thompson }
449eaf62fffSJeremy L Thompson 
450eaf62fffSJeremy L Thompson /**
451eaf62fffSJeremy L Thompson   @brief Build nonzero pattern for non-composite operator
452eaf62fffSJeremy L Thompson 
453eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssembleSymbolic()
454eaf62fffSJeremy L Thompson 
455eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble nonzero pattern
456eaf62fffSJeremy L Thompson   @param[in]  offset Offset for number of entries
457eaf62fffSJeremy L Thompson   @param[out] rows   Row number for each entry
458eaf62fffSJeremy L Thompson   @param[out] cols   Column number for each entry
459eaf62fffSJeremy L Thompson 
460eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
461eaf62fffSJeremy L Thompson 
462eaf62fffSJeremy L Thompson   @ref Developer
463eaf62fffSJeremy L Thompson **/
4642b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) {
465f3d47e36SJeremy L Thompson   Ceed                ceed;
466f3d47e36SJeremy L Thompson   bool                is_composite;
467506b1a0cSSebastian Grimberg   CeedSize            num_nodes_in, num_nodes_out, count = 0;
468506b1a0cSSebastian Grimberg   CeedInt             num_elem_in, elem_size_in, num_comp_in, layout_er_in[3];
469506b1a0cSSebastian Grimberg   CeedInt             num_elem_out, elem_size_out, num_comp_out, layout_er_out[3], local_num_entries;
4701c66c397SJeremy L Thompson   CeedScalar         *array;
471506b1a0cSSebastian Grimberg   const CeedScalar   *elem_dof_a_in, *elem_dof_a_out;
472506b1a0cSSebastian Grimberg   CeedVector          index_vec_in, index_vec_out, elem_dof_in, elem_dof_out;
473506b1a0cSSebastian Grimberg   CeedElemRestriction elem_rstr_in, elem_rstr_out, index_elem_rstr_in, index_elem_rstr_out;
4741c66c397SJeremy L Thompson 
475f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
476f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
4776574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
478eaf62fffSJeremy L Thompson 
479506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes_in, &num_nodes_out));
480506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetActiveElemRestrictions(op, &elem_rstr_in, &elem_rstr_out));
481506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_in, &num_elem_in));
482506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_in, &elem_size_in));
483506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_in, &num_comp_in));
484506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetELayout(elem_rstr_in, &layout_er_in));
485eaf62fffSJeremy L Thompson 
486506b1a0cSSebastian Grimberg   // Determine elem_dof relation for input
487506b1a0cSSebastian Grimberg   CeedCall(CeedVectorCreate(ceed, num_nodes_in, &index_vec_in));
488506b1a0cSSebastian Grimberg   CeedCall(CeedVectorGetArrayWrite(index_vec_in, CEED_MEM_HOST, &array));
489506b1a0cSSebastian Grimberg   for (CeedInt i = 0; i < num_nodes_in; i++) array[i] = i;
490506b1a0cSSebastian Grimberg   CeedCall(CeedVectorRestoreArray(index_vec_in, &array));
491506b1a0cSSebastian Grimberg   CeedCall(CeedVectorCreate(ceed, num_elem_in * elem_size_in * num_comp_in, &elem_dof_in));
492506b1a0cSSebastian Grimberg   CeedCall(CeedVectorSetValue(elem_dof_in, 0.0));
493506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr_in, &index_elem_rstr_in));
494506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionApply(index_elem_rstr_in, CEED_NOTRANSPOSE, index_vec_in, elem_dof_in, CEED_REQUEST_IMMEDIATE));
495506b1a0cSSebastian Grimberg   CeedCall(CeedVectorGetArrayRead(elem_dof_in, CEED_MEM_HOST, &elem_dof_a_in));
496506b1a0cSSebastian Grimberg   CeedCall(CeedVectorDestroy(&index_vec_in));
497506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionDestroy(&index_elem_rstr_in));
498506b1a0cSSebastian Grimberg 
499506b1a0cSSebastian Grimberg   if (elem_rstr_in != elem_rstr_out) {
500506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_out, &num_elem_out));
501506b1a0cSSebastian Grimberg     CeedCheck(num_elem_in == num_elem_out, ceed, CEED_ERROR_UNSUPPORTED,
502506b1a0cSSebastian Grimberg               "Active input and output operator restrictions must have the same number of elements");
503506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_out, &elem_size_out));
504506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_out, &num_comp_out));
505506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetELayout(elem_rstr_out, &layout_er_out));
506506b1a0cSSebastian Grimberg 
507506b1a0cSSebastian Grimberg     // Determine elem_dof relation for output
508506b1a0cSSebastian Grimberg     CeedCall(CeedVectorCreate(ceed, num_nodes_out, &index_vec_out));
509506b1a0cSSebastian Grimberg     CeedCall(CeedVectorGetArrayWrite(index_vec_out, CEED_MEM_HOST, &array));
510506b1a0cSSebastian Grimberg     for (CeedInt i = 0; i < num_nodes_out; i++) array[i] = i;
511506b1a0cSSebastian Grimberg     CeedCall(CeedVectorRestoreArray(index_vec_out, &array));
512506b1a0cSSebastian Grimberg     CeedCall(CeedVectorCreate(ceed, num_elem_out * elem_size_out * num_comp_out, &elem_dof_out));
513506b1a0cSSebastian Grimberg     CeedCall(CeedVectorSetValue(elem_dof_out, 0.0));
514506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr_out, &index_elem_rstr_out));
515506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(index_elem_rstr_out, CEED_NOTRANSPOSE, index_vec_out, elem_dof_out, CEED_REQUEST_IMMEDIATE));
516506b1a0cSSebastian Grimberg     CeedCall(CeedVectorGetArrayRead(elem_dof_out, CEED_MEM_HOST, &elem_dof_a_out));
517506b1a0cSSebastian Grimberg     CeedCall(CeedVectorDestroy(&index_vec_out));
518506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&index_elem_rstr_out));
519506b1a0cSSebastian Grimberg   } else {
520506b1a0cSSebastian Grimberg     num_elem_out     = num_elem_in;
521506b1a0cSSebastian Grimberg     elem_size_out    = elem_size_in;
522506b1a0cSSebastian Grimberg     num_comp_out     = num_comp_in;
523506b1a0cSSebastian Grimberg     layout_er_out[0] = layout_er_in[0];
524506b1a0cSSebastian Grimberg     layout_er_out[1] = layout_er_in[1];
525506b1a0cSSebastian Grimberg     layout_er_out[2] = layout_er_in[2];
526506b1a0cSSebastian Grimberg     elem_dof_a_out   = elem_dof_a_in;
527506b1a0cSSebastian Grimberg   }
528506b1a0cSSebastian Grimberg   local_num_entries = elem_size_out * num_comp_out * elem_size_in * num_comp_in * num_elem_in;
529eaf62fffSJeremy L Thompson 
530eaf62fffSJeremy L Thompson   // Determine i, j locations for element matrices
531506b1a0cSSebastian Grimberg   for (CeedInt e = 0; e < num_elem_in; e++) {
532506b1a0cSSebastian Grimberg     for (CeedInt comp_in = 0; comp_in < num_comp_in; comp_in++) {
533506b1a0cSSebastian Grimberg       for (CeedInt comp_out = 0; comp_out < num_comp_out; comp_out++) {
534506b1a0cSSebastian Grimberg         for (CeedInt i = 0; i < elem_size_out; i++) {
535506b1a0cSSebastian Grimberg           for (CeedInt j = 0; j < elem_size_in; j++) {
536506b1a0cSSebastian Grimberg             const CeedInt elem_dof_index_row = i * layout_er_out[0] + comp_out * layout_er_out[1] + e * layout_er_out[2];
537506b1a0cSSebastian Grimberg             const CeedInt elem_dof_index_col = j * layout_er_in[0] + comp_in * layout_er_in[1] + e * layout_er_in[2];
538506b1a0cSSebastian Grimberg             const CeedInt row                = elem_dof_a_out[elem_dof_index_row];
539506b1a0cSSebastian Grimberg             const CeedInt col                = elem_dof_a_in[elem_dof_index_col];
540eaf62fffSJeremy L Thompson 
541eaf62fffSJeremy L Thompson             rows[offset + count] = row;
542eaf62fffSJeremy L Thompson             cols[offset + count] = col;
543eaf62fffSJeremy L Thompson             count++;
544eaf62fffSJeremy L Thompson           }
545eaf62fffSJeremy L Thompson         }
546eaf62fffSJeremy L Thompson       }
547eaf62fffSJeremy L Thompson     }
548eaf62fffSJeremy L Thompson   }
5496574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing assembled entries");
550506b1a0cSSebastian Grimberg   CeedCall(CeedVectorRestoreArrayRead(elem_dof_in, &elem_dof_a_in));
551506b1a0cSSebastian Grimberg   CeedCall(CeedVectorDestroy(&elem_dof_in));
552506b1a0cSSebastian Grimberg   if (elem_rstr_in != elem_rstr_out) {
553506b1a0cSSebastian Grimberg     CeedCall(CeedVectorRestoreArrayRead(elem_dof_out, &elem_dof_a_out));
554506b1a0cSSebastian Grimberg     CeedCall(CeedVectorDestroy(&elem_dof_out));
555506b1a0cSSebastian Grimberg   }
556eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
557eaf62fffSJeremy L Thompson }
558eaf62fffSJeremy L Thompson 
559eaf62fffSJeremy L Thompson /**
560eaf62fffSJeremy L Thompson   @brief Assemble nonzero entries for non-composite operator
561eaf62fffSJeremy L Thompson 
562eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssemble()
563eaf62fffSJeremy L Thompson 
564eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble
565ea61e9acSJeremy L Thompson   @param[in]  offset Offset for number of entries
566eaf62fffSJeremy L Thompson   @param[out] values Values to assemble into matrix
567eaf62fffSJeremy L Thompson 
568eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
569eaf62fffSJeremy L Thompson 
570eaf62fffSJeremy L Thompson   @ref Developer
571eaf62fffSJeremy L Thompson **/
5722b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) {
573f3d47e36SJeremy L Thompson   Ceed ceed;
574f3d47e36SJeremy L Thompson   bool is_composite;
5751c66c397SJeremy L Thompson 
576f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
577f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
5786574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
579f3d47e36SJeremy L Thompson 
580f3d47e36SJeremy L Thompson   // Early exit for empty operator
581f3d47e36SJeremy L Thompson   {
582f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
583f3d47e36SJeremy L Thompson 
584f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
585f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
586f3d47e36SJeremy L Thompson   }
587eaf62fffSJeremy L Thompson 
588cefa2673SJeremy L Thompson   if (op->LinearAssembleSingle) {
589cefa2673SJeremy L Thompson     // Backend version
5902b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSingle(op, offset, values));
591cefa2673SJeremy L Thompson     return CEED_ERROR_SUCCESS;
592cefa2673SJeremy L Thompson   } else {
593cefa2673SJeremy L Thompson     // Operator fallback
594cefa2673SJeremy L Thompson     CeedOperator op_fallback;
595cefa2673SJeremy L Thompson 
5962b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
597cefa2673SJeremy L Thompson     if (op_fallback) {
5982b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values));
599cefa2673SJeremy L Thompson       return CEED_ERROR_SUCCESS;
600cefa2673SJeremy L Thompson     }
601cefa2673SJeremy L Thompson   }
602cefa2673SJeremy L Thompson 
603eaf62fffSJeremy L Thompson   // Assemble QFunction
604506b1a0cSSebastian Grimberg   CeedInt             layout_qf[3];
6051c66c397SJeremy L Thompson   const CeedScalar   *assembled_qf_array;
606c5f45aeaSJeremy L Thompson   CeedVector          assembled_qf        = NULL;
607506b1a0cSSebastian Grimberg   CeedElemRestriction assembled_elem_rstr = NULL;
608eaf62fffSJeremy L Thompson 
609506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &assembled_elem_rstr, CEED_REQUEST_IMMEDIATE));
610506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetELayout(assembled_elem_rstr, &layout_qf));
611506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionDestroy(&assembled_elem_rstr));
612506b1a0cSSebastian Grimberg   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
613eaf62fffSJeremy L Thompson 
614ed9e99e6SJeremy L Thompson   // Get assembly data
615506b1a0cSSebastian Grimberg   CeedInt                  num_elem_in, elem_size_in, num_comp_in, num_qpts_in;
616506b1a0cSSebastian Grimberg   CeedInt                  num_elem_out, elem_size_out, num_comp_out, num_qpts_out, local_num_entries;
617506b1a0cSSebastian Grimberg   const CeedEvalMode     **eval_modes_in, **eval_modes_out;
618506b1a0cSSebastian Grimberg   CeedInt                  num_active_bases_in, *num_eval_modes_in, num_active_bases_out, *num_eval_modes_out;
619506b1a0cSSebastian Grimberg   CeedBasis               *active_bases_in, *active_bases_out, basis_in, basis_out;
620506b1a0cSSebastian Grimberg   const CeedScalar       **B_mats_in, **B_mats_out, *B_mat_in, *B_mat_out;
621506b1a0cSSebastian Grimberg   CeedElemRestriction      elem_rstr_in, elem_rstr_out;
622506b1a0cSSebastian Grimberg   CeedRestrictionType      elem_rstr_type_in, elem_rstr_type_out;
623506b1a0cSSebastian Grimberg   const bool              *elem_rstr_orients_in = NULL, *elem_rstr_orients_out = NULL;
624506b1a0cSSebastian Grimberg   const CeedInt8          *elem_rstr_curl_orients_in = NULL, *elem_rstr_curl_orients_out = NULL;
625506b1a0cSSebastian Grimberg   CeedOperatorAssemblyData data;
626eaf62fffSJeremy L Thompson 
627506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
628506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_active_bases_in, &num_eval_modes_in, &eval_modes_in, NULL, &num_active_bases_out,
629506b1a0cSSebastian Grimberg                                                 &num_eval_modes_out, &eval_modes_out, NULL, NULL));
630506b1a0cSSebastian Grimberg 
631506b1a0cSSebastian Grimberg   CeedCheck(num_active_bases_in == num_active_bases_out && num_active_bases_in == 1, ceed, CEED_ERROR_UNSUPPORTED,
632506b1a0cSSebastian Grimberg             "Cannot assemble operator with multiple active bases");
6336574a04fSJeremy L Thompson   CeedCheck(num_eval_modes_in[0] > 0 && num_eval_modes_out[0] > 0, ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator without inputs/outputs");
634eaf62fffSJeremy L Thompson 
635506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &active_bases_in, &B_mats_in, NULL, &active_bases_out, &B_mats_out));
636506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetActiveElemRestrictions(op, &elem_rstr_in, &elem_rstr_out));
637506b1a0cSSebastian Grimberg   basis_in  = active_bases_in[0];
638506b1a0cSSebastian Grimberg   basis_out = active_bases_out[0];
639506b1a0cSSebastian Grimberg   B_mat_in  = B_mats_in[0];
640506b1a0cSSebastian Grimberg   B_mat_out = B_mats_out[0];
641eaf62fffSJeremy L Thompson 
642506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_in, &num_elem_in));
643506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_in, &elem_size_in));
644506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_in, &num_comp_in));
645506b1a0cSSebastian Grimberg   if (basis_in == CEED_BASIS_NONE) num_qpts_in = elem_size_in;
646506b1a0cSSebastian Grimberg   else CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts_in));
647506b1a0cSSebastian Grimberg 
648506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetType(elem_rstr_in, &elem_rstr_type_in));
649506b1a0cSSebastian Grimberg   if (elem_rstr_type_in == CEED_RESTRICTION_ORIENTED) {
650506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetOrientations(elem_rstr_in, CEED_MEM_HOST, &elem_rstr_orients_in));
651506b1a0cSSebastian Grimberg   } else if (elem_rstr_type_in == CEED_RESTRICTION_CURL_ORIENTED) {
652506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetCurlOrientations(elem_rstr_in, CEED_MEM_HOST, &elem_rstr_curl_orients_in));
6537c1dbaffSSebastian Grimberg   }
6547c1dbaffSSebastian Grimberg 
655506b1a0cSSebastian Grimberg   if (elem_rstr_in != elem_rstr_out) {
656506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumElements(elem_rstr_out, &num_elem_out));
657506b1a0cSSebastian Grimberg     CeedCheck(num_elem_in == num_elem_out, ceed, CEED_ERROR_UNSUPPORTED,
658506b1a0cSSebastian Grimberg               "Active input and output operator restrictions must have the same number of elements");
659506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetElementSize(elem_rstr_out, &elem_size_out));
660506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumComponents(elem_rstr_out, &num_comp_out));
661506b1a0cSSebastian Grimberg     if (basis_out == CEED_BASIS_NONE) num_qpts_out = elem_size_out;
662506b1a0cSSebastian Grimberg     else CeedCall(CeedBasisGetNumQuadraturePoints(basis_out, &num_qpts_out));
663506b1a0cSSebastian Grimberg     CeedCheck(num_qpts_in == num_qpts_out, ceed, CEED_ERROR_UNSUPPORTED,
664506b1a0cSSebastian Grimberg               "Active input and output bases must have the same number of quadrature points");
665eaf62fffSJeremy L Thompson 
666506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetType(elem_rstr_out, &elem_rstr_type_out));
667506b1a0cSSebastian Grimberg     if (elem_rstr_type_out == CEED_RESTRICTION_ORIENTED) {
668506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionGetOrientations(elem_rstr_out, CEED_MEM_HOST, &elem_rstr_orients_out));
669506b1a0cSSebastian Grimberg     } else if (elem_rstr_type_out == CEED_RESTRICTION_CURL_ORIENTED) {
670506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionGetCurlOrientations(elem_rstr_out, CEED_MEM_HOST, &elem_rstr_curl_orients_out));
671506b1a0cSSebastian Grimberg     }
672506b1a0cSSebastian Grimberg   } else {
673506b1a0cSSebastian Grimberg     num_elem_out  = num_elem_in;
674506b1a0cSSebastian Grimberg     elem_size_out = elem_size_in;
675506b1a0cSSebastian Grimberg     num_comp_out  = num_comp_in;
676506b1a0cSSebastian Grimberg     num_qpts_out  = num_qpts_in;
677506b1a0cSSebastian Grimberg 
678506b1a0cSSebastian Grimberg     elem_rstr_orients_out      = elem_rstr_orients_in;
679506b1a0cSSebastian Grimberg     elem_rstr_curl_orients_out = elem_rstr_curl_orients_in;
680506b1a0cSSebastian Grimberg   }
681506b1a0cSSebastian Grimberg   local_num_entries = elem_size_out * num_comp_out * elem_size_in * num_comp_in * num_elem_in;
682506b1a0cSSebastian Grimberg 
683506b1a0cSSebastian Grimberg   // Loop over elements and put in data structure
6847c1dbaffSSebastian Grimberg   // We store B_mat_in, B_mat_out, BTD, elem_mat in row-major order
6851c66c397SJeremy L Thompson   CeedSize    count = 0;
686*123d890dSSebastian Grimberg   CeedScalar *vals, *BTD_mat = NULL, *elem_mat = NULL, *elem_mat_b = NULL;
687506b1a0cSSebastian Grimberg 
688*123d890dSSebastian Grimberg   CeedCall(CeedCalloc(elem_size_out * num_qpts_in * num_eval_modes_in[0], &BTD_mat));
689*123d890dSSebastian Grimberg   CeedCall(CeedCalloc(elem_size_out * elem_size_in, &elem_mat));
690506b1a0cSSebastian Grimberg   if (elem_rstr_curl_orients_in || elem_rstr_curl_orients_out) CeedCall(CeedCalloc(elem_size_out * elem_size_in, &elem_mat_b));
6911c66c397SJeremy L Thompson 
69228ec399dSJeremy L Thompson   CeedCall(CeedVectorGetArray(values, CEED_MEM_HOST, &vals));
693506b1a0cSSebastian Grimberg   for (CeedSize e = 0; e < num_elem_in; e++) {
694506b1a0cSSebastian Grimberg     for (CeedInt comp_in = 0; comp_in < num_comp_in; comp_in++) {
695506b1a0cSSebastian Grimberg       for (CeedInt comp_out = 0; comp_out < num_comp_out; comp_out++) {
696ed9e99e6SJeremy L Thompson         // Compute B^T*D
697506b1a0cSSebastian Grimberg         for (CeedSize n = 0; n < elem_size_out; n++) {
698506b1a0cSSebastian Grimberg           for (CeedSize q = 0; q < num_qpts_in; q++) {
699437c7c90SJeremy L Thompson             for (CeedInt e_in = 0; e_in < num_eval_modes_in[0]; e_in++) {
700506b1a0cSSebastian Grimberg               const CeedSize btd_index = n * (num_qpts_in * num_eval_modes_in[0]) + q * num_eval_modes_in[0] + e_in;
701067fd99fSJeremy L Thompson               CeedScalar     sum       = 0.0;
7021c66c397SJeremy L Thompson 
703437c7c90SJeremy L Thompson               for (CeedInt e_out = 0; e_out < num_eval_modes_out[0]; e_out++) {
704506b1a0cSSebastian Grimberg                 const CeedSize b_out_index     = (q * num_eval_modes_out[0] + e_out) * elem_size_out + n;
705506b1a0cSSebastian Grimberg                 const CeedSize eval_mode_index = ((e_in * num_comp_in + comp_in) * num_eval_modes_out[0] + e_out) * num_comp_out + comp_out;
706b94338b9SJed Brown                 const CeedSize qf_index        = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2];
7071c66c397SJeremy L Thompson 
708067fd99fSJeremy L Thompson                 sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index];
709eaf62fffSJeremy L Thompson               }
710067fd99fSJeremy L Thompson               BTD_mat[btd_index] = sum;
711ed9e99e6SJeremy L Thompson             }
712ed9e99e6SJeremy L Thompson           }
713eaf62fffSJeremy L Thompson         }
7147c1dbaffSSebastian Grimberg 
7157c1dbaffSSebastian Grimberg         // Form element matrix itself (for each block component)
716506b1a0cSSebastian Grimberg         CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size_out, elem_size_in, num_qpts_in * num_eval_modes_in[0]));
717eaf62fffSJeremy L Thompson 
7187c1dbaffSSebastian Grimberg         // Transform the element matrix if required
719506b1a0cSSebastian Grimberg         if (elem_rstr_orients_out) {
720506b1a0cSSebastian Grimberg           const bool *elem_orients = &elem_rstr_orients_out[e * elem_size_out];
7211c66c397SJeremy L Thompson 
722506b1a0cSSebastian Grimberg           for (CeedInt i = 0; i < elem_size_out; i++) {
723506b1a0cSSebastian Grimberg             const double orient = elem_orients[i] ? -1.0 : 1.0;
724506b1a0cSSebastian Grimberg 
725506b1a0cSSebastian Grimberg             for (CeedInt j = 0; j < elem_size_in; j++) {
726506b1a0cSSebastian Grimberg               elem_mat[i * elem_size_in + j] *= orient;
7277c1dbaffSSebastian Grimberg             }
7287c1dbaffSSebastian Grimberg           }
729506b1a0cSSebastian Grimberg         } else if (elem_rstr_curl_orients_out) {
730506b1a0cSSebastian Grimberg           const CeedInt8 *elem_curl_orients = &elem_rstr_curl_orients_out[e * 3 * elem_size_out];
7311c66c397SJeremy L Thompson 
7327c1dbaffSSebastian Grimberg           // T^T*(B^T*D*B)
733506b1a0cSSebastian Grimberg           memcpy(elem_mat_b, elem_mat, elem_size_out * elem_size_in * sizeof(CeedScalar));
734506b1a0cSSebastian Grimberg           for (CeedInt i = 0; i < elem_size_out; i++) {
735506b1a0cSSebastian Grimberg             for (CeedInt j = 0; j < elem_size_in; j++) {
736506b1a0cSSebastian Grimberg               elem_mat[i * elem_size_in + j] = elem_mat_b[i * elem_size_in + j] * elem_curl_orients[3 * i + 1] +
737506b1a0cSSebastian Grimberg                                                (i > 0 ? elem_mat_b[(i - 1) * elem_size_in + j] * elem_curl_orients[3 * i - 1] : 0.0) +
738506b1a0cSSebastian Grimberg                                                (i < elem_size_out - 1 ? elem_mat_b[(i + 1) * elem_size_in + j] * elem_curl_orients[3 * i + 3] : 0.0);
7397c1dbaffSSebastian Grimberg             }
7407c1dbaffSSebastian Grimberg           }
741506b1a0cSSebastian Grimberg         }
742506b1a0cSSebastian Grimberg         if (elem_rstr_orients_in) {
743506b1a0cSSebastian Grimberg           const bool *elem_orients = &elem_rstr_orients_in[e * elem_size_in];
744506b1a0cSSebastian Grimberg 
745506b1a0cSSebastian Grimberg           for (CeedInt i = 0; i < elem_size_out; i++) {
746506b1a0cSSebastian Grimberg             for (CeedInt j = 0; j < elem_size_in; j++) {
747506b1a0cSSebastian Grimberg               elem_mat[i * elem_size_in + j] *= elem_orients[j] ? -1.0 : 1.0;
748506b1a0cSSebastian Grimberg             }
749506b1a0cSSebastian Grimberg           }
750506b1a0cSSebastian Grimberg         } else if (elem_rstr_curl_orients_in) {
751506b1a0cSSebastian Grimberg           const CeedInt8 *elem_curl_orients = &elem_rstr_curl_orients_in[e * 3 * elem_size_in];
752506b1a0cSSebastian Grimberg 
753506b1a0cSSebastian Grimberg           // (B^T*D*B)*T
754506b1a0cSSebastian Grimberg           memcpy(elem_mat_b, elem_mat, elem_size_out * elem_size_in * sizeof(CeedScalar));
755506b1a0cSSebastian Grimberg           for (CeedInt i = 0; i < elem_size_out; i++) {
756506b1a0cSSebastian Grimberg             for (CeedInt j = 0; j < elem_size_in; j++) {
757506b1a0cSSebastian Grimberg               elem_mat[i * elem_size_in + j] = elem_mat_b[i * elem_size_in + j] * elem_curl_orients[3 * j + 1] +
758506b1a0cSSebastian Grimberg                                                (j > 0 ? elem_mat_b[i * elem_size_in + j - 1] * elem_curl_orients[3 * j - 1] : 0.0) +
759506b1a0cSSebastian Grimberg                                                (j < elem_size_in - 1 ? elem_mat_b[i * elem_size_in + j + 1] * elem_curl_orients[3 * j + 3] : 0.0);
7607c1dbaffSSebastian Grimberg             }
7617c1dbaffSSebastian Grimberg           }
7627c1dbaffSSebastian Grimberg         }
7637c1dbaffSSebastian Grimberg 
7647c1dbaffSSebastian Grimberg         // Put element matrix in coordinate data structure
765506b1a0cSSebastian Grimberg         for (CeedInt i = 0; i < elem_size_out; i++) {
766506b1a0cSSebastian Grimberg           for (CeedInt j = 0; j < elem_size_in; j++) {
767506b1a0cSSebastian Grimberg             vals[offset + count] = elem_mat[i * elem_size_in + j];
768eaf62fffSJeremy L Thompson             count++;
769eaf62fffSJeremy L Thompson           }
770eaf62fffSJeremy L Thompson         }
771eaf62fffSJeremy L Thompson       }
772eaf62fffSJeremy L Thompson     }
773eaf62fffSJeremy L Thompson   }
7746574a04fSJeremy L Thompson   CeedCheck(count == local_num_entries, ceed, CEED_ERROR_MAJOR, "Error computing entries");
7752b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(values, &vals));
776eaf62fffSJeremy L Thompson 
777506b1a0cSSebastian Grimberg   // Cleanup
778*123d890dSSebastian Grimberg   CeedCall(CeedFree(&BTD_mat));
779*123d890dSSebastian Grimberg   CeedCall(CeedFree(&elem_mat));
780506b1a0cSSebastian Grimberg   CeedCall(CeedFree(&elem_mat_b));
781506b1a0cSSebastian Grimberg   if (elem_rstr_type_in == CEED_RESTRICTION_ORIENTED) {
782506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionRestoreOrientations(elem_rstr_in, &elem_rstr_orients_in));
783506b1a0cSSebastian Grimberg   } else if (elem_rstr_type_in == CEED_RESTRICTION_CURL_ORIENTED) {
784506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionRestoreCurlOrientations(elem_rstr_in, &elem_rstr_curl_orients_in));
785506b1a0cSSebastian Grimberg   }
786506b1a0cSSebastian Grimberg   if (elem_rstr_in != elem_rstr_out) {
787506b1a0cSSebastian Grimberg     if (elem_rstr_type_out == CEED_RESTRICTION_ORIENTED) {
788506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionRestoreOrientations(elem_rstr_out, &elem_rstr_orients_out));
789506b1a0cSSebastian Grimberg     } else if (elem_rstr_type_out == CEED_RESTRICTION_CURL_ORIENTED) {
790506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionRestoreCurlOrientations(elem_rstr_out, &elem_rstr_curl_orients_out));
791506b1a0cSSebastian Grimberg     }
792506b1a0cSSebastian Grimberg   }
7932b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
7942b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
795eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
796eaf62fffSJeremy L Thompson }
797eaf62fffSJeremy L Thompson 
798eaf62fffSJeremy L Thompson /**
799eaf62fffSJeremy L Thompson   @brief Count number of entries for assembled CeedOperator
800eaf62fffSJeremy L Thompson 
801eaf62fffSJeremy L Thompson   @param[in]  op          CeedOperator to assemble
802eaf62fffSJeremy L Thompson   @param[out] num_entries Number of entries in assembled representation
803eaf62fffSJeremy L Thompson 
804eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
805eaf62fffSJeremy L Thompson 
806eaf62fffSJeremy L Thompson   @ref Utility
807eaf62fffSJeremy L Thompson **/
808b94338b9SJed Brown static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedSize *num_entries) {
809b275c451SJeremy L Thompson   bool                is_composite;
810506b1a0cSSebastian Grimberg   CeedInt             num_elem_in, elem_size_in, num_comp_in, num_elem_out, elem_size_out, num_comp_out;
811506b1a0cSSebastian Grimberg   CeedElemRestriction rstr_in, rstr_out;
812eaf62fffSJeremy L Thompson 
813b275c451SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
8146574a04fSJeremy L Thompson   CeedCheck(!is_composite, op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
815506b1a0cSSebastian Grimberg 
816506b1a0cSSebastian Grimberg   CeedCall(CeedOperatorGetActiveElemRestrictions(op, &rstr_in, &rstr_out));
817506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem_in));
818506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size_in));
819506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp_in));
820506b1a0cSSebastian Grimberg   if (rstr_in != rstr_out) {
821506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumElements(rstr_out, &num_elem_out));
822506b1a0cSSebastian Grimberg     CeedCheck(num_elem_in == num_elem_out, op->ceed, CEED_ERROR_UNSUPPORTED,
823506b1a0cSSebastian Grimberg               "Active input and output operator restrictions must have the same number of elements");
824506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetElementSize(rstr_out, &elem_size_out));
825506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetNumComponents(rstr_out, &num_comp_out));
826506b1a0cSSebastian Grimberg   } else {
827506b1a0cSSebastian Grimberg     num_elem_out  = num_elem_in;
828506b1a0cSSebastian Grimberg     elem_size_out = elem_size_in;
829506b1a0cSSebastian Grimberg     num_comp_out  = num_comp_in;
830506b1a0cSSebastian Grimberg   }
831506b1a0cSSebastian Grimberg   *num_entries = (CeedSize)elem_size_in * num_comp_in * elem_size_out * num_comp_out * num_elem_in;
832eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
833eaf62fffSJeremy L Thompson }
834eaf62fffSJeremy L Thompson 
835eaf62fffSJeremy L Thompson /**
836ea61e9acSJeremy L Thompson   @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator
837eaf62fffSJeremy L Thompson 
838eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
83985bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
840eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
841eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
84285bb9dcfSJeremy L Thompson   @param[in]  basis_c_to_f Basis for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
843eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
84485bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
8457758292fSSebastian Grimberg   @param[out] op_restrict  Fine to coarse operator, or NULL
846eaf62fffSJeremy L Thompson 
847eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
848eaf62fffSJeremy L Thompson 
849eaf62fffSJeremy L Thompson   @ref Developer
850eaf62fffSJeremy L Thompson **/
8512b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
8527758292fSSebastian Grimberg                                             CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
8531c66c397SJeremy L Thompson   bool                is_composite;
854eaf62fffSJeremy L Thompson   Ceed                ceed;
8551c66c397SJeremy L Thompson   CeedInt             num_comp;
85685bb9dcfSJeremy L Thompson   CeedVector          mult_vec         = NULL;
8571c66c397SJeremy L Thompson   CeedElemRestriction rstr_p_mult_fine = NULL, rstr_fine = NULL;
8581c66c397SJeremy L Thompson 
8592b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
860eaf62fffSJeremy L Thompson 
861eaf62fffSJeremy L Thompson   // Check for composite operator
8622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op_fine, &is_composite));
8636574a04fSJeremy L Thompson   CeedCheck(!is_composite, ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported");
864eaf62fffSJeremy L Thompson 
865eaf62fffSJeremy L Thompson   // Coarse Grid
8662b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse));
867eaf62fffSJeremy L Thompson   // -- Clone input fields
86892ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) {
869eaf62fffSJeremy L Thompson     if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) {
870437c7c90SJeremy L Thompson       rstr_fine = op_fine->input_fields[i]->elem_rstr;
8712b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
872eaf62fffSJeremy L Thompson     } else {
873437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_rstr,
8742b730f8bSJeremy L Thompson                                     op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec));
875eaf62fffSJeremy L Thompson     }
876eaf62fffSJeremy L Thompson   }
877eaf62fffSJeremy L Thompson   // -- Clone output fields
87892ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) {
879eaf62fffSJeremy L Thompson     if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) {
8802b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
881eaf62fffSJeremy L Thompson     } else {
882437c7c90SJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_rstr,
8832b730f8bSJeremy L Thompson                                     op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec));
884eaf62fffSJeremy L Thompson     }
885eaf62fffSJeremy L Thompson   }
886af99e877SJeremy L Thompson   // -- Clone QFunctionAssemblyData
8872b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled));
888eaf62fffSJeremy L Thompson 
889eaf62fffSJeremy L Thompson   // Multiplicity vector
8907758292fSSebastian Grimberg   if (op_restrict || op_prolong) {
89185bb9dcfSJeremy L Thompson     CeedVector          mult_e_vec;
8921c66c397SJeremy L Thompson     CeedRestrictionType rstr_type;
89385bb9dcfSJeremy L Thompson 
8947c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionGetType(rstr_fine, &rstr_type));
8957c1dbaffSSebastian Grimberg     CeedCheck(rstr_type != CEED_RESTRICTION_CURL_ORIENTED, ceed, CEED_ERROR_UNSUPPORTED,
8967c1dbaffSSebastian Grimberg               "Element restrictions created with CeedElemRestrictionCreateCurlOriented are not supported");
8976574a04fSJeremy L Thompson     CeedCheck(p_mult_fine, ceed, CEED_ERROR_INCOMPATIBLE, "Prolongation or restriction operator creation requires fine grid multiplicity vector");
8987c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateUnsignedCopy(rstr_fine, &rstr_p_mult_fine));
8992b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec));
9002b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_e_vec, 0.0));
901c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE));
9022b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(mult_vec, 0.0));
903c17ec2beSJeremy L Thompson     CeedCall(CeedElemRestrictionApply(rstr_p_mult_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE));
9042b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&mult_e_vec));
9052b730f8bSJeremy L Thompson     CeedCall(CeedVectorReciprocal(mult_vec));
90685bb9dcfSJeremy L Thompson   }
907eaf62fffSJeremy L Thompson 
908addd79feSZach Atkins   // Clone name
909addd79feSZach Atkins   bool   has_name = op_fine->name;
910addd79feSZach Atkins   size_t name_len = op_fine->name ? strlen(op_fine->name) : 0;
911addd79feSZach Atkins   CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name));
912addd79feSZach Atkins 
9137758292fSSebastian Grimberg   // Check that coarse to fine basis is provided if prolong/restrict operators are requested
9147758292fSSebastian Grimberg   CeedCheck(basis_c_to_f || (!op_restrict && !op_prolong), ceed, CEED_ERROR_INCOMPATIBLE,
9156574a04fSJeremy L Thompson             "Prolongation or restriction operator creation requires coarse-to-fine basis");
91683d6adf3SZach Atkins 
91785bb9dcfSJeremy L Thompson   // Restriction/Prolongation Operators
9182b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp));
919addd79feSZach Atkins 
920addd79feSZach Atkins   // Restriction
9217758292fSSebastian Grimberg   if (op_restrict) {
922eaf62fffSJeremy L Thompson     CeedInt             *num_comp_r_data;
92385bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_r;
9247758292fSSebastian Grimberg     CeedQFunction        qf_restrict;
92585bb9dcfSJeremy L Thompson 
9267758292fSSebastian Grimberg     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict));
9272b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_r_data));
928eaf62fffSJeremy L Thompson     num_comp_r_data[0] = num_comp;
9292b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r));
9302b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data));
9317758292fSSebastian Grimberg     CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r));
9322b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_r));
9337758292fSSebastian Grimberg     CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE));
9347758292fSSebastian Grimberg     CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE));
9357758292fSSebastian Grimberg     CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP));
9367758292fSSebastian Grimberg     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp));
937eaf62fffSJeremy L Thompson 
9387758292fSSebastian Grimberg     CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict));
9397758292fSSebastian Grimberg     CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
9407758292fSSebastian Grimberg     CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_p_mult_fine, CEED_BASIS_NONE, mult_vec));
9417758292fSSebastian Grimberg     CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
942eaf62fffSJeremy L Thompson 
943addd79feSZach Atkins     // Set name
944addd79feSZach Atkins     char *restriction_name;
9451c66c397SJeremy L Thompson 
946addd79feSZach Atkins     CeedCall(CeedCalloc(17 + name_len, &restriction_name));
947addd79feSZach Atkins     sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
9487758292fSSebastian Grimberg     CeedCall(CeedOperatorSetName(*op_restrict, restriction_name));
949addd79feSZach Atkins     CeedCall(CeedFree(&restriction_name));
950addd79feSZach Atkins 
951addd79feSZach Atkins     // Check
9527758292fSSebastian Grimberg     CeedCall(CeedOperatorCheckReady(*op_restrict));
953addd79feSZach Atkins 
954addd79feSZach Atkins     // Cleanup
9557758292fSSebastian Grimberg     CeedCall(CeedQFunctionDestroy(&qf_restrict));
956addd79feSZach Atkins   }
957addd79feSZach Atkins 
958eaf62fffSJeremy L Thompson   // Prolongation
959addd79feSZach Atkins   if (op_prolong) {
960eaf62fffSJeremy L Thompson     CeedInt             *num_comp_p_data;
96185bb9dcfSJeremy L Thompson     CeedQFunctionContext ctx_p;
9621c66c397SJeremy L Thompson     CeedQFunction        qf_prolong;
96385bb9dcfSJeremy L Thompson 
96485bb9dcfSJeremy L Thompson     CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong));
9652b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_p_data));
966eaf62fffSJeremy L Thompson     num_comp_p_data[0] = num_comp;
9672b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p));
9682b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data));
9692b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p));
9702b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextDestroy(&ctx_p));
9712b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP));
9722b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE));
9732b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE));
9742b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp));
975eaf62fffSJeremy L Thompson 
9762b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong));
9772b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
978356036faSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_p_mult_fine, CEED_BASIS_NONE, mult_vec));
979356036faSJeremy L Thompson     CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
980eaf62fffSJeremy L Thompson 
981addd79feSZach Atkins     // Set name
982ea6b5821SJeremy L Thompson     char *prolongation_name;
9831c66c397SJeremy L Thompson 
9842b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(18 + name_len, &prolongation_name));
9852b730f8bSJeremy L Thompson     sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
9862b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name));
9872b730f8bSJeremy L Thompson     CeedCall(CeedFree(&prolongation_name));
988addd79feSZach Atkins 
989addd79feSZach Atkins     // Check
990addd79feSZach Atkins     CeedCall(CeedOperatorCheckReady(*op_prolong));
991addd79feSZach Atkins 
992addd79feSZach Atkins     // Cleanup
993addd79feSZach Atkins     CeedCall(CeedQFunctionDestroy(&qf_prolong));
994ea6b5821SJeremy L Thompson   }
995ea6b5821SJeremy L Thompson 
99658e4b056SJeremy L Thompson   // Check
99758e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_coarse));
99858e4b056SJeremy L Thompson 
999eaf62fffSJeremy L Thompson   // Cleanup
10002b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_vec));
1001c17ec2beSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_p_mult_fine));
10022b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&basis_c_to_f));
1003eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1004eaf62fffSJeremy L Thompson }
1005eaf62fffSJeremy L Thompson 
1006eaf62fffSJeremy L Thompson /**
1007eaf62fffSJeremy L Thompson   @brief Build 1D mass matrix and Laplacian with perturbation
1008eaf62fffSJeremy L Thompson 
1009eaf62fffSJeremy L Thompson   @param[in]  interp_1d   Interpolation matrix in one dimension
1010eaf62fffSJeremy L Thompson   @param[in]  grad_1d     Gradient matrix in one dimension
1011eaf62fffSJeremy L Thompson   @param[in]  q_weight_1d Quadrature weights in one dimension
1012eaf62fffSJeremy L Thompson   @param[in]  P_1d        Number of basis nodes in one dimension
1013eaf62fffSJeremy L Thompson   @param[in]  Q_1d        Number of quadrature points in one dimension
1014eaf62fffSJeremy L Thompson   @param[in]  dim         Dimension of basis
1015eaf62fffSJeremy L Thompson   @param[out] mass        Assembled mass matrix in one dimension
1016eaf62fffSJeremy L Thompson   @param[out] laplace     Assembled perturbed Laplacian in one dimension
1017eaf62fffSJeremy L Thompson 
1018eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1019eaf62fffSJeremy L Thompson 
1020eaf62fffSJeremy L Thompson   @ref Developer
1021eaf62fffSJeremy L Thompson **/
10222c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOff
10232c2ea1dbSJeremy L Thompson static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d, CeedInt P_1d, CeedInt Q_1d,
10242c2ea1dbSJeremy L Thompson                                 CeedInt dim, CeedScalar *mass, CeedScalar *laplace) {
10252b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
1026eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
1027eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
10282b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j];
1029eaf62fffSJeremy L Thompson       mass[i + j * P_1d] = sum;
1030eaf62fffSJeremy L Thompson     }
10312b730f8bSJeremy L Thompson   }
1032eaf62fffSJeremy L Thompson   // -- Laplacian
10332b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
1034eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
1035eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
10361c66c397SJeremy L Thompson 
10372b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j];
1038eaf62fffSJeremy L Thompson       laplace[i + j * P_1d] = sum;
1039eaf62fffSJeremy L Thompson     }
10402b730f8bSJeremy L Thompson   }
1041eaf62fffSJeremy L Thompson   CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4;
10422b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation;
1043eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1044eaf62fffSJeremy L Thompson }
10452c2ea1dbSJeremy L Thompson CeedPragmaOptimizeOn
1046eaf62fffSJeremy L Thompson 
1047eaf62fffSJeremy L Thompson /// @}
1048eaf62fffSJeremy L Thompson 
1049eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1050480fae85SJeremy L Thompson /// CeedOperator Backend API
1051480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1052480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend
1053480fae85SJeremy L Thompson /// @{
1054480fae85SJeremy L Thompson 
1055480fae85SJeremy L Thompson /**
1056506b1a0cSSebastian Grimberg   @brief Create point block restriction for active operator field
1057506b1a0cSSebastian Grimberg 
1058506b1a0cSSebastian Grimberg   @param[in]  rstr             Original CeedElemRestriction for active field
1059506b1a0cSSebastian Grimberg   @param[out] point_block_rstr Address of the variable where the newly created CeedElemRestriction will be stored
1060506b1a0cSSebastian Grimberg 
1061506b1a0cSSebastian Grimberg   @return An error code: 0 - success, otherwise - failure
1062506b1a0cSSebastian Grimberg 
1063506b1a0cSSebastian Grimberg   @ref Backend
1064506b1a0cSSebastian Grimberg **/
1065506b1a0cSSebastian Grimberg int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *point_block_rstr) {
1066506b1a0cSSebastian Grimberg   Ceed           ceed;
1067506b1a0cSSebastian Grimberg   CeedInt        num_elem, num_comp, shift, elem_size, comp_stride, *point_block_offsets;
1068506b1a0cSSebastian Grimberg   CeedSize       l_size;
1069506b1a0cSSebastian Grimberg   const CeedInt *offsets;
1070506b1a0cSSebastian Grimberg 
1071506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed));
1072506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets));
1073506b1a0cSSebastian Grimberg 
1074506b1a0cSSebastian Grimberg   // Expand offsets
1075506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
1076506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
1077506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
1078506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride));
1079506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
1080506b1a0cSSebastian Grimberg   shift = num_comp;
1081506b1a0cSSebastian Grimberg   if (comp_stride != 1) shift *= num_comp;
1082506b1a0cSSebastian Grimberg   CeedCall(CeedCalloc(num_elem * elem_size, &point_block_offsets));
1083506b1a0cSSebastian Grimberg   for (CeedInt i = 0; i < num_elem * elem_size; i++) {
1084506b1a0cSSebastian Grimberg     point_block_offsets[i] = offsets[i] * shift;
1085506b1a0cSSebastian Grimberg   }
1086506b1a0cSSebastian Grimberg 
1087506b1a0cSSebastian Grimberg   // Create new restriction
1088506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER,
1089506b1a0cSSebastian Grimberg                                      point_block_offsets, point_block_rstr));
1090506b1a0cSSebastian Grimberg 
1091506b1a0cSSebastian Grimberg   // Cleanup
1092506b1a0cSSebastian Grimberg   CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets));
1093506b1a0cSSebastian Grimberg   return CEED_ERROR_SUCCESS;
1094506b1a0cSSebastian Grimberg }
1095506b1a0cSSebastian Grimberg 
1096506b1a0cSSebastian Grimberg /**
1097480fae85SJeremy L Thompson   @brief Create object holding CeedQFunction assembly data for CeedOperator
1098480fae85SJeremy L Thompson 
1099480fae85SJeremy L Thompson   @param[in]  ceed A Ceed object where the CeedQFunctionAssemblyData will be created
1100ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored
1101480fae85SJeremy L Thompson 
1102480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1103480fae85SJeremy L Thompson 
1104480fae85SJeremy L Thompson   @ref Backend
1105480fae85SJeremy L Thompson **/
1106ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) {
11072b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1108480fae85SJeremy L Thompson   (*data)->ref_count = 1;
1109480fae85SJeremy L Thompson   (*data)->ceed      = ceed;
11102b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1111480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1112480fae85SJeremy L Thompson }
1113480fae85SJeremy L Thompson 
1114480fae85SJeremy L Thompson /**
1115480fae85SJeremy L Thompson   @brief Increment the reference counter for a CeedQFunctionAssemblyData
1116480fae85SJeremy L Thompson 
1117ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter
1118480fae85SJeremy L Thompson 
1119480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1120480fae85SJeremy L Thompson 
1121480fae85SJeremy L Thompson   @ref Backend
1122480fae85SJeremy L Thompson **/
1123480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) {
1124480fae85SJeremy L Thompson   data->ref_count++;
1125480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1126480fae85SJeremy L Thompson }
1127480fae85SJeremy L Thompson 
1128480fae85SJeremy L Thompson /**
1129beecbf24SJeremy L Thompson   @brief Set re-use of CeedQFunctionAssemblyData
11308b919e6bSJeremy L Thompson 
1131ea61e9acSJeremy L Thompson   @param[in,out] data       CeedQFunctionAssemblyData to mark for reuse
1132ea61e9acSJeremy L Thompson   @param[in]     reuse_data Boolean flag indicating data re-use
11338b919e6bSJeremy L Thompson 
11348b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
11358b919e6bSJeremy L Thompson 
11368b919e6bSJeremy L Thompson   @ref Backend
11378b919e6bSJeremy L Thompson **/
11382b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) {
1139beecbf24SJeremy L Thompson   data->reuse_data        = reuse_data;
1140beecbf24SJeremy L Thompson   data->needs_data_update = true;
1141beecbf24SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1142beecbf24SJeremy L Thompson }
1143beecbf24SJeremy L Thompson 
1144beecbf24SJeremy L Thompson /**
1145beecbf24SJeremy L Thompson   @brief Mark QFunctionAssemblyData as stale
1146beecbf24SJeremy L Thompson 
1147ea61e9acSJeremy L Thompson   @param[in,out] data              CeedQFunctionAssemblyData to mark as stale
1148ea61e9acSJeremy L Thompson   @param[in]     needs_data_update Boolean flag indicating if update is needed or completed
1149beecbf24SJeremy L Thompson 
1150beecbf24SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1151beecbf24SJeremy L Thompson 
1152beecbf24SJeremy L Thompson   @ref Backend
1153beecbf24SJeremy L Thompson **/
11542b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) {
1155beecbf24SJeremy L Thompson   data->needs_data_update = needs_data_update;
11568b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
11578b919e6bSJeremy L Thompson }
11588b919e6bSJeremy L Thompson 
11598b919e6bSJeremy L Thompson /**
11608b919e6bSJeremy L Thompson   @brief Determine if QFunctionAssemblyData needs update
11618b919e6bSJeremy L Thompson 
11628b919e6bSJeremy L Thompson   @param[in]  data             CeedQFunctionAssemblyData to mark as stale
11638b919e6bSJeremy L Thompson   @param[out] is_update_needed Boolean flag indicating if re-assembly is required
11648b919e6bSJeremy L Thompson 
11658b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
11668b919e6bSJeremy L Thompson 
11678b919e6bSJeremy L Thompson   @ref Backend
11688b919e6bSJeremy L Thompson **/
11692b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) {
1170beecbf24SJeremy L Thompson   *is_update_needed = !data->reuse_data || data->needs_data_update;
11718b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
11728b919e6bSJeremy L Thompson }
11738b919e6bSJeremy L Thompson 
11748b919e6bSJeremy L Thompson /**
1175ea61e9acSJeremy L Thompson   @brief Copy the pointer to a CeedQFunctionAssemblyData.
11764385fb7fSSebastian Grimberg 
1177ea61e9acSJeremy L Thompson   Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`.
1178512bb800SJeremy L Thompson 
1179512bb800SJeremy L Thompson   Note: If the value of `data_copy` passed to this function is non-NULL, then it is assumed that `*data_copy` is a pointer to a
1180512bb800SJeremy L Thompson         CeedQFunctionAssemblyData. This CeedQFunctionAssemblyData will be destroyed if `data_copy` is the only reference to this
1181512bb800SJeremy L Thompson         CeedQFunctionAssemblyData.
1182480fae85SJeremy L Thompson 
1183ea61e9acSJeremy L Thompson   @param[in]     data      CeedQFunctionAssemblyData to copy reference to
1184ea61e9acSJeremy L Thompson   @param[in,out] data_copy Variable to store copied reference
1185480fae85SJeremy L Thompson 
1186480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1187480fae85SJeremy L Thompson 
1188480fae85SJeremy L Thompson   @ref Backend
1189480fae85SJeremy L Thompson **/
11902b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) {
11912b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReference(data));
11922b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy));
1193480fae85SJeremy L Thompson   *data_copy = data;
1194480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1195480fae85SJeremy L Thompson }
1196480fae85SJeremy L Thompson 
1197480fae85SJeremy L Thompson /**
1198480fae85SJeremy L Thompson   @brief Get setup status for internal objects for CeedQFunctionAssemblyData
1199480fae85SJeremy L Thompson 
1200ea61e9acSJeremy L Thompson   @param[in]  data     CeedQFunctionAssemblyData to retrieve status
1201480fae85SJeremy L Thompson   @param[out] is_setup Boolean flag for setup status
1202480fae85SJeremy L Thompson 
1203480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1204480fae85SJeremy L Thompson 
1205480fae85SJeremy L Thompson   @ref Backend
1206480fae85SJeremy L Thompson **/
12072b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) {
1208480fae85SJeremy L Thompson   *is_setup = data->is_setup;
1209480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1210480fae85SJeremy L Thompson }
1211480fae85SJeremy L Thompson 
1212480fae85SJeremy L Thompson /**
1213480fae85SJeremy L Thompson   @brief Set internal objects for CeedQFunctionAssemblyData
1214480fae85SJeremy L Thompson 
1215ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to set objects
1216480fae85SJeremy L Thompson   @param[in]     vec  CeedVector to store assembled CeedQFunction at quadrature points
1217480fae85SJeremy L Thompson   @param[in]     rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction
1218480fae85SJeremy L Thompson 
1219480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1220480fae85SJeremy L Thompson 
1221480fae85SJeremy L Thompson   @ref Backend
1222480fae85SJeremy L Thompson **/
12232b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) {
12242b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(vec, &data->vec));
12252b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr));
1226480fae85SJeremy L Thompson 
1227480fae85SJeremy L Thompson   data->is_setup = true;
1228480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1229480fae85SJeremy L Thompson }
1230480fae85SJeremy L Thompson 
12312b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) {
12326574a04fSJeremy L Thompson   CeedCheck(data->is_setup, data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first.");
1233480fae85SJeremy L Thompson 
12342b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(data->vec, vec));
12352b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr));
1236480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1237480fae85SJeremy L Thompson }
1238480fae85SJeremy L Thompson 
1239480fae85SJeremy L Thompson /**
1240480fae85SJeremy L Thompson   @brief Destroy CeedQFunctionAssemblyData
1241480fae85SJeremy L Thompson 
1242ea61e9acSJeremy L Thompson   @param[in,out] data  CeedQFunctionAssemblyData to destroy
1243480fae85SJeremy L Thompson 
1244480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1245480fae85SJeremy L Thompson 
1246480fae85SJeremy L Thompson   @ref Backend
1247480fae85SJeremy L Thompson **/
1248480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) {
1249ad6481ceSJeremy L Thompson   if (!*data || --(*data)->ref_count > 0) {
1250ad6481ceSJeremy L Thompson     *data = NULL;
1251ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1252ad6481ceSJeremy L Thompson   }
12532b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
12542b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&(*data)->vec));
12552b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr));
1256480fae85SJeremy L Thompson 
12572b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1258480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1259480fae85SJeremy L Thompson }
1260480fae85SJeremy L Thompson 
1261ed9e99e6SJeremy L Thompson /**
1262ed9e99e6SJeremy L Thompson   @brief Get CeedOperatorAssemblyData
1263ed9e99e6SJeremy L Thompson 
1264ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to assemble
1265ed9e99e6SJeremy L Thompson   @param[out] data CeedQFunctionAssemblyData
1266ed9e99e6SJeremy L Thompson 
1267ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1268ed9e99e6SJeremy L Thompson 
1269ed9e99e6SJeremy L Thompson   @ref Backend
1270ed9e99e6SJeremy L Thompson **/
12712b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) {
1272ed9e99e6SJeremy L Thompson   if (!op->op_assembled) {
1273ed9e99e6SJeremy L Thompson     CeedOperatorAssemblyData data;
1274ed9e99e6SJeremy L Thompson 
12752b730f8bSJeremy L Thompson     CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data));
1276ed9e99e6SJeremy L Thompson     op->op_assembled = data;
1277ed9e99e6SJeremy L Thompson   }
1278ed9e99e6SJeremy L Thompson   *data = op->op_assembled;
1279ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1280ed9e99e6SJeremy L Thompson }
1281ed9e99e6SJeremy L Thompson 
1282ed9e99e6SJeremy L Thompson /**
1283ba746a46SJeremy L Thompson   @brief Create object holding CeedOperator assembly data.
1284ba746a46SJeremy L Thompson 
1285ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array with references to every active CeedBasis used in the CeedOperator.
1286ba746a46SJeremy L Thompson   An array with references to the corresponding active CeedElemRestrictions is also stored.
1287ba746a46SJeremy L Thompson   For each active CeedBasis, the CeedOperatorAssemblyData holds an array of all input and output CeedEvalModes for this CeedBasis.
1288ba746a46SJeremy L Thompson   The CeedOperatorAssemblyData holds an array of offsets for indexing into the assembled CeedQFunction arrays to the row representing each
1289ba746a46SJeremy L Thompson CeedEvalMode.
1290ba746a46SJeremy L Thompson   The number of input columns across all active bases for the assembled CeedQFunction is also stored.
1291ba746a46SJeremy L Thompson   Lastly, the CeedOperatorAssembly data holds assembled matrices representing the full action of the CeedBasis for all CeedEvalModes.
1292ed9e99e6SJeremy L Thompson 
1293ea61e9acSJeremy L Thompson   @param[in]  ceed Ceed object where the CeedOperatorAssemblyData will be created
1294ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to be assembled
1295ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored
1296ed9e99e6SJeremy L Thompson 
1297ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1298ed9e99e6SJeremy L Thompson 
1299ed9e99e6SJeremy L Thompson   @ref Backend
1300ed9e99e6SJeremy L Thompson **/
13012b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) {
1302506b1a0cSSebastian Grimberg   CeedInt             num_active_bases_in = 0, num_active_bases_out = 0, offset = 0;
1303506b1a0cSSebastian Grimberg   CeedInt             num_input_fields, *num_eval_modes_in = NULL, num_output_fields, *num_eval_modes_out = NULL;
13041c66c397SJeremy L Thompson   CeedSize          **eval_mode_offsets_in = NULL, **eval_mode_offsets_out = NULL;
13051c66c397SJeremy L Thompson   CeedEvalMode      **eval_modes_in = NULL, **eval_modes_out = NULL;
13061c66c397SJeremy L Thompson   CeedQFunctionField *qf_fields;
13071c66c397SJeremy L Thompson   CeedQFunction       qf;
13081c66c397SJeremy L Thompson   CeedOperatorField  *op_fields;
130901f0e615SJames Wright   bool                is_composite;
131001f0e615SJames Wright 
131101f0e615SJames Wright   CeedCall(CeedOperatorIsComposite(op, &is_composite));
131201f0e615SJames Wright   CeedCheck(!is_composite, ceed, CEED_ERROR_INCOMPATIBLE, "Can only create CeedOperator assembly data for non-composite operators.");
1313437c7c90SJeremy L Thompson 
1314437c7c90SJeremy L Thompson   // Allocate
13152b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1316ed9e99e6SJeremy L Thompson   (*data)->ceed = ceed;
13172b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1318ed9e99e6SJeremy L Thompson 
1319ed9e99e6SJeremy L Thompson   // Build OperatorAssembly data
13202b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
13212b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL));
13222b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL));
1323ed9e99e6SJeremy L Thompson 
1324ed9e99e6SJeremy L Thompson   // Determine active input basis
1325ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
1326ed9e99e6SJeremy L Thompson     CeedVector vec;
13271c66c397SJeremy L Thompson 
13282b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1329ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
13307c1dbaffSSebastian Grimberg       CeedInt      index = -1, num_comp, q_comp;
13311c66c397SJeremy L Thompson       CeedEvalMode eval_mode;
13321c66c397SJeremy L Thompson       CeedBasis    basis_in = NULL;
13331c66c397SJeremy L Thompson 
13342b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in));
13352b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1336352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp));
1337352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_in, eval_mode, &q_comp));
1338506b1a0cSSebastian Grimberg       for (CeedInt i = 0; i < num_active_bases_in; i++) {
1339506b1a0cSSebastian Grimberg         if ((*data)->active_bases_in[i] == basis_in) index = i;
1340437c7c90SJeremy L Thompson       }
1341437c7c90SJeremy L Thompson       if (index == -1) {
1342437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_in;
13431c66c397SJeremy L Thompson 
1344506b1a0cSSebastian Grimberg         index = num_active_bases_in;
1345506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->active_bases_in));
1346506b1a0cSSebastian Grimberg         (*data)->active_bases_in[num_active_bases_in] = NULL;
1347506b1a0cSSebastian Grimberg         CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->active_bases_in[num_active_bases_in]));
1348506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->active_elem_rstrs_in));
1349506b1a0cSSebastian Grimberg         (*data)->active_elem_rstrs_in[num_active_bases_in] = NULL;
1350437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_in));
1351506b1a0cSSebastian Grimberg         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_in, &(*data)->active_elem_rstrs_in[num_active_bases_in]));
1352506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &num_eval_modes_in));
1353437c7c90SJeremy L Thompson         num_eval_modes_in[index] = 0;
1354506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &eval_modes_in));
1355437c7c90SJeremy L Thompson         eval_modes_in[index] = NULL;
1356506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &eval_mode_offsets_in));
1357437c7c90SJeremy L Thompson         eval_mode_offsets_in[index] = NULL;
1358506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_in + 1, &(*data)->assembled_bases_in));
1359437c7c90SJeremy L Thompson         (*data)->assembled_bases_in[index] = NULL;
1360506b1a0cSSebastian Grimberg         num_active_bases_in++;
1361437c7c90SJeremy L Thompson       }
1362352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1363352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1364352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_modes_in[index]));
1365352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_in[index] + q_comp, &eval_mode_offsets_in[index]));
1366352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1367437c7c90SJeremy L Thompson           eval_modes_in[index][num_eval_modes_in[index] + d]        = eval_mode;
1368437c7c90SJeremy L Thompson           eval_mode_offsets_in[index][num_eval_modes_in[index] + d] = offset;
1369352a5e7cSSebastian Grimberg           offset += num_comp;
1370ed9e99e6SJeremy L Thompson         }
1371352a5e7cSSebastian Grimberg         num_eval_modes_in[index] += q_comp;
1372ed9e99e6SJeremy L Thompson       }
1373ed9e99e6SJeremy L Thompson     }
1374ed9e99e6SJeremy L Thompson   }
1375ed9e99e6SJeremy L Thompson 
1376ed9e99e6SJeremy L Thompson   // Determine active output basis
13772b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields));
13782b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields));
1379437c7c90SJeremy L Thompson   offset = 0;
1380ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_output_fields; i++) {
1381ed9e99e6SJeremy L Thompson     CeedVector vec;
13821c66c397SJeremy L Thompson 
13832b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1384ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
13857c1dbaffSSebastian Grimberg       CeedInt      index = -1, num_comp, q_comp;
13861c66c397SJeremy L Thompson       CeedEvalMode eval_mode;
13871c66c397SJeremy L Thompson       CeedBasis    basis_out = NULL;
13881c66c397SJeremy L Thompson 
1389437c7c90SJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out));
13902b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1391352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumComponents(basis_out, &num_comp));
1392352a5e7cSSebastian Grimberg       CeedCall(CeedBasisGetNumQuadratureComponents(basis_out, eval_mode, &q_comp));
1393506b1a0cSSebastian Grimberg       for (CeedInt i = 0; i < num_active_bases_out; i++) {
1394506b1a0cSSebastian Grimberg         if ((*data)->active_bases_out[i] == basis_out) index = i;
1395437c7c90SJeremy L Thompson       }
1396437c7c90SJeremy L Thompson       if (index == -1) {
1397437c7c90SJeremy L Thompson         CeedElemRestriction elem_rstr_out;
13981c66c397SJeremy L Thompson 
1399506b1a0cSSebastian Grimberg         index = num_active_bases_out;
1400506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->active_bases_out));
1401506b1a0cSSebastian Grimberg         (*data)->active_bases_out[num_active_bases_out] = NULL;
1402506b1a0cSSebastian Grimberg         CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->active_bases_out[num_active_bases_out]));
1403506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->active_elem_rstrs_out));
1404506b1a0cSSebastian Grimberg         (*data)->active_elem_rstrs_out[num_active_bases_out] = NULL;
1405437c7c90SJeremy L Thompson         CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &elem_rstr_out));
1406506b1a0cSSebastian Grimberg         CeedCall(CeedElemRestrictionReferenceCopy(elem_rstr_out, &(*data)->active_elem_rstrs_out[num_active_bases_out]));
1407506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &num_eval_modes_out));
1408437c7c90SJeremy L Thompson         num_eval_modes_out[index] = 0;
1409506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &eval_modes_out));
1410437c7c90SJeremy L Thompson         eval_modes_out[index] = NULL;
1411506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &eval_mode_offsets_out));
1412437c7c90SJeremy L Thompson         eval_mode_offsets_out[index] = NULL;
1413506b1a0cSSebastian Grimberg         CeedCall(CeedRealloc(num_active_bases_out + 1, &(*data)->assembled_bases_out));
1414437c7c90SJeremy L Thompson         (*data)->assembled_bases_out[index] = NULL;
1415506b1a0cSSebastian Grimberg         num_active_bases_out++;
1416437c7c90SJeremy L Thompson       }
1417352a5e7cSSebastian Grimberg       if (eval_mode != CEED_EVAL_WEIGHT) {
1418352a5e7cSSebastian Grimberg         // q_comp = 1 if CEED_EVAL_NONE, CEED_EVAL_WEIGHT caught by QF Assembly
1419352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_modes_out[index]));
1420352a5e7cSSebastian Grimberg         CeedCall(CeedRealloc(num_eval_modes_out[index] + q_comp, &eval_mode_offsets_out[index]));
1421352a5e7cSSebastian Grimberg         for (CeedInt d = 0; d < q_comp; d++) {
1422437c7c90SJeremy L Thompson           eval_modes_out[index][num_eval_modes_out[index] + d]        = eval_mode;
1423437c7c90SJeremy L Thompson           eval_mode_offsets_out[index][num_eval_modes_out[index] + d] = offset;
1424352a5e7cSSebastian Grimberg           offset += num_comp;
1425ed9e99e6SJeremy L Thompson         }
1426352a5e7cSSebastian Grimberg         num_eval_modes_out[index] += q_comp;
1427ed9e99e6SJeremy L Thompson       }
1428ed9e99e6SJeremy L Thompson     }
1429ed9e99e6SJeremy L Thompson   }
1430506b1a0cSSebastian Grimberg   (*data)->num_active_bases_in   = num_active_bases_in;
143127789c4aSJed Brown   (*data)->num_eval_modes_in     = num_eval_modes_in;
143227789c4aSJed Brown   (*data)->eval_modes_in         = eval_modes_in;
143327789c4aSJed Brown   (*data)->eval_mode_offsets_in  = eval_mode_offsets_in;
1434506b1a0cSSebastian Grimberg   (*data)->num_active_bases_out  = num_active_bases_out;
1435437c7c90SJeremy L Thompson   (*data)->num_eval_modes_out    = num_eval_modes_out;
1436437c7c90SJeremy L Thompson   (*data)->eval_modes_out        = eval_modes_out;
1437437c7c90SJeremy L Thompson   (*data)->eval_mode_offsets_out = eval_mode_offsets_out;
1438506b1a0cSSebastian Grimberg   (*data)->num_output_components = offset;
1439ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1440ed9e99e6SJeremy L Thompson }
1441ed9e99e6SJeremy L Thompson 
1442ed9e99e6SJeremy L Thompson /**
1443ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedEvalModes for assembly.
1444ba746a46SJeremy L Thompson 
1445ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1446ed9e99e6SJeremy L Thompson 
1447ed9e99e6SJeremy L Thompson   @param[in]  data                  CeedOperatorAssemblyData
1448506b1a0cSSebastian Grimberg   @param[out] num_active_bases_in   Total number of active bases for input
1449c5d0f995SJed Brown   @param[out] num_eval_modes_in     Pointer to hold array of numbers of input CeedEvalModes, or NULL.
1450ba746a46SJeremy L Thompson                                       `eval_modes_in[0]` holds an array of eval modes for the first active basis.
1451c5d0f995SJed Brown   @param[out] eval_modes_in         Pointer to hold arrays of input CeedEvalModes, or NULL.
1452ba746a46SJeremy L Thompson   @param[out] eval_mode_offsets_in  Pointer to hold arrays of input offsets at each quadrature point.
1453506b1a0cSSebastian Grimberg   @param[out] num_active_bases_out  Total number of active bases for output
1454c5d0f995SJed Brown   @param[out] num_eval_modes_out    Pointer to hold array of numbers of output CeedEvalModes, or NULL
1455c5d0f995SJed Brown   @param[out] eval_modes_out        Pointer to hold arrays of output CeedEvalModes, or NULL.
1456437c7c90SJeremy L Thompson   @param[out] eval_mode_offsets_out Pointer to hold arrays of output offsets at each quadrature point
1457ba746a46SJeremy L Thompson   @param[out] num_output_components The number of columns in the assembled CeedQFunction matrix for each quadrature point,
1458ba746a46SJeremy L Thompson                                       including contributions of all active bases
1459ed9e99e6SJeremy L Thompson 
1460ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1461ed9e99e6SJeremy L Thompson 
1462ed9e99e6SJeremy L Thompson   @ref Backend
1463ed9e99e6SJeremy L Thompson **/
1464506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_active_bases_in, CeedInt **num_eval_modes_in,
1465506b1a0cSSebastian Grimberg                                          const CeedEvalMode ***eval_modes_in, CeedSize ***eval_mode_offsets_in, CeedInt *num_active_bases_out,
1466506b1a0cSSebastian Grimberg                                          CeedInt **num_eval_modes_out, const CeedEvalMode ***eval_modes_out, CeedSize ***eval_mode_offsets_out,
1467506b1a0cSSebastian Grimberg                                          CeedSize *num_output_components) {
1468506b1a0cSSebastian Grimberg   if (num_active_bases_in) *num_active_bases_in = data->num_active_bases_in;
1469437c7c90SJeremy L Thompson   if (num_eval_modes_in) *num_eval_modes_in = data->num_eval_modes_in;
1470437c7c90SJeremy L Thompson   if (eval_modes_in) *eval_modes_in = (const CeedEvalMode **)data->eval_modes_in;
1471437c7c90SJeremy L Thompson   if (eval_mode_offsets_in) *eval_mode_offsets_in = data->eval_mode_offsets_in;
1472506b1a0cSSebastian Grimberg   if (num_active_bases_out) *num_active_bases_out = data->num_active_bases_out;
1473437c7c90SJeremy L Thompson   if (num_eval_modes_out) *num_eval_modes_out = data->num_eval_modes_out;
1474437c7c90SJeremy L Thompson   if (eval_modes_out) *eval_modes_out = (const CeedEvalMode **)data->eval_modes_out;
1475437c7c90SJeremy L Thompson   if (eval_mode_offsets_out) *eval_mode_offsets_out = data->eval_mode_offsets_out;
1476437c7c90SJeremy L Thompson   if (num_output_components) *num_output_components = data->num_output_components;
1477ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1478ed9e99e6SJeremy L Thompson }
1479ed9e99e6SJeremy L Thompson 
1480ed9e99e6SJeremy L Thompson /**
1481ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1482ba746a46SJeremy L Thompson 
1483ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1484ed9e99e6SJeremy L Thompson 
1485ed9e99e6SJeremy L Thompson   @param[in]  data                 CeedOperatorAssemblyData
1486506b1a0cSSebastian Grimberg   @param[out] num_active_bases_in  Number of active input bases, or NULL
1487506b1a0cSSebastian Grimberg   @param[out] active_bases_in      Pointer to hold active input CeedBasis, or NULL
1488437c7c90SJeremy L Thompson   @param[out] assembled_bases_in   Pointer to hold assembled active input B, or NULL
1489506b1a0cSSebastian Grimberg   @param[out] num_active_bases_out Number of active output bases, or NULL
1490506b1a0cSSebastian Grimberg   @param[out] active_bases_out     Pointer to hold active output CeedBasis, or NULL
1491437c7c90SJeremy L Thompson   @param[out] assembled_bases_out  Pointer to hold assembled active output B, or NULL
1492ed9e99e6SJeremy L Thompson 
1493ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1494ed9e99e6SJeremy L Thompson 
1495ed9e99e6SJeremy L Thompson   @ref Backend
1496ed9e99e6SJeremy L Thompson **/
1497506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedInt *num_active_bases_in, CeedBasis **active_bases_in,
1498506b1a0cSSebastian Grimberg                                      const CeedScalar ***assembled_bases_in, CeedInt *num_active_bases_out, CeedBasis **active_bases_out,
1499506b1a0cSSebastian Grimberg                                      const CeedScalar ***assembled_bases_out) {
1500ed9e99e6SJeremy L Thompson   // Assemble B_in, B_out if needed
1501437c7c90SJeremy L Thompson   if (assembled_bases_in && !data->assembled_bases_in[0]) {
1502437c7c90SJeremy L Thompson     CeedInt num_qpts;
1503437c7c90SJeremy L Thompson 
1504506b1a0cSSebastian Grimberg     if (data->active_bases_in[0] == CEED_BASIS_NONE) CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_in[0], &num_qpts));
1505506b1a0cSSebastian Grimberg     else CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases_in[0], &num_qpts));
1506506b1a0cSSebastian Grimberg     for (CeedInt b = 0; b < data->num_active_bases_in; b++) {
15071c66c397SJeremy L Thompson       bool        has_eval_none = false;
1508352a5e7cSSebastian Grimberg       CeedInt     num_nodes;
1509437c7c90SJeremy L Thompson       CeedScalar *B_in = NULL, *identity = NULL;
1510ed9e99e6SJeremy L Thompson 
1511506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_in[b], &num_nodes));
1512352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_in[b], &B_in));
1513ed9e99e6SJeremy L Thompson 
1514437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_in[b]; i++) {
1515437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_in[b][i] == CEED_EVAL_NONE);
1516ed9e99e6SJeremy L Thompson       }
1517ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1518352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1519352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1520352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1521ed9e99e6SJeremy L Thompson         }
1522ed9e99e6SJeremy L Thompson       }
1523ed9e99e6SJeremy L Thompson 
1524ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1525352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1526352a5e7cSSebastian Grimberg           CeedInt      d_in              = 0, q_comp_in;
1527352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_in_prev = CEED_EVAL_NONE;
15281c66c397SJeremy L Thompson 
1529437c7c90SJeremy L Thompson           for (CeedInt e_in = 0; e_in < data->num_eval_modes_in[b]; e_in++) {
1530437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_in[b] * q;
1531437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
15321c66c397SJeremy L Thompson 
1533506b1a0cSSebastian Grimberg             CeedCall(CeedOperatorGetBasisPointer(data->active_bases_in[b], data->eval_modes_in[b][e_in], identity, &B));
1534506b1a0cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases_in[b], data->eval_modes_in[b][e_in], &q_comp_in));
1535352a5e7cSSebastian Grimberg             if (q_comp_in > 1) {
1536352a5e7cSSebastian Grimberg               if (e_in == 0 || data->eval_modes_in[b][e_in] != eval_mode_in_prev) d_in = 0;
1537352a5e7cSSebastian Grimberg               else B = &B[(++d_in) * num_qpts * num_nodes];
1538352a5e7cSSebastian Grimberg             }
1539352a5e7cSSebastian Grimberg             eval_mode_in_prev                 = data->eval_modes_in[b][e_in];
1540352a5e7cSSebastian Grimberg             B_in[(qq + e_in) * num_nodes + n] = B[q * num_nodes + n];
1541ed9e99e6SJeremy L Thompson           }
1542ed9e99e6SJeremy L Thompson         }
1543ed9e99e6SJeremy L Thompson       }
15447c1dbaffSSebastian Grimberg       if (identity) CeedCall(CeedFree(&identity));
1545437c7c90SJeremy L Thompson       data->assembled_bases_in[b] = B_in;
1546437c7c90SJeremy L Thompson     }
1547ed9e99e6SJeremy L Thompson   }
1548ed9e99e6SJeremy L Thompson 
1549437c7c90SJeremy L Thompson   if (assembled_bases_out && !data->assembled_bases_out[0]) {
1550437c7c90SJeremy L Thompson     CeedInt num_qpts;
1551437c7c90SJeremy L Thompson 
1552506b1a0cSSebastian Grimberg     if (data->active_bases_out[0] == CEED_BASIS_NONE) CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_out[0], &num_qpts));
1553506b1a0cSSebastian Grimberg     else CeedCall(CeedBasisGetNumQuadraturePoints(data->active_bases_out[0], &num_qpts));
1554506b1a0cSSebastian Grimberg     for (CeedInt b = 0; b < data->num_active_bases_out; b++) {
1555ed9e99e6SJeremy L Thompson       bool        has_eval_none = false;
15561c66c397SJeremy L Thompson       CeedInt     num_nodes;
1557437c7c90SJeremy L Thompson       CeedScalar *B_out = NULL, *identity = NULL;
1558ed9e99e6SJeremy L Thompson 
1559506b1a0cSSebastian Grimberg       CeedCall(CeedElemRestrictionGetElementSize(data->active_elem_rstrs_out[b], &num_nodes));
1560352a5e7cSSebastian Grimberg       CeedCall(CeedCalloc(num_qpts * num_nodes * data->num_eval_modes_out[b], &B_out));
1561ed9e99e6SJeremy L Thompson 
1562437c7c90SJeremy L Thompson       for (CeedInt i = 0; i < data->num_eval_modes_out[b]; i++) {
1563437c7c90SJeremy L Thompson         has_eval_none = has_eval_none || (data->eval_modes_out[b][i] == CEED_EVAL_NONE);
1564ed9e99e6SJeremy L Thompson       }
1565ed9e99e6SJeremy L Thompson       if (has_eval_none) {
1566352a5e7cSSebastian Grimberg         CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
1567352a5e7cSSebastian Grimberg         for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) {
1568352a5e7cSSebastian Grimberg           identity[i * num_nodes + i] = 1.0;
1569ed9e99e6SJeremy L Thompson         }
1570ed9e99e6SJeremy L Thompson       }
1571ed9e99e6SJeremy L Thompson 
1572ed9e99e6SJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
1573352a5e7cSSebastian Grimberg         for (CeedInt n = 0; n < num_nodes; n++) {
1574352a5e7cSSebastian Grimberg           CeedInt      d_out              = 0, q_comp_out;
1575352a5e7cSSebastian Grimberg           CeedEvalMode eval_mode_out_prev = CEED_EVAL_NONE;
15761c66c397SJeremy L Thompson 
1577437c7c90SJeremy L Thompson           for (CeedInt e_out = 0; e_out < data->num_eval_modes_out[b]; e_out++) {
1578437c7c90SJeremy L Thompson             const CeedInt     qq = data->num_eval_modes_out[b] * q;
1579437c7c90SJeremy L Thompson             const CeedScalar *B  = NULL;
15801c66c397SJeremy L Thompson 
1581506b1a0cSSebastian Grimberg             CeedCall(CeedOperatorGetBasisPointer(data->active_bases_out[b], data->eval_modes_out[b][e_out], identity, &B));
1582506b1a0cSSebastian Grimberg             CeedCall(CeedBasisGetNumQuadratureComponents(data->active_bases_out[b], data->eval_modes_out[b][e_out], &q_comp_out));
1583352a5e7cSSebastian Grimberg             if (q_comp_out > 1) {
1584352a5e7cSSebastian Grimberg               if (e_out == 0 || data->eval_modes_out[b][e_out] != eval_mode_out_prev) d_out = 0;
1585352a5e7cSSebastian Grimberg               else B = &B[(++d_out) * num_qpts * num_nodes];
1586352a5e7cSSebastian Grimberg             }
1587352a5e7cSSebastian Grimberg             eval_mode_out_prev                  = data->eval_modes_out[b][e_out];
1588352a5e7cSSebastian Grimberg             B_out[(qq + e_out) * num_nodes + n] = B[q * num_nodes + n];
1589ed9e99e6SJeremy L Thompson           }
1590ed9e99e6SJeremy L Thompson         }
1591ed9e99e6SJeremy L Thompson       }
15927c1dbaffSSebastian Grimberg       if (identity) CeedCall(CeedFree(&identity));
1593437c7c90SJeremy L Thompson       data->assembled_bases_out[b] = B_out;
1594437c7c90SJeremy L Thompson     }
1595ed9e99e6SJeremy L Thompson   }
1596ed9e99e6SJeremy L Thompson 
1597437c7c90SJeremy L Thompson   // Pass out assembled data
1598506b1a0cSSebastian Grimberg   if (num_active_bases_in) *num_active_bases_in = data->num_active_bases_in;
1599506b1a0cSSebastian Grimberg   if (active_bases_in) *active_bases_in = data->active_bases_in;
1600437c7c90SJeremy L Thompson   if (assembled_bases_in) *assembled_bases_in = (const CeedScalar **)data->assembled_bases_in;
1601506b1a0cSSebastian Grimberg   if (num_active_bases_out) *num_active_bases_out = data->num_active_bases_out;
1602506b1a0cSSebastian Grimberg   if (active_bases_out) *active_bases_out = data->active_bases_out;
1603437c7c90SJeremy L Thompson   if (assembled_bases_out) *assembled_bases_out = (const CeedScalar **)data->assembled_bases_out;
1604437c7c90SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1605437c7c90SJeremy L Thompson }
1606437c7c90SJeremy L Thompson 
1607437c7c90SJeremy L Thompson /**
1608ba746a46SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly.
1609ba746a46SJeremy L Thompson 
1610ba746a46SJeremy L Thompson   Note: See CeedOperatorAssemblyDataCreate for a full description of the data stored in this object.
1611437c7c90SJeremy L Thompson 
1612437c7c90SJeremy L Thompson   @param[in]  data                      CeedOperatorAssemblyData
1613506b1a0cSSebastian Grimberg   @param[out] num_active_elem_rstrs_in  Number of active input element restrictions, or NULL
1614506b1a0cSSebastian Grimberg   @param[out] active_elem_rstrs_in      Pointer to hold active input CeedElemRestrictions, or NULL
1615506b1a0cSSebastian Grimberg   @param[out] num_active_elem_rstrs_out Number of active output element restrictions, or NULL
1616506b1a0cSSebastian Grimberg   @param[out] active_elem_rstrs_out     Pointer to hold active output CeedElemRestrictions, or NULL
1617437c7c90SJeremy L Thompson 
1618437c7c90SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1619437c7c90SJeremy L Thompson 
1620437c7c90SJeremy L Thompson   @ref Backend
1621437c7c90SJeremy L Thompson **/
1622506b1a0cSSebastian Grimberg int CeedOperatorAssemblyDataGetElemRestrictions(CeedOperatorAssemblyData data, CeedInt *num_active_elem_rstrs_in,
1623506b1a0cSSebastian Grimberg                                                 CeedElemRestriction **active_elem_rstrs_in, CeedInt *num_active_elem_rstrs_out,
1624506b1a0cSSebastian Grimberg                                                 CeedElemRestriction **active_elem_rstrs_out) {
1625506b1a0cSSebastian Grimberg   if (num_active_elem_rstrs_in) *num_active_elem_rstrs_in = data->num_active_bases_in;
1626506b1a0cSSebastian Grimberg   if (active_elem_rstrs_in) *active_elem_rstrs_in = data->active_elem_rstrs_in;
1627506b1a0cSSebastian Grimberg   if (num_active_elem_rstrs_out) *num_active_elem_rstrs_out = data->num_active_bases_out;
1628506b1a0cSSebastian Grimberg   if (active_elem_rstrs_out) *active_elem_rstrs_out = data->active_elem_rstrs_out;
1629ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1630ed9e99e6SJeremy L Thompson }
1631ed9e99e6SJeremy L Thompson 
1632ed9e99e6SJeremy L Thompson /**
1633ed9e99e6SJeremy L Thompson   @brief Destroy CeedOperatorAssemblyData
1634ed9e99e6SJeremy L Thompson 
1635ea61e9acSJeremy L Thompson   @param[in,out] data CeedOperatorAssemblyData to destroy
1636ed9e99e6SJeremy L Thompson 
1637ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1638ed9e99e6SJeremy L Thompson 
1639ed9e99e6SJeremy L Thompson   @ref Backend
1640ed9e99e6SJeremy L Thompson **/
1641ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) {
1642ad6481ceSJeremy L Thompson   if (!*data) {
1643ad6481ceSJeremy L Thompson     *data = NULL;
1644ad6481ceSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1645ad6481ceSJeremy L Thompson   }
16462b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
1647506b1a0cSSebastian Grimberg   for (CeedInt b = 0; b < (*data)->num_active_bases_in; b++) {
1648506b1a0cSSebastian Grimberg     CeedCall(CeedBasisDestroy(&(*data)->active_bases_in[b]));
1649506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs_in[b]));
1650437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_modes_in[b]));
1651437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->eval_mode_offsets_in[b]));
1652437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_in[b]));
1653506b1a0cSSebastian Grimberg   }
1654506b1a0cSSebastian Grimberg   for (CeedInt b = 0; b < (*data)->num_active_bases_out; b++) {
1655506b1a0cSSebastian Grimberg     CeedCall(CeedBasisDestroy(&(*data)->active_bases_out[b]));
1656506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&(*data)->active_elem_rstrs_out[b]));
1657506b1a0cSSebastian Grimberg     CeedCall(CeedFree(&(*data)->eval_modes_out[b]));
1658506b1a0cSSebastian Grimberg     CeedCall(CeedFree(&(*data)->eval_mode_offsets_out[b]));
1659437c7c90SJeremy L Thompson     CeedCall(CeedFree(&(*data)->assembled_bases_out[b]));
1660437c7c90SJeremy L Thompson   }
1661506b1a0cSSebastian Grimberg   CeedCall(CeedFree(&(*data)->active_bases_in));
1662506b1a0cSSebastian Grimberg   CeedCall(CeedFree(&(*data)->active_bases_out));
1663506b1a0cSSebastian Grimberg   CeedCall(CeedFree(&(*data)->active_elem_rstrs_in));
1664506b1a0cSSebastian Grimberg   CeedCall(CeedFree(&(*data)->active_elem_rstrs_out));
1665437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_in));
1666437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->num_eval_modes_out));
1667437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_in));
1668437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_modes_out));
1669437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_in));
1670437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_offsets_out));
1671437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_in));
1672437c7c90SJeremy L Thompson   CeedCall(CeedFree(&(*data)->assembled_bases_out));
1673ed9e99e6SJeremy L Thompson 
16742b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1675ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1676ed9e99e6SJeremy L Thompson }
1677ed9e99e6SJeremy L Thompson 
1678480fae85SJeremy L Thompson /// @}
1679480fae85SJeremy L Thompson 
1680480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1681eaf62fffSJeremy L Thompson /// CeedOperator Public API
1682eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1683eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser
1684eaf62fffSJeremy L Thompson /// @{
1685eaf62fffSJeremy L Thompson 
1686eaf62fffSJeremy L Thompson /**
1687eaf62fffSJeremy L Thompson   @brief Assemble a linear CeedQFunction associated with a CeedOperator
1688eaf62fffSJeremy L Thompson 
1689ea61e9acSJeremy L Thompson   This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator.
1690859c15bbSJames Wright   The vector `assembled` is of shape `[num_elements, num_input_fields, num_output_fields, num_quad_points]` and contains column-major matrices
1691859c15bbSJames Wright representing the action of the CeedQFunction for a corresponding quadrature point on an element.
1692859c15bbSJames Wright 
16939fd66db6SSebastian Grimberg   Inputs and outputs are in the order provided by the user when adding CeedOperator fields.
16949fd66db6SSebastian Grimberg   For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order, would result in an assembled QFunction
16959fd66db6SSebastian Grimberg that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1] and producing the output [dv_0, dv_1, v].
1696eaf62fffSJeremy L Thompson 
1697ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1698f04ea552SJeremy L Thompson 
1699ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1700ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1701ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
1702ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1703eaf62fffSJeremy L Thompson 
1704eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1705eaf62fffSJeremy L Thompson 
1706eaf62fffSJeremy L Thompson   @ref User
1707eaf62fffSJeremy L Thompson **/
17082b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
17092b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1710eaf62fffSJeremy L Thompson 
1711eaf62fffSJeremy L Thompson   if (op->LinearAssembleQFunction) {
1712d04bbc78SJeremy L Thompson     // Backend version
17132b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request));
1714eaf62fffSJeremy L Thompson   } else {
1715d04bbc78SJeremy L Thompson     // Operator fallback
1716d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1717d04bbc78SJeremy L Thompson 
17182b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
17196574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request));
17206574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction");
172170a7ffb3SJeremy L Thompson   }
1722eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1723eaf62fffSJeremy L Thompson }
172470a7ffb3SJeremy L Thompson 
172570a7ffb3SJeremy L Thompson /**
1726ea61e9acSJeremy L Thompson   @brief Assemble CeedQFunction and store result internally.
17274385fb7fSSebastian Grimberg 
1728ea61e9acSJeremy L Thompson   Return copied references of stored data to the caller.
1729ea61e9acSJeremy L Thompson   Caller is responsible for ownership and destruction of the copied references.
1730ea61e9acSJeremy L Thompson   See also @ref CeedOperatorLinearAssembleQFunction
173170a7ffb3SJeremy L Thompson 
1732c5f45aeaSJeremy L Thompson   Note: If the value of `assembled` or `rstr` passed to this function are non-NULL, then it is assumed that they hold valid pointers.
1733c5f45aeaSJeremy L Thompson         These objects will be destroyed if `*assembled` or `*rstr` is the only reference to the object.
1734c5f45aeaSJeremy L Thompson 
1735ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1736ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1737ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembledCeedQFunction
1738ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
173970a7ffb3SJeremy L Thompson 
174070a7ffb3SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
174170a7ffb3SJeremy L Thompson 
174270a7ffb3SJeremy L Thompson   @ref User
174370a7ffb3SJeremy L Thompson **/
17442b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
1745b05f7e9fSJeremy L Thompson   int (*LinearAssembleQFunctionUpdate)(CeedOperator, CeedVector, CeedElemRestriction, CeedRequest *) = NULL;
1746b05f7e9fSJeremy L Thompson   CeedOperator op_assemble                                                                           = NULL;
1747bb229da9SJeremy L Thompson   CeedOperator op_fallback_parent                                                                    = NULL;
1748b05f7e9fSJeremy L Thompson 
17492b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
175070a7ffb3SJeremy L Thompson 
1751b05f7e9fSJeremy L Thompson   // Determine if fallback parent or operator has implementation
1752bb229da9SJeremy L Thompson   CeedCall(CeedOperatorGetFallbackParent(op, &op_fallback_parent));
1753bb229da9SJeremy L Thompson   if (op_fallback_parent && op_fallback_parent->LinearAssembleQFunctionUpdate) {
1754b05f7e9fSJeremy L Thompson     // -- Backend version for op fallback parent is faster, if it exists
1755bb229da9SJeremy L Thompson     LinearAssembleQFunctionUpdate = op_fallback_parent->LinearAssembleQFunctionUpdate;
1756bb229da9SJeremy L Thompson     op_assemble                   = op_fallback_parent;
1757b05f7e9fSJeremy L Thompson   } else if (op->LinearAssembleQFunctionUpdate) {
1758b05f7e9fSJeremy L Thompson     // -- Backend version for op
1759b05f7e9fSJeremy L Thompson     LinearAssembleQFunctionUpdate = op->LinearAssembleQFunctionUpdate;
1760b05f7e9fSJeremy L Thompson     op_assemble                   = op;
1761b05f7e9fSJeremy L Thompson   }
1762b05f7e9fSJeremy L Thompson 
1763b05f7e9fSJeremy L Thompson   // Assemble QFunction
1764b05f7e9fSJeremy L Thompson   if (LinearAssembleQFunctionUpdate) {
1765b05f7e9fSJeremy L Thompson     // Backend or fallback parent version
1766480fae85SJeremy L Thompson     bool                qf_assembled_is_setup;
17672efa2d85SJeremy L Thompson     CeedVector          assembled_vec  = NULL;
17682efa2d85SJeremy L Thompson     CeedElemRestriction assembled_rstr = NULL;
1769480fae85SJeremy L Thompson 
17702b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup));
1771480fae85SJeremy L Thompson     if (qf_assembled_is_setup) {
1772d04bbc78SJeremy L Thompson       bool update_needed;
1773d04bbc78SJeremy L Thompson 
17742b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr));
17752b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed));
1776b05f7e9fSJeremy L Thompson       if (update_needed) CeedCall(LinearAssembleQFunctionUpdate(op_assemble, assembled_vec, assembled_rstr, request));
177770a7ffb3SJeremy L Thompson     } else {
1778b05f7e9fSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunction(op_assemble, &assembled_vec, &assembled_rstr, request));
17792b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr));
178070a7ffb3SJeremy L Thompson     }
17812b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false));
17822efa2d85SJeremy L Thompson 
1783d04bbc78SJeremy L Thompson     // Copy reference from internally held copy
17842b730f8bSJeremy L Thompson     CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled));
17852b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr));
1786c5f45aeaSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled_vec));
17872b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&assembled_rstr));
178870a7ffb3SJeremy L Thompson   } else {
1789d04bbc78SJeremy L Thompson     // Operator fallback
1790d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1791d04bbc78SJeremy L Thompson 
17922b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
17936574a04fSJeremy L Thompson     if (op_fallback) CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request));
17946574a04fSJeremy L Thompson     else return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate");
179570a7ffb3SJeremy L Thompson   }
179670a7ffb3SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1797eaf62fffSJeremy L Thompson }
1798eaf62fffSJeremy L Thompson 
1799eaf62fffSJeremy L Thompson /**
1800eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1801eaf62fffSJeremy L Thompson 
1802eaf62fffSJeremy L Thompson   This overwrites a CeedVector with the diagonal of a linear CeedOperator.
1803eaf62fffSJeremy L Thompson 
1804ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1805eaf62fffSJeremy L Thompson 
1806ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1807f04ea552SJeremy L Thompson 
1808ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1809eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1810ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1811eaf62fffSJeremy L Thompson 
1812eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1813eaf62fffSJeremy L Thompson 
1814eaf62fffSJeremy L Thompson   @ref User
1815eaf62fffSJeremy L Thompson **/
18162b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1817f3d47e36SJeremy L Thompson   bool     is_composite;
18181c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
18191c66c397SJeremy L Thompson 
18202b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1821f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1822eaf62fffSJeremy L Thompson 
18232b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
18246574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1825c9366a6bSJeremy L Thompson 
1826f3d47e36SJeremy L Thompson   // Early exit for empty operator
1827f3d47e36SJeremy L Thompson   if (!is_composite) {
1828f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1829f3d47e36SJeremy L Thompson 
1830f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1831f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1832f3d47e36SJeremy L Thompson   }
1833f3d47e36SJeremy L Thompson 
1834eaf62fffSJeremy L Thompson   if (op->LinearAssembleDiagonal) {
1835d04bbc78SJeremy L Thompson     // Backend version
18362b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleDiagonal(op, assembled, request));
1837eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1838eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddDiagonal) {
1839d04bbc78SJeremy L Thompson     // Backend version with zeroing first
18402b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
18412b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1842eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1843eaf62fffSJeremy L Thompson   } else {
1844d04bbc78SJeremy L Thompson     // Operator fallback
1845d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1846d04bbc78SJeremy L Thompson 
18472b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1848d04bbc78SJeremy L Thompson     if (op_fallback) {
18492b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request));
1850eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1851eaf62fffSJeremy L Thompson     }
1852eaf62fffSJeremy L Thompson   }
1853eaf62fffSJeremy L Thompson   // Default interface implementation
18542b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
18552b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request));
1856eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1857eaf62fffSJeremy L Thompson }
1858eaf62fffSJeremy L Thompson 
1859eaf62fffSJeremy L Thompson /**
1860eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1861eaf62fffSJeremy L Thompson 
1862eaf62fffSJeremy L Thompson   This sums into a CeedVector the diagonal of a linear CeedOperator.
1863eaf62fffSJeremy L Thompson 
1864ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1865eaf62fffSJeremy L Thompson 
1866ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1867f04ea552SJeremy L Thompson 
1868ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1869eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1870ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1871eaf62fffSJeremy L Thompson 
1872eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1873eaf62fffSJeremy L Thompson 
1874eaf62fffSJeremy L Thompson   @ref User
1875eaf62fffSJeremy L Thompson **/
18762b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1877f3d47e36SJeremy L Thompson   bool     is_composite;
18781c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
18791c66c397SJeremy L Thompson 
18802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1881f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1882eaf62fffSJeremy L Thompson 
18832b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
18846574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1885c9366a6bSJeremy L Thompson 
1886f3d47e36SJeremy L Thompson   // Early exit for empty operator
1887f3d47e36SJeremy L Thompson   if (!is_composite) {
1888f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1889f3d47e36SJeremy L Thompson 
1890f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1891f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1892f3d47e36SJeremy L Thompson   }
1893f3d47e36SJeremy L Thompson 
1894eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddDiagonal) {
1895d04bbc78SJeremy L Thompson     // Backend version
18962b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1897eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1898eaf62fffSJeremy L Thompson   } else {
1899d04bbc78SJeremy L Thompson     // Operator fallback
1900d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1901d04bbc78SJeremy L Thompson 
19022b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1903d04bbc78SJeremy L Thompson     if (op_fallback) {
19042b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request));
1905eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1906eaf62fffSJeremy L Thompson     }
1907eaf62fffSJeremy L Thompson   }
1908eaf62fffSJeremy L Thompson   // Default interface implementation
1909eaf62fffSJeremy L Thompson   if (is_composite) {
19102b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled));
1911eaf62fffSJeremy L Thompson   } else {
19122b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled));
1913eaf62fffSJeremy L Thompson   }
1914d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1915eaf62fffSJeremy L Thompson }
1916eaf62fffSJeremy L Thompson 
1917eaf62fffSJeremy L Thompson /**
191801f0e615SJames Wright    @brief Fully assemble the point-block diagonal pattern of a linear operator.
191901f0e615SJames Wright 
192001f0e615SJames Wright    Expected to be used in conjunction with CeedOperatorLinearAssemblePointBlockDiagonal().
192101f0e615SJames Wright 
192201f0e615SJames Wright    The assembly routines use coordinate format, with `num_entries` tuples of the form (i, j, value) which indicate that value should be added to the
192301f0e615SJames Wright matrix in entry (i, j).
192401f0e615SJames Wright   Note that the (i, j) pairs are unique.
192501f0e615SJames Wright   This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemblePointBlockDiagonal() provides the values in
192601f0e615SJames Wright the same ordering.
192701f0e615SJames Wright 
192801f0e615SJames Wright    This will generally be slow unless your operator is low-order.
192901f0e615SJames Wright 
193001f0e615SJames Wright    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
193101f0e615SJames Wright 
193201f0e615SJames Wright    @param[in]  op          CeedOperator to assemble
193301f0e615SJames Wright    @param[out] num_entries Number of entries in coordinate nonzero pattern
193401f0e615SJames Wright    @param[out] rows        Row number for each entry
193501f0e615SJames Wright    @param[out] cols        Column number for each entry
193601f0e615SJames Wright 
193701f0e615SJames Wright    @ref User
193801f0e615SJames Wright **/
193901f0e615SJames Wright int CeedOperatorLinearAssemblePointBlockDiagonalSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
194001f0e615SJames Wright   Ceed          ceed;
194101f0e615SJames Wright   bool          is_composite;
194201f0e615SJames Wright   CeedInt       num_active_components, num_sub_operators;
194301f0e615SJames Wright   CeedOperator *sub_operators;
194401f0e615SJames Wright 
194501f0e615SJames Wright   CeedCall(CeedOperatorGetCeed(op, &ceed));
194601f0e615SJames Wright   CeedCall(CeedOperatorIsComposite(op, &is_composite));
194701f0e615SJames Wright 
194801f0e615SJames Wright   CeedSize input_size = 0, output_size = 0;
194901f0e615SJames Wright   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
195001f0e615SJames Wright   CeedCheck(input_size == output_size, ceed, CEED_ERROR_DIMENSION, "Operator must be square");
195101f0e615SJames Wright 
195201f0e615SJames Wright   if (is_composite) {
195301f0e615SJames Wright     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub_operators));
195401f0e615SJames Wright     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
195501f0e615SJames Wright   } else {
195601f0e615SJames Wright     sub_operators     = &op;
195701f0e615SJames Wright     num_sub_operators = 1;
195801f0e615SJames Wright   }
195901f0e615SJames Wright 
1960506b1a0cSSebastian Grimberg   // Verify operator can be assembled correctly
1961506b1a0cSSebastian Grimberg   {
196201f0e615SJames Wright     CeedOperatorAssemblyData data;
1963506b1a0cSSebastian Grimberg     CeedInt                  num_active_elem_rstrs, comp_stride;
196401f0e615SJames Wright     CeedElemRestriction     *active_elem_rstrs;
196501f0e615SJames Wright 
196601f0e615SJames Wright     // Get initial values to check against
196701f0e615SJames Wright     CeedCall(CeedOperatorGetOperatorAssemblyData(sub_operators[0], &data));
1968506b1a0cSSebastian Grimberg     CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, &num_active_elem_rstrs, &active_elem_rstrs, NULL, NULL));
196901f0e615SJames Wright     CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstrs[0], &comp_stride));
197001f0e615SJames Wright     CeedCall(CeedElemRestrictionGetNumComponents(active_elem_rstrs[0], &num_active_components));
197101f0e615SJames Wright 
1972506b1a0cSSebastian Grimberg     // Verify that all active element restrictions have same component stride and number of components
197301f0e615SJames Wright     for (CeedInt k = 0; k < num_sub_operators; k++) {
197401f0e615SJames Wright       CeedCall(CeedOperatorGetOperatorAssemblyData(sub_operators[k], &data));
1975506b1a0cSSebastian Grimberg       CeedCall(CeedOperatorAssemblyDataGetElemRestrictions(data, &num_active_elem_rstrs, &active_elem_rstrs, NULL, NULL));
197601f0e615SJames Wright       for (CeedInt i = 0; i < num_active_elem_rstrs; i++) {
1977506b1a0cSSebastian Grimberg         CeedInt comp_stride_sub, num_active_components_sub;
1978506b1a0cSSebastian Grimberg 
197901f0e615SJames Wright         CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstrs[i], &comp_stride_sub));
198001f0e615SJames Wright         CeedCheck(comp_stride == comp_stride_sub, ceed, CEED_ERROR_DIMENSION,
198101f0e615SJames Wright                   "Active element restrictions must have the same component stride: %d vs %d", comp_stride, comp_stride_sub);
198201f0e615SJames Wright         CeedCall(CeedElemRestrictionGetNumComponents(active_elem_rstrs[i], &num_active_components_sub));
198301f0e615SJames Wright         CeedCheck(num_active_components == num_active_components_sub, ceed, CEED_ERROR_INCOMPATIBLE,
198401f0e615SJames Wright                   "All suboperators must have the same number of output components");
198501f0e615SJames Wright       }
198601f0e615SJames Wright     }
198701f0e615SJames Wright   }
198801f0e615SJames Wright   *num_entries = input_size * num_active_components;
198901f0e615SJames Wright   CeedCall(CeedCalloc(*num_entries, rows));
199001f0e615SJames Wright   CeedCall(CeedCalloc(*num_entries, cols));
199101f0e615SJames Wright 
199201f0e615SJames Wright   for (CeedInt o = 0; o < num_sub_operators; o++) {
1993506b1a0cSSebastian Grimberg     CeedElemRestriction active_elem_rstr, point_block_active_elem_rstr;
199401f0e615SJames Wright     CeedInt             comp_stride, num_elem, elem_size;
1995506b1a0cSSebastian Grimberg     const CeedInt      *offsets, *point_block_offsets;
199601f0e615SJames Wright 
199701f0e615SJames Wright     CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[o], &active_elem_rstr));
199801f0e615SJames Wright     CeedCall(CeedElemRestrictionGetCompStride(active_elem_rstr, &comp_stride));
199901f0e615SJames Wright     CeedCall(CeedElemRestrictionGetNumElements(active_elem_rstr, &num_elem));
200001f0e615SJames Wright     CeedCall(CeedElemRestrictionGetElementSize(active_elem_rstr, &elem_size));
200101f0e615SJames Wright     CeedCall(CeedElemRestrictionGetOffsets(active_elem_rstr, CEED_MEM_HOST, &offsets));
200201f0e615SJames Wright 
2003506b1a0cSSebastian Grimberg     CeedCall(CeedOperatorCreateActivePointBlockRestriction(active_elem_rstr, &point_block_active_elem_rstr));
2004506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionGetOffsets(point_block_active_elem_rstr, CEED_MEM_HOST, &point_block_offsets));
200501f0e615SJames Wright 
200601f0e615SJames Wright     for (CeedSize i = 0; i < num_elem * elem_size; i++) {
200701f0e615SJames Wright       for (CeedInt c_out = 0; c_out < num_active_components; c_out++) {
200801f0e615SJames Wright         for (CeedInt c_in = 0; c_in < num_active_components; c_in++) {
2009506b1a0cSSebastian Grimberg           (*rows)[point_block_offsets[i] + c_out * num_active_components + c_in] = offsets[i] + c_out * comp_stride;
2010506b1a0cSSebastian Grimberg           (*cols)[point_block_offsets[i] + c_out * num_active_components + c_in] = offsets[i] + c_in * comp_stride;
201101f0e615SJames Wright         }
201201f0e615SJames Wright       }
201301f0e615SJames Wright     }
201401f0e615SJames Wright 
201501f0e615SJames Wright     CeedCall(CeedElemRestrictionRestoreOffsets(active_elem_rstr, &offsets));
2016506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionRestoreOffsets(point_block_active_elem_rstr, &point_block_offsets));
2017506b1a0cSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&point_block_active_elem_rstr));
201801f0e615SJames Wright   }
201901f0e615SJames Wright   return CEED_ERROR_SUCCESS;
202001f0e615SJames Wright }
202101f0e615SJames Wright 
202201f0e615SJames Wright /**
2023eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
2024eaf62fffSJeremy L Thompson 
2025ea61e9acSJeremy L Thompson   This overwrites a CeedVector with the point block diagonal of a linear CeedOperator.
2026eaf62fffSJeremy L Thompson 
2027ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
2028eaf62fffSJeremy L Thompson 
2029ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2030f04ea552SJeremy L Thompson 
2031ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
2032ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
2033ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
2034ea61e9acSJeremy L Thompson component in].
2035ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2036eaf62fffSJeremy L Thompson 
2037eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2038eaf62fffSJeremy L Thompson 
2039eaf62fffSJeremy L Thompson   @ref User
2040eaf62fffSJeremy L Thompson **/
20412b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
2042f3d47e36SJeremy L Thompson   bool     is_composite;
20431c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
20441c66c397SJeremy L Thompson 
20452b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2046f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
2047eaf62fffSJeremy L Thompson 
20482b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
20496574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
2050c9366a6bSJeremy L Thompson 
2051f3d47e36SJeremy L Thompson   // Early exit for empty operator
2052f3d47e36SJeremy L Thompson   if (!is_composite) {
2053f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
2054f3d47e36SJeremy L Thompson 
2055f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
2056f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
2057f3d47e36SJeremy L Thompson   }
2058f3d47e36SJeremy L Thompson 
2059eaf62fffSJeremy L Thompson   if (op->LinearAssemblePointBlockDiagonal) {
2060d04bbc78SJeremy L Thompson     // Backend version
20612b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request));
2062eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2063eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddPointBlockDiagonal) {
2064d04bbc78SJeremy L Thompson     // Backend version with zeroing first
20652b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
20662b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
2067eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2068eaf62fffSJeremy L Thompson   } else {
2069d04bbc78SJeremy L Thompson     // Operator fallback
2070d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2071d04bbc78SJeremy L Thompson 
20722b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2073d04bbc78SJeremy L Thompson     if (op_fallback) {
20742b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request));
2075eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2076eaf62fffSJeremy L Thompson     }
2077eaf62fffSJeremy L Thompson   }
2078eaf62fffSJeremy L Thompson   // Default interface implementation
20792b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
20802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
2081eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2082eaf62fffSJeremy L Thompson }
2083eaf62fffSJeremy L Thompson 
2084eaf62fffSJeremy L Thompson /**
2085eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
2086eaf62fffSJeremy L Thompson 
2087ea61e9acSJeremy L Thompson   This sums into a CeedVector with the point block diagonal of a linear CeedOperator.
2088eaf62fffSJeremy L Thompson 
2089ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
2090eaf62fffSJeremy L Thompson 
2091ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2092f04ea552SJeremy L Thompson 
2093ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
2094ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
2095ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
2096ea61e9acSJeremy L Thompson component in].
2097ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2098eaf62fffSJeremy L Thompson 
2099eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2100eaf62fffSJeremy L Thompson 
2101eaf62fffSJeremy L Thompson   @ref User
2102eaf62fffSJeremy L Thompson **/
21032b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
2104f3d47e36SJeremy L Thompson   bool     is_composite;
21051c66c397SJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
21061c66c397SJeremy L Thompson 
21072b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2108f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
2109eaf62fffSJeremy L Thompson 
21102b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
21116574a04fSJeremy L Thompson   CeedCheck(input_size == output_size, op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
2112c9366a6bSJeremy L Thompson 
2113f3d47e36SJeremy L Thompson   // Early exit for empty operator
2114f3d47e36SJeremy L Thompson   if (!is_composite) {
2115f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
2116f3d47e36SJeremy L Thompson 
2117f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
2118f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
2119f3d47e36SJeremy L Thompson   }
2120f3d47e36SJeremy L Thompson 
2121eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddPointBlockDiagonal) {
2122d04bbc78SJeremy L Thompson     // Backend version
21232b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request));
2124eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2125eaf62fffSJeremy L Thompson   } else {
2126d04bbc78SJeremy L Thompson     // Operator fallback
2127d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2128d04bbc78SJeremy L Thompson 
21292b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2130d04bbc78SJeremy L Thompson     if (op_fallback) {
21312b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request));
2132eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2133eaf62fffSJeremy L Thompson     }
2134eaf62fffSJeremy L Thompson   }
2135ea61e9acSJeremy L Thompson   // Default interface implementation
2136eaf62fffSJeremy L Thompson   if (is_composite) {
21372b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled));
2138eaf62fffSJeremy L Thompson   } else {
21392b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled));
2140eaf62fffSJeremy L Thompson   }
2141d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
2142eaf62fffSJeremy L Thompson }
2143eaf62fffSJeremy L Thompson 
2144eaf62fffSJeremy L Thompson /**
2145eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero pattern of a linear operator.
2146eaf62fffSJeremy L Thompson 
2147ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssemble().
2148eaf62fffSJeremy L Thompson 
2149ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
21509fd66db6SSebastian Grimberg matrix in entry (i, j).
21519fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
21529fd66db6SSebastian Grimberg   This function returns the number of entries and their (i, j) locations, while CeedOperatorLinearAssemble() provides the values in the same ordering.
2153eaf62fffSJeremy L Thompson 
2154eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
2155eaf62fffSJeremy L Thompson 
2156ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2157f04ea552SJeremy L Thompson 
2158eaf62fffSJeremy L Thompson    @param[in]  op          CeedOperator to assemble
2159eaf62fffSJeremy L Thompson    @param[out] num_entries Number of entries in coordinate nonzero pattern
2160eaf62fffSJeremy L Thompson    @param[out] rows        Row number for each entry
2161eaf62fffSJeremy L Thompson    @param[out] cols        Column number for each entry
2162eaf62fffSJeremy L Thompson 
2163eaf62fffSJeremy L Thompson    @ref User
2164eaf62fffSJeremy L Thompson **/
21652b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
21661c66c397SJeremy L Thompson   bool          is_composite;
21671c66c397SJeremy L Thompson   CeedInt       num_suboperators, offset = 0;
2168b94338b9SJed Brown   CeedSize      single_entries;
2169eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
21701c66c397SJeremy L Thompson 
21712b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2172f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
2173eaf62fffSJeremy L Thompson 
2174eaf62fffSJeremy L Thompson   if (op->LinearAssembleSymbolic) {
2175d04bbc78SJeremy L Thompson     // Backend version
21762b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols));
2177eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2178eaf62fffSJeremy L Thompson   } else {
2179d04bbc78SJeremy L Thompson     // Operator fallback
2180d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2181d04bbc78SJeremy L Thompson 
21822b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2183d04bbc78SJeremy L Thompson     if (op_fallback) {
21842b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols));
2185eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2186eaf62fffSJeremy L Thompson     }
2187eaf62fffSJeremy L Thompson   }
2188eaf62fffSJeremy L Thompson 
2189eaf62fffSJeremy L Thompson   // Default interface implementation
2190eaf62fffSJeremy L Thompson 
2191506b1a0cSSebastian Grimberg   // Count entries and allocate rows, cols arrays
2192eaf62fffSJeremy L Thompson   *num_entries = 0;
2193eaf62fffSJeremy L Thompson   if (is_composite) {
2194c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2195c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
219692ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
21972b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
2198eaf62fffSJeremy L Thompson       *num_entries += single_entries;
2199eaf62fffSJeremy L Thompson     }
2200eaf62fffSJeremy L Thompson   } else {
22012b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries));
2202eaf62fffSJeremy L Thompson     *num_entries += single_entries;
2203eaf62fffSJeremy L Thompson   }
22042b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, rows));
22052b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, cols));
2206eaf62fffSJeremy L Thompson 
2207506b1a0cSSebastian Grimberg   // Assemble nonzero locations
2208eaf62fffSJeremy L Thompson   if (is_composite) {
2209c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2210c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
221192ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
22122b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols));
22132b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
2214eaf62fffSJeremy L Thompson       offset += single_entries;
2215eaf62fffSJeremy L Thompson     }
2216eaf62fffSJeremy L Thompson   } else {
22172b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols));
2218eaf62fffSJeremy L Thompson   }
2219eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2220eaf62fffSJeremy L Thompson }
2221eaf62fffSJeremy L Thompson 
2222eaf62fffSJeremy L Thompson /**
2223eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero entries of a linear operator.
2224eaf62fffSJeremy L Thompson 
2225ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic().
2226eaf62fffSJeremy L Thompson 
2227ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
22289fd66db6SSebastian Grimberg matrix in entry (i, j).
22299fd66db6SSebastian Grimberg   Note that the (i, j) pairs are not unique and may repeat.
22309fd66db6SSebastian Grimberg   This function returns the values of the nonzero entries to be added, their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic()
2231eaf62fffSJeremy L Thompson 
2232eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
2233eaf62fffSJeremy L Thompson 
2234ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2235f04ea552SJeremy L Thompson 
2236eaf62fffSJeremy L Thompson    @param[in]  op     CeedOperator to assemble
2237eaf62fffSJeremy L Thompson    @param[out] values Values to assemble into matrix
2238eaf62fffSJeremy L Thompson 
2239eaf62fffSJeremy L Thompson    @ref User
2240eaf62fffSJeremy L Thompson **/
2241eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) {
22421c66c397SJeremy L Thompson   bool          is_composite;
22431c66c397SJeremy L Thompson   CeedInt       num_suboperators, offset = 0;
2244b94338b9SJed Brown   CeedSize      single_entries = 0;
2245eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
22461c66c397SJeremy L Thompson 
22472b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2248f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
2249f3d47e36SJeremy L Thompson 
2250f3d47e36SJeremy L Thompson   // Early exit for empty operator
2251f3d47e36SJeremy L Thompson   if (!is_composite) {
2252f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
2253f3d47e36SJeremy L Thompson 
2254f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
2255f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
2256f3d47e36SJeremy L Thompson   }
2257eaf62fffSJeremy L Thompson 
2258eaf62fffSJeremy L Thompson   if (op->LinearAssemble) {
2259d04bbc78SJeremy L Thompson     // Backend version
22602b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemble(op, values));
2261eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2262eaf62fffSJeremy L Thompson   } else {
2263d04bbc78SJeremy L Thompson     // Operator fallback
2264d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2265d04bbc78SJeremy L Thompson 
22662b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2267d04bbc78SJeremy L Thompson     if (op_fallback) {
22682b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemble(op_fallback, values));
2269eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2270eaf62fffSJeremy L Thompson     }
2271eaf62fffSJeremy L Thompson   }
2272eaf62fffSJeremy L Thompson 
2273eaf62fffSJeremy L Thompson   // Default interface implementation
227428ec399dSJeremy L Thompson   CeedCall(CeedVectorSetValue(values, 0.0));
2275eaf62fffSJeremy L Thompson   if (is_composite) {
2276c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2277c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
2278cefa2673SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; k++) {
22792b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values));
22802b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
2281eaf62fffSJeremy L Thompson       offset += single_entries;
2282eaf62fffSJeremy L Thompson     }
2283eaf62fffSJeremy L Thompson   } else {
22842b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemble(op, offset, values));
2285eaf62fffSJeremy L Thompson   }
2286eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2287eaf62fffSJeremy L Thompson }
2288eaf62fffSJeremy L Thompson 
2289eaf62fffSJeremy L Thompson /**
229075f0d5a4SJeremy L Thompson   @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator
229175f0d5a4SJeremy L Thompson 
229275f0d5a4SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
229375f0d5a4SJeremy L Thompson 
229475f0d5a4SJeremy L Thompson   @param[in]  op               Composite CeedOperator
229575f0d5a4SJeremy L Thompson   @param[in]  num_skip_indices Number of suboperators to skip
229675f0d5a4SJeremy L Thompson   @param[in]  skip_indices     Array of indices of suboperators to skip
229775f0d5a4SJeremy L Thompson   @param[out] mult             Vector to store multiplicity (of size l_size)
229875f0d5a4SJeremy L Thompson 
229975f0d5a4SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
230075f0d5a4SJeremy L Thompson 
230175f0d5a4SJeremy L Thompson   @ref User
230275f0d5a4SJeremy L Thompson **/
230375f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) {
230475f0d5a4SJeremy L Thompson   Ceed                ceed;
2305b275c451SJeremy L Thompson   CeedInt             num_suboperators;
230675f0d5a4SJeremy L Thompson   CeedSize            l_vec_len;
230775f0d5a4SJeremy L Thompson   CeedScalar         *mult_array;
230875f0d5a4SJeremy L Thompson   CeedVector          ones_l_vec;
23097c1dbaffSSebastian Grimberg   CeedElemRestriction elem_rstr, mult_elem_rstr;
2310b275c451SJeremy L Thompson   CeedOperator       *sub_operators;
231175f0d5a4SJeremy L Thompson 
23121c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
23131c66c397SJeremy L Thompson 
231475f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
231575f0d5a4SJeremy L Thompson 
231675f0d5a4SJeremy L Thompson   // Zero mult vector
231775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(mult, 0.0));
231875f0d5a4SJeremy L Thompson 
231975f0d5a4SJeremy L Thompson   // Get suboperators
2320b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
2321b275c451SJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
2322b275c451SJeremy L Thompson   if (num_suboperators == 0) return CEED_ERROR_SUCCESS;
232375f0d5a4SJeremy L Thompson 
232475f0d5a4SJeremy L Thompson   // Work vector
232575f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetLength(mult, &l_vec_len));
232675f0d5a4SJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec));
232775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(ones_l_vec, 1.0));
232875f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array));
232975f0d5a4SJeremy L Thompson 
233075f0d5a4SJeremy L Thompson   // Compute multiplicity across suboperators
2331b275c451SJeremy L Thompson   for (CeedInt i = 0; i < num_suboperators; i++) {
233275f0d5a4SJeremy L Thompson     const CeedScalar *sub_mult_array;
233375f0d5a4SJeremy L Thompson     CeedVector        sub_mult_l_vec, ones_e_vec;
233475f0d5a4SJeremy L Thompson 
233575f0d5a4SJeremy L Thompson     // -- Check for suboperator to skip
233675f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < num_skip_indices; j++) {
233775f0d5a4SJeremy L Thompson       if (skip_indices[j] == i) continue;
233875f0d5a4SJeremy L Thompson     }
233975f0d5a4SJeremy L Thompson 
234075f0d5a4SJeremy L Thompson     // -- Sub operator multiplicity
2341437c7c90SJeremy L Thompson     CeedCall(CeedOperatorGetActiveElemRestriction(sub_operators[i], &elem_rstr));
23427c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateUnorientedCopy(elem_rstr, &mult_elem_rstr));
23437c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateVector(mult_elem_rstr, &sub_mult_l_vec, &ones_e_vec));
234475f0d5a4SJeremy L Thompson     CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0));
23457c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE));
23467c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionApply(mult_elem_rstr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE));
234775f0d5a4SJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array));
234875f0d5a4SJeremy L Thompson     // ---- Flag every node present in the current suboperator
234975f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < l_vec_len; j++) {
235075f0d5a4SJeremy L Thompson       if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0;
235175f0d5a4SJeremy L Thompson     }
235275f0d5a4SJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array));
235375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&sub_mult_l_vec));
235475f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&ones_e_vec));
23557c1dbaffSSebastian Grimberg     CeedCall(CeedElemRestrictionDestroy(&mult_elem_rstr));
235675f0d5a4SJeremy L Thompson   }
235775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorRestoreArray(mult, &mult_array));
2358811d0ccfSJeremy L Thompson   CeedCall(CeedVectorDestroy(&ones_l_vec));
235975f0d5a4SJeremy L Thompson   return CEED_ERROR_SUCCESS;
236075f0d5a4SJeremy L Thompson }
236175f0d5a4SJeremy L Thompson 
236275f0d5a4SJeremy L Thompson /**
2363ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse
2364ea61e9acSJeremy L Thompson grid interpolation
2365eaf62fffSJeremy L Thompson 
236658e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2367f04ea552SJeremy L Thompson 
2368eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
236985bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2370eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
2371eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
2372eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
237385bb9dcfSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator, or NULL
23747758292fSSebastian Grimberg   @param[out] op_restrict  Fine to coarse operator, or NULL
2375eaf62fffSJeremy L Thompson 
2376eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2377eaf62fffSJeremy L Thompson 
2378eaf62fffSJeremy L Thompson   @ref User
2379eaf62fffSJeremy L Thompson **/
23802b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
23817758292fSSebastian Grimberg                                      CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
23821c66c397SJeremy L Thompson   CeedBasis basis_c_to_f = NULL;
23831c66c397SJeremy L Thompson 
23842b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2385eaf62fffSJeremy L Thompson 
238683d6adf3SZach Atkins   // Build prolongation matrix, if required
23877758292fSSebastian Grimberg   if (op_prolong || op_restrict) {
238883d6adf3SZach Atkins     CeedBasis basis_fine;
23891c66c397SJeremy L Thompson 
23902b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
23912b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f));
239283d6adf3SZach Atkins   }
2393eaf62fffSJeremy L Thompson 
2394f113e5dcSJeremy L Thompson   // Core code
23957758292fSSebastian Grimberg   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2396eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2397eaf62fffSJeremy L Thompson }
2398eaf62fffSJeremy L Thompson 
2399eaf62fffSJeremy L Thompson /**
2400ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis
2401eaf62fffSJeremy L Thompson 
240258e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2403f04ea552SJeremy L Thompson 
2404eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
240585bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2406eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2407eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
240885bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2409eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
241085bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
24117758292fSSebastian Grimberg   @param[out] op_restrict   Fine to coarse operator, or NULL
2412eaf62fffSJeremy L Thompson 
2413eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2414eaf62fffSJeremy L Thompson 
2415eaf62fffSJeremy L Thompson   @ref User
2416eaf62fffSJeremy L Thompson **/
24172b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
24182b730f8bSJeremy L Thompson                                              const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
24197758292fSSebastian Grimberg                                              CeedOperator *op_restrict) {
2420eaf62fffSJeremy L Thompson   Ceed      ceed;
24211c66c397SJeremy L Thompson   CeedInt   Q_f, Q_c;
24221c66c397SJeremy L Thompson   CeedBasis basis_fine, basis_c_to_f = NULL;
24231c66c397SJeremy L Thompson 
24241c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
24252b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2426eaf62fffSJeremy L Thompson 
2427eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
24282b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
24292b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
24302b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
24316574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2432eaf62fffSJeremy L Thompson 
243383d6adf3SZach Atkins   // Create coarse to fine basis, if required
24347758292fSSebastian Grimberg   if (op_prolong || op_restrict) {
24351c66c397SJeremy L Thompson     CeedInt     dim, num_comp, num_nodes_c, P_1d_f, P_1d_c;
24361c66c397SJeremy L Thompson     CeedScalar *q_ref, *q_weight, *grad;
24371c66c397SJeremy L Thompson 
243883d6adf3SZach Atkins     // Check if interpolation matrix is provided
24396574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
24406574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
24412b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
24422b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
24432b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f));
24442b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
24452b730f8bSJeremy L Thompson     P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c);
24462b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_ref));
24472b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f, &q_weight));
24482b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad));
24492b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
24502b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
24512b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
24522b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
245383d6adf3SZach Atkins   }
2454eaf62fffSJeremy L Thompson 
2455eaf62fffSJeremy L Thompson   // Core code
24567758292fSSebastian Grimberg   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2457eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2458eaf62fffSJeremy L Thompson }
2459eaf62fffSJeremy L Thompson 
2460eaf62fffSJeremy L Thompson /**
2461ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector
2462eaf62fffSJeremy L Thompson 
246358e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
2464f04ea552SJeremy L Thompson 
2465eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
246685bb9dcfSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter, or NULL if not creating prolongation/restriction operators
2467eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
2468eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
246985bb9dcfSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation, or NULL if not creating prolongation/restriction operators
2470eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
247185bb9dcfSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator, or NULL
24727758292fSSebastian Grimberg   @param[out] op_restrict   Fine to coarse operator, or NULL
2473eaf62fffSJeremy L Thompson 
2474eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2475eaf62fffSJeremy L Thompson 
2476eaf62fffSJeremy L Thompson   @ref User
2477eaf62fffSJeremy L Thompson **/
24782b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
24797758292fSSebastian Grimberg                                        const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
24807758292fSSebastian Grimberg                                        CeedOperator *op_restrict) {
2481eaf62fffSJeremy L Thompson   Ceed      ceed;
24821c66c397SJeremy L Thompson   CeedInt   Q_f, Q_c;
24831c66c397SJeremy L Thompson   CeedBasis basis_fine, basis_c_to_f = NULL;
24841c66c397SJeremy L Thompson 
24851c66c397SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
24862b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2487eaf62fffSJeremy L Thompson 
2488eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
24892b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
24902b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
24912b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
24926574a04fSJeremy L Thompson   CeedCheck(Q_f == Q_c, ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2493eaf62fffSJeremy L Thompson 
2494eaf62fffSJeremy L Thompson   // Coarse to fine basis
24957758292fSSebastian Grimberg   if (op_prolong || op_restrict) {
24961c66c397SJeremy L Thompson     CeedInt          dim, num_comp, num_nodes_c, num_nodes_f;
24971c66c397SJeremy L Thompson     CeedScalar      *q_ref, *q_weight, *grad;
24981c66c397SJeremy L Thompson     CeedElemTopology topo;
24991c66c397SJeremy L Thompson 
250083d6adf3SZach Atkins     // Check if interpolation matrix is provided
25016574a04fSJeremy L Thompson     CeedCheck(interp_c_to_f, ceed, CEED_ERROR_INCOMPATIBLE,
25026574a04fSJeremy L Thompson               "Prolongation or restriction operator creation requires coarse-to-fine interpolation matrix");
25032b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetTopology(basis_fine, &topo));
25042b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetDimension(basis_fine, &dim));
25052b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
25062b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f));
25072b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
25082b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref));
25092b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f, &q_weight));
25102b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad));
25112b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
25122b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref));
25132b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight));
25142b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad));
251583d6adf3SZach Atkins   }
2516eaf62fffSJeremy L Thompson 
2517eaf62fffSJeremy L Thompson   // Core code
25187758292fSSebastian Grimberg   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2519eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2520eaf62fffSJeremy L Thompson }
2521eaf62fffSJeremy L Thompson 
2522eaf62fffSJeremy L Thompson /**
2523ea61e9acSJeremy L Thompson   @brief Build a FDM based approximate inverse for each element for a CeedOperator
2524eaf62fffSJeremy L Thompson 
2525ea61e9acSJeremy L Thompson   This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse.
2526859c15bbSJames Wright   This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, \f$M = V^T V, K = V^T S V\f$.
2527859c15bbSJames Wright   The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form \f$V^T
25289fd66db6SSebastian Grimberg \hat S V\f$.
25299fd66db6SSebastian Grimberg   The CeedOperator must be linear and non-composite.
25309fd66db6SSebastian Grimberg   The associated CeedQFunction must therefore also be linear.
2531eaf62fffSJeremy L Thompson 
2532ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2533f04ea552SJeremy L Thompson 
2534ea61e9acSJeremy L Thompson   @param[in]  op      CeedOperator to create element inverses
2535ea61e9acSJeremy L Thompson   @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element
2536ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2537eaf62fffSJeremy L Thompson 
2538eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2539eaf62fffSJeremy L Thompson 
2540480fae85SJeremy L Thompson   @ref User
2541eaf62fffSJeremy L Thompson **/
25422b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) {
25431c66c397SJeremy L Thompson   Ceed                 ceed, ceed_parent;
25441c66c397SJeremy L Thompson   bool                 interp = false, grad = false, is_tensor_basis = true;
25451c66c397SJeremy L Thompson   CeedInt              num_input_fields, P_1d, Q_1d, num_nodes, num_qpts, dim, num_comp = 1, num_elem = 1;
25461c66c397SJeremy L Thompson   CeedSize             l_size = 1;
25471c66c397SJeremy L Thompson   CeedScalar          *mass, *laplace, *x, *fdm_interp, *lambda, *elem_avg;
25481c66c397SJeremy L Thompson   const CeedScalar    *interp_1d, *grad_1d, *q_weight_1d;
25491c66c397SJeremy L Thompson   CeedVector           q_data;
25501c66c397SJeremy L Thompson   CeedElemRestriction  rstr  = NULL, rstr_qd_i;
25511c66c397SJeremy L Thompson   CeedBasis            basis = NULL, fdm_basis;
25521c66c397SJeremy L Thompson   CeedQFunctionContext ctx_fdm;
25531c66c397SJeremy L Thompson   CeedQFunctionField  *qf_fields;
25541c66c397SJeremy L Thompson   CeedQFunction        qf, qf_fdm;
25551c66c397SJeremy L Thompson   CeedOperatorField   *op_fields;
25561c66c397SJeremy L Thompson 
25572b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2558eaf62fffSJeremy L Thompson 
2559eaf62fffSJeremy L Thompson   if (op->CreateFDMElementInverse) {
2560d04bbc78SJeremy L Thompson     // Backend version
25612b730f8bSJeremy L Thompson     CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request));
2562eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2563eaf62fffSJeremy L Thompson   } else {
2564d04bbc78SJeremy L Thompson     // Operator fallback
2565d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2566d04bbc78SJeremy L Thompson 
25672b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2568d04bbc78SJeremy L Thompson     if (op_fallback) {
25692b730f8bSJeremy L Thompson       CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request));
2570eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2571eaf62fffSJeremy L Thompson     }
2572eaf62fffSJeremy L Thompson   }
2573eaf62fffSJeremy L Thompson 
2574d04bbc78SJeremy L Thompson   // Default interface implementation
25752b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
2576bb229da9SJeremy L Thompson   CeedCall(CeedOperatorGetFallbackParentCeed(op, &ceed_parent));
25772b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
2578eaf62fffSJeremy L Thompson 
2579eaf62fffSJeremy L Thompson   // Determine active input basis
25802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL));
25812b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL));
2582eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
2583eaf62fffSJeremy L Thompson     CeedVector vec;
25841c66c397SJeremy L Thompson 
25852b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
2586eaf62fffSJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
2587eaf62fffSJeremy L Thompson       CeedEvalMode eval_mode;
25881c66c397SJeremy L Thompson 
25892b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
2590eaf62fffSJeremy L Thompson       interp = interp || eval_mode == CEED_EVAL_INTERP;
2591eaf62fffSJeremy L Thompson       grad   = grad || eval_mode == CEED_EVAL_GRAD;
25922b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis));
25932b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr));
2594eaf62fffSJeremy L Thompson     }
2595eaf62fffSJeremy L Thompson   }
25966574a04fSJeremy L Thompson   CeedCheck(basis, ceed, CEED_ERROR_BACKEND, "No active field set");
25972b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d));
2598352a5e7cSSebastian Grimberg   CeedCall(CeedBasisGetNumNodes(basis, &num_nodes));
25992b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d));
26002b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts));
26012b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis, &dim));
26022b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis, &num_comp));
26032b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
26042b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2605eaf62fffSJeremy L Thompson 
2606eaf62fffSJeremy L Thompson   // Build and diagonalize 1D Mass and Laplacian
26076574a04fSJeremy L Thompson   CeedCall(CeedBasisIsTensor(basis, &is_tensor_basis));
26086574a04fSJeremy L Thompson   CeedCheck(is_tensor_basis, ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases");
26092b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &mass));
26102b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &laplace));
26112b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &x));
26122b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp));
26132b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &lambda));
2614eaf62fffSJeremy L Thompson   // -- Build matrices
26152b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp1D(basis, &interp_1d));
26162b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad1D(basis, &grad_1d));
26172b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d));
26182b730f8bSJeremy L Thompson   CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace));
2619eaf62fffSJeremy L Thompson 
2620eaf62fffSJeremy L Thompson   // -- Diagonalize
26212b730f8bSJeremy L Thompson   CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d));
26222b730f8bSJeremy L Thompson   CeedCall(CeedFree(&mass));
26232b730f8bSJeremy L Thompson   CeedCall(CeedFree(&laplace));
26242b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
26252b730f8bSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d];
26262b730f8bSJeremy L Thompson   }
26272b730f8bSJeremy L Thompson   CeedCall(CeedFree(&x));
2628eaf62fffSJeremy L Thompson 
26291c66c397SJeremy L Thompson   {
26301c66c397SJeremy L Thompson     CeedInt             layout[3], num_modes = (interp ? 1 : 0) + (grad ? dim : 0);
26311c66c397SJeremy L Thompson     CeedScalar          max_norm = 0;
26321c66c397SJeremy L Thompson     const CeedScalar   *assembled_array, *q_weight_array;
26331c66c397SJeremy L Thompson     CeedVector          assembled = NULL, q_weight;
2634c5f45aeaSJeremy L Thompson     CeedElemRestriction rstr_qf   = NULL;
26351c66c397SJeremy L Thompson 
26361c66c397SJeremy L Thompson     // Assemble QFunction
26372b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request));
26382b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout));
26392b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&rstr_qf));
26402b730f8bSJeremy L Thompson     CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm));
2641eaf62fffSJeremy L Thompson 
2642eaf62fffSJeremy L Thompson     // Calculate element averages
26432b730f8bSJeremy L Thompson     CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight));
26442b730f8bSJeremy L Thompson     CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight));
26452b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array));
26462b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array));
26472b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_elem, &elem_avg));
2648eaf62fffSJeremy L Thompson     const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON;
26491c66c397SJeremy L Thompson 
2650eaf62fffSJeremy L Thompson     for (CeedInt e = 0; e < num_elem; e++) {
2651eaf62fffSJeremy L Thompson       CeedInt count = 0;
26521c66c397SJeremy L Thompson 
26532b730f8bSJeremy L Thompson       for (CeedInt q = 0; q < num_qpts; q++) {
26542b730f8bSJeremy L Thompson         for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) {
26552b730f8bSJeremy L Thompson           if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) {
26562b730f8bSJeremy L Thompson             elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q];
2657eaf62fffSJeremy L Thompson             count++;
2658eaf62fffSJeremy L Thompson           }
26592b730f8bSJeremy L Thompson         }
26602b730f8bSJeremy L Thompson       }
2661eaf62fffSJeremy L Thompson       if (count) {
2662eaf62fffSJeremy L Thompson         elem_avg[e] /= count;
2663eaf62fffSJeremy L Thompson       } else {
2664eaf62fffSJeremy L Thompson         elem_avg[e] = 1.0;
2665eaf62fffSJeremy L Thompson       }
2666eaf62fffSJeremy L Thompson     }
26672b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array));
26682b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled));
26692b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array));
26702b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&q_weight));
26711c66c397SJeremy L Thompson   }
2672eaf62fffSJeremy L Thompson 
2673eaf62fffSJeremy L Thompson   // Build FDM diagonal
26741c66c397SJeremy L Thompson   {
2675eaf62fffSJeremy L Thompson     CeedScalar *q_data_array, *fdm_diagonal;
26761c66c397SJeremy L Thompson 
2677352a5e7cSSebastian Grimberg     CeedCall(CeedCalloc(num_comp * num_nodes, &fdm_diagonal));
2678352a5e7cSSebastian Grimberg     const CeedScalar fdm_diagonal_bound = num_nodes * CEED_EPSILON;
26792b730f8bSJeremy L Thompson     for (CeedInt c = 0; c < num_comp; c++) {
2680352a5e7cSSebastian Grimberg       for (CeedInt n = 0; n < num_nodes; n++) {
2681352a5e7cSSebastian Grimberg         if (interp) fdm_diagonal[c * num_nodes + n] = 1.0;
26822b730f8bSJeremy L Thompson         if (grad) {
2683eaf62fffSJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
2684eaf62fffSJeremy L Thompson             CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d;
2685352a5e7cSSebastian Grimberg             fdm_diagonal[c * num_nodes + n] += lambda[i];
2686eaf62fffSJeremy L Thompson           }
2687eaf62fffSJeremy L Thompson         }
2688352a5e7cSSebastian Grimberg         if (fabs(fdm_diagonal[c * num_nodes + n]) < fdm_diagonal_bound) fdm_diagonal[c * num_nodes + n] = fdm_diagonal_bound;
26892b730f8bSJeremy L Thompson       }
26902b730f8bSJeremy L Thompson     }
2691352a5e7cSSebastian Grimberg     CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * num_nodes, &q_data));
26922b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(q_data, 0.0));
26932b730f8bSJeremy L Thompson     CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array));
26942b730f8bSJeremy L Thompson     for (CeedInt e = 0; e < num_elem; e++) {
26952b730f8bSJeremy L Thompson       for (CeedInt c = 0; c < num_comp; c++) {
26961c66c397SJeremy L Thompson         for (CeedInt n = 0; n < num_nodes; n++)
26971c66c397SJeremy L Thompson           q_data_array[(e * num_comp + c) * num_nodes + n] = 1. / (elem_avg[e] * fdm_diagonal[c * num_nodes + n]);
26982b730f8bSJeremy L Thompson       }
26992b730f8bSJeremy L Thompson     }
27002b730f8bSJeremy L Thompson     CeedCall(CeedFree(&elem_avg));
27012b730f8bSJeremy L Thompson     CeedCall(CeedFree(&fdm_diagonal));
27022b730f8bSJeremy L Thompson     CeedCall(CeedVectorRestoreArray(q_data, &q_data_array));
27031c66c397SJeremy L Thompson   }
2704eaf62fffSJeremy L Thompson 
2705eaf62fffSJeremy L Thompson   // Setup FDM operator
2706eaf62fffSJeremy L Thompson   // -- Basis
27071c66c397SJeremy L Thompson   {
2708eaf62fffSJeremy L Thompson     CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy;
27091c66c397SJeremy L Thompson 
27102b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy));
27112b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d, &q_ref_dummy));
27122b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(P_1d, &q_weight_dummy));
27132b730f8bSJeremy L Thompson     CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis));
27142b730f8bSJeremy L Thompson     CeedCall(CeedFree(&fdm_interp));
27152b730f8bSJeremy L Thompson     CeedCall(CeedFree(&grad_dummy));
27162b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_ref_dummy));
27172b730f8bSJeremy L Thompson     CeedCall(CeedFree(&q_weight_dummy));
27182b730f8bSJeremy L Thompson     CeedCall(CeedFree(&lambda));
27191c66c397SJeremy L Thompson   }
2720eaf62fffSJeremy L Thompson 
2721eaf62fffSJeremy L Thompson   // -- Restriction
27221c66c397SJeremy L Thompson   {
2723352a5e7cSSebastian Grimberg     CeedInt strides[3] = {1, num_nodes, num_nodes * num_comp};
2724352a5e7cSSebastian Grimberg     CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, num_nodes, num_comp, num_elem * num_comp * num_nodes, strides, &rstr_qd_i));
27251c66c397SJeremy L Thompson   }
27261c66c397SJeremy L Thompson 
2727eaf62fffSJeremy L Thompson   // -- QFunction
27282b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm));
27292b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP));
27302b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE));
27312b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP));
27322b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp));
27331c66c397SJeremy L Thompson 
2734eaf62fffSJeremy L Thompson   // -- QFunction context
27351c66c397SJeremy L Thompson   {
2736eaf62fffSJeremy L Thompson     CeedInt *num_comp_data;
27371c66c397SJeremy L Thompson 
27382b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &num_comp_data));
2739eaf62fffSJeremy L Thompson     num_comp_data[0] = num_comp;
27402b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm));
27412b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data));
27421c66c397SJeremy L Thompson   }
27432b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm));
27442b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_fdm));
27451c66c397SJeremy L Thompson 
2746eaf62fffSJeremy L Thompson   // -- Operator
27472b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv));
27482b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2749356036faSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_NONE, q_data));
27502b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2751eaf62fffSJeremy L Thompson 
2752eaf62fffSJeremy L Thompson   // Cleanup
27532b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_data));
27542b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&fdm_basis));
27552b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i));
27562b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_fdm));
2757eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2758eaf62fffSJeremy L Thompson }
2759eaf62fffSJeremy L Thompson 
2760eaf62fffSJeremy L Thompson /// @}
2761