xref: /libCEED/interface/ceed-preconditioning.c (revision f3d47e3642aeddb363a2ee1bc484555cc57cbb59)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3eaf62fffSJeremy L Thompson //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5eaf62fffSJeremy L Thompson //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7eaf62fffSJeremy L Thompson 
8ed9e99e6SJeremy L Thompson #include <assert.h>
92b730f8bSJeremy L Thompson #include <ceed-impl.h>
102b730f8bSJeremy L Thompson #include <ceed/backend.h>
112b730f8bSJeremy L Thompson #include <ceed/ceed.h>
122b730f8bSJeremy L Thompson #include <math.h>
13eaf62fffSJeremy L Thompson #include <stdbool.h>
14eaf62fffSJeremy L Thompson #include <stdio.h>
15eaf62fffSJeremy L Thompson #include <string.h>
16eaf62fffSJeremy L Thompson 
17eaf62fffSJeremy L Thompson /// @file
18eaf62fffSJeremy L Thompson /// Implementation of CeedOperator preconditioning interfaces
19eaf62fffSJeremy L Thompson 
20eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
21eaf62fffSJeremy L Thompson /// CeedOperator Library Internal Preconditioning Functions
22eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
23eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorDeveloper
24eaf62fffSJeremy L Thompson /// @{
25eaf62fffSJeremy L Thompson 
26eaf62fffSJeremy L Thompson /**
27ea61e9acSJeremy L Thompson   @brief Duplicate a CeedQFunction with a reference Ceed to fallback for advanced CeedOperator functionality
289e77b9c8SJeremy L Thompson 
2901ea9c81SJed Brown   @param[in]  fallback_ceed Ceed on which to create fallback CeedQFunction
309e77b9c8SJeremy L Thompson   @param[in]  qf            CeedQFunction to create fallback for
3101ea9c81SJed Brown   @param[out] qf_fallback   fallback CeedQFunction
329e77b9c8SJeremy L Thompson 
339e77b9c8SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
349e77b9c8SJeremy L Thompson 
359e77b9c8SJeremy L Thompson   @ref Developer
369e77b9c8SJeremy L Thompson **/
372b730f8bSJeremy L Thompson static int CeedQFunctionCreateFallback(Ceed fallback_ceed, CeedQFunction qf, CeedQFunction *qf_fallback) {
389e77b9c8SJeremy L Thompson   // Check if NULL qf passed in
399e77b9c8SJeremy L Thompson   if (!qf) return CEED_ERROR_SUCCESS;
409e77b9c8SJeremy L Thompson 
41d04bbc78SJeremy L Thompson   CeedDebug256(qf->ceed, 1, "---------- CeedOperator Fallback ----------\n");
4213f886e9SJeremy L Thompson   CeedDebug(qf->ceed, "Creating fallback CeedQFunction\n");
43d04bbc78SJeremy L Thompson 
449e77b9c8SJeremy L Thompson   char *source_path_with_name = "";
459e77b9c8SJeremy L Thompson   if (qf->source_path) {
462b730f8bSJeremy L Thompson     size_t path_len = strlen(qf->source_path), name_len = strlen(qf->kernel_name);
472b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(path_len + name_len + 2, &source_path_with_name));
489e77b9c8SJeremy L Thompson     memcpy(source_path_with_name, qf->source_path, path_len);
499e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len], ":", 1);
509e77b9c8SJeremy L Thompson     memcpy(&source_path_with_name[path_len + 1], qf->kernel_name, name_len);
519e77b9c8SJeremy L Thompson   } else {
522b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(1, &source_path_with_name));
539e77b9c8SJeremy L Thompson   }
549e77b9c8SJeremy L Thompson 
552b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInterior(fallback_ceed, qf->vec_length, qf->function, source_path_with_name, qf_fallback));
569e77b9c8SJeremy L Thompson   {
579e77b9c8SJeremy L Thompson     CeedQFunctionContext ctx;
589e77b9c8SJeremy L Thompson 
592b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionGetContext(qf, &ctx));
602b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionSetContext(*qf_fallback, ctx));
619e77b9c8SJeremy L Thompson   }
629e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_input_fields; i++) {
632b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddInput(*qf_fallback, qf->input_fields[i]->field_name, qf->input_fields[i]->size, qf->input_fields[i]->eval_mode));
649e77b9c8SJeremy L Thompson   }
659e77b9c8SJeremy L Thompson   for (CeedInt i = 0; i < qf->num_output_fields; i++) {
662b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAddOutput(*qf_fallback, qf->output_fields[i]->field_name, qf->output_fields[i]->size, qf->output_fields[i]->eval_mode));
679e77b9c8SJeremy L Thompson   }
682b730f8bSJeremy L Thompson   CeedCall(CeedFree(&source_path_with_name));
699e77b9c8SJeremy L Thompson 
709e77b9c8SJeremy L Thompson   return CEED_ERROR_SUCCESS;
719e77b9c8SJeremy L Thompson }
729e77b9c8SJeremy L Thompson 
739e77b9c8SJeremy L Thompson /**
74ea61e9acSJeremy L Thompson   @brief Duplicate a CeedOperator with a reference Ceed to fallback for advanced CeedOperator functionality
75eaf62fffSJeremy L Thompson 
76ea61e9acSJeremy L Thompson   @param[in,out] op CeedOperator to create fallback for
77eaf62fffSJeremy L Thompson 
78eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
79eaf62fffSJeremy L Thompson 
80eaf62fffSJeremy L Thompson   @ref Developer
81eaf62fffSJeremy L Thompson **/
82d04bbc78SJeremy L Thompson static int CeedOperatorCreateFallback(CeedOperator op) {
839e77b9c8SJeremy L Thompson   Ceed ceed_fallback;
84eaf62fffSJeremy L Thompson 
85805fe78eSJeremy L Thompson   // Check not already created
86805fe78eSJeremy L Thompson   if (op->op_fallback) return CEED_ERROR_SUCCESS;
87805fe78eSJeremy L Thompson 
88eaf62fffSJeremy L Thompson   // Fallback Ceed
892b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
90d04bbc78SJeremy L Thompson   if (!ceed_fallback) return CEED_ERROR_SUCCESS;
91d04bbc78SJeremy L Thompson 
92d04bbc78SJeremy L Thompson   CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
9313f886e9SJeremy L Thompson   CeedDebug(op->ceed, "Creating fallback CeedOperator\n");
94eaf62fffSJeremy L Thompson 
95eaf62fffSJeremy L Thompson   // Clone Op
96805fe78eSJeremy L Thompson   CeedOperator op_fallback;
97805fe78eSJeremy L Thompson   if (op->is_composite) {
982b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorCreate(ceed_fallback, &op_fallback));
99805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->num_suboperators; i++) {
100d04bbc78SJeremy L Thompson       CeedOperator op_sub_fallback;
101d04bbc78SJeremy L Thompson 
1022b730f8bSJeremy L Thompson       CeedCall(CeedOperatorGetFallback(op->sub_operators[i], &op_sub_fallback));
1032b730f8bSJeremy L Thompson       CeedCall(CeedCompositeOperatorAddSub(op_fallback, op_sub_fallback));
104805fe78eSJeremy L Thompson     }
105805fe78eSJeremy L Thompson   } else {
1069e77b9c8SJeremy L Thompson     CeedQFunction qf_fallback = NULL, dqf_fallback = NULL, dqfT_fallback = NULL;
1072b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->qf, &qf_fallback));
1082b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqf, &dqf_fallback));
1092b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionCreateFallback(ceed_fallback, op->dqfT, &dqfT_fallback));
1102b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreate(ceed_fallback, qf_fallback, dqf_fallback, dqfT_fallback, &op_fallback));
111805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_input_fields; i++) {
1122b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->input_fields[i]->field_name, op->input_fields[i]->elem_restr, op->input_fields[i]->basis,
1132b730f8bSJeremy L Thompson                                     op->input_fields[i]->vec));
114805fe78eSJeremy L Thompson     }
115805fe78eSJeremy L Thompson     for (CeedInt i = 0; i < op->qf->num_output_fields; i++) {
1162b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(op_fallback, op->output_fields[i]->field_name, op->output_fields[i]->elem_restr, op->output_fields[i]->basis,
1172b730f8bSJeremy L Thompson                                     op->output_fields[i]->vec));
118805fe78eSJeremy L Thompson     }
1192b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op->qf_assembled, &op_fallback->qf_assembled));
120805fe78eSJeremy L Thompson     if (op_fallback->num_qpts == 0) {
1212b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetNumQuadraturePoints(op_fallback, op->num_qpts));
122805fe78eSJeremy L Thompson     }
1239e77b9c8SJeremy L Thompson     // Cleanup
1242b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&qf_fallback));
1252b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqf_fallback));
1262b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionDestroy(&dqfT_fallback));
127805fe78eSJeremy L Thompson   }
1282b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(op_fallback, op->name));
1292b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fallback));
130805fe78eSJeremy L Thompson   op->op_fallback = op_fallback;
131eaf62fffSJeremy L Thompson 
132eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
133eaf62fffSJeremy L Thompson }
134eaf62fffSJeremy L Thompson 
135eaf62fffSJeremy L Thompson /**
136ea61e9acSJeremy L Thompson   @brief Retrieve fallback CeedOperator with a reference Ceed for advanced CeedOperator functionality
137d04bbc78SJeremy L Thompson 
138d04bbc78SJeremy L Thompson   @param[in]  op          CeedOperator to retrieve fallback for
139d04bbc78SJeremy L Thompson   @param[out] op_fallback Fallback CeedOperator
140d04bbc78SJeremy L Thompson 
141d04bbc78SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
142d04bbc78SJeremy L Thompson 
143d04bbc78SJeremy L Thompson   @ref Developer
144d04bbc78SJeremy L Thompson **/
145d04bbc78SJeremy L Thompson int CeedOperatorGetFallback(CeedOperator op, CeedOperator *op_fallback) {
146d04bbc78SJeremy L Thompson   // Create if needed
147d04bbc78SJeremy L Thompson   if (!op->op_fallback) {
1482b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreateFallback(op));
149d04bbc78SJeremy L Thompson   }
150d04bbc78SJeremy L Thompson   if (op->op_fallback) {
151d04bbc78SJeremy L Thompson     bool is_debug;
152d04bbc78SJeremy L Thompson 
1532b730f8bSJeremy L Thompson     CeedCall(CeedIsDebug(op->ceed, &is_debug));
154d04bbc78SJeremy L Thompson     if (is_debug) {
155d04bbc78SJeremy L Thompson       Ceed        ceed_fallback;
156d04bbc78SJeremy L Thompson       const char *resource, *resource_fallback;
157d04bbc78SJeremy L Thompson 
1582b730f8bSJeremy L Thompson       CeedCall(CeedGetOperatorFallbackCeed(op->ceed, &ceed_fallback));
1592b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(op->ceed, &resource));
1602b730f8bSJeremy L Thompson       CeedCall(CeedGetResource(ceed_fallback, &resource_fallback));
161d04bbc78SJeremy L Thompson 
162d04bbc78SJeremy L Thompson       CeedDebug256(op->ceed, 1, "---------- CeedOperator Fallback ----------\n");
1632b730f8bSJeremy L Thompson       CeedDebug(op->ceed, "Falling back from %s operator at address %ld to %s operator at address %ld\n", resource, op, resource_fallback,
1642b730f8bSJeremy L Thompson                 op->op_fallback);
165d04bbc78SJeremy L Thompson     }
166d04bbc78SJeremy L Thompson   }
167d04bbc78SJeremy L Thompson   *op_fallback = op->op_fallback;
168d04bbc78SJeremy L Thompson 
169d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
170d04bbc78SJeremy L Thompson }
171d04bbc78SJeremy L Thompson 
172d04bbc78SJeremy L Thompson /**
173eaf62fffSJeremy L Thompson   @brief Select correct basis matrix pointer based on CeedEvalMode
174eaf62fffSJeremy L Thompson 
175eaf62fffSJeremy L Thompson   @param[in]  eval_mode Current basis evaluation mode
176eaf62fffSJeremy L Thompson   @param[in]  identity  Pointer to identity matrix
177eaf62fffSJeremy L Thompson   @param[in]  interp    Pointer to interpolation matrix
178eaf62fffSJeremy L Thompson   @param[in]  grad      Pointer to gradient matrix
179eaf62fffSJeremy L Thompson   @param[out] basis_ptr Basis pointer to set
180eaf62fffSJeremy L Thompson 
181eaf62fffSJeremy L Thompson   @ref Developer
182eaf62fffSJeremy L Thompson **/
1832b730f8bSJeremy L Thompson static inline void CeedOperatorGetBasisPointer(CeedEvalMode eval_mode, const CeedScalar *identity, const CeedScalar *interp, const CeedScalar *grad,
1842b730f8bSJeremy L Thompson                                                const CeedScalar **basis_ptr) {
185eaf62fffSJeremy L Thompson   switch (eval_mode) {
186eaf62fffSJeremy L Thompson     case CEED_EVAL_NONE:
187eaf62fffSJeremy L Thompson       *basis_ptr = identity;
188eaf62fffSJeremy L Thompson       break;
189eaf62fffSJeremy L Thompson     case CEED_EVAL_INTERP:
190eaf62fffSJeremy L Thompson       *basis_ptr = interp;
191eaf62fffSJeremy L Thompson       break;
192eaf62fffSJeremy L Thompson     case CEED_EVAL_GRAD:
193eaf62fffSJeremy L Thompson       *basis_ptr = grad;
194eaf62fffSJeremy L Thompson       break;
195eaf62fffSJeremy L Thompson     case CEED_EVAL_WEIGHT:
196eaf62fffSJeremy L Thompson     case CEED_EVAL_DIV:
197eaf62fffSJeremy L Thompson     case CEED_EVAL_CURL:
198eaf62fffSJeremy L Thompson       break;  // Caught by QF Assembly
199eaf62fffSJeremy L Thompson   }
200ed9e99e6SJeremy L Thompson   assert(*basis_ptr != NULL);
201eaf62fffSJeremy L Thompson }
202eaf62fffSJeremy L Thompson 
203eaf62fffSJeremy L Thompson /**
204eaf62fffSJeremy L Thompson   @brief Create point block restriction for active operator field
205eaf62fffSJeremy L Thompson 
206eaf62fffSJeremy L Thompson   @param[in]  rstr            Original CeedElemRestriction for active field
207ea61e9acSJeremy L Thompson   @param[out] pointblock_rstr Address of the variable where the newly created CeedElemRestriction will be stored
208eaf62fffSJeremy L Thompson 
209eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
210eaf62fffSJeremy L Thompson 
211eaf62fffSJeremy L Thompson   @ref Developer
212eaf62fffSJeremy L Thompson **/
2132b730f8bSJeremy L Thompson static int CeedOperatorCreateActivePointBlockRestriction(CeedElemRestriction rstr, CeedElemRestriction *pointblock_rstr) {
214eaf62fffSJeremy L Thompson   Ceed ceed;
2152b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCeed(rstr, &ceed));
216eaf62fffSJeremy L Thompson   const CeedInt *offsets;
2172b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetOffsets(rstr, CEED_MEM_HOST, &offsets));
218eaf62fffSJeremy L Thompson 
219eaf62fffSJeremy L Thompson   // Expand offsets
2207b63f5c6SJed Brown   CeedInt  num_elem, num_comp, elem_size, comp_stride, *pointblock_offsets;
2217b63f5c6SJed Brown   CeedSize l_size;
2222b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
2232b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
2242b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
2252b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetCompStride(rstr, &comp_stride));
2262b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
227eaf62fffSJeremy L Thompson   CeedInt shift = num_comp;
2282b730f8bSJeremy L Thompson   if (comp_stride != 1) shift *= num_comp;
2292b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem * elem_size, &pointblock_offsets));
230eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_elem * elem_size; i++) {
231eaf62fffSJeremy L Thompson     pointblock_offsets[i] = offsets[i] * shift;
232eaf62fffSJeremy L Thompson   }
233eaf62fffSJeremy L Thompson 
234eaf62fffSJeremy L Thompson   // Create new restriction
2352b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreate(ceed, num_elem, elem_size, num_comp * num_comp, 1, l_size * num_comp, CEED_MEM_HOST, CEED_OWN_POINTER,
2362b730f8bSJeremy L Thompson                                      pointblock_offsets, pointblock_rstr));
237eaf62fffSJeremy L Thompson 
238eaf62fffSJeremy L Thompson   // Cleanup
2392b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionRestoreOffsets(rstr, &offsets));
240eaf62fffSJeremy L Thompson 
241eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
242eaf62fffSJeremy L Thompson }
243eaf62fffSJeremy L Thompson 
244eaf62fffSJeremy L Thompson /**
245eaf62fffSJeremy L Thompson   @brief Core logic for assembling operator diagonal or point block diagonal
246eaf62fffSJeremy L Thompson 
247eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
248ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
249eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
250eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
251eaf62fffSJeremy L Thompson 
252eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
253eaf62fffSJeremy L Thompson 
254eaf62fffSJeremy L Thompson   @ref Developer
255eaf62fffSJeremy L Thompson **/
2562b730f8bSJeremy L Thompson static inline int CeedSingleOperatorAssembleAddDiagonal_Core(CeedOperator op, CeedRequest *request, const bool is_pointblock, CeedVector assembled) {
257eaf62fffSJeremy L Thompson   Ceed ceed;
2582b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
259eaf62fffSJeremy L Thompson 
260eaf62fffSJeremy L Thompson   // Assemble QFunction
261eaf62fffSJeremy L Thompson   CeedQFunction qf;
2622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
263eaf62fffSJeremy L Thompson   CeedInt num_input_fields, num_output_fields;
2642b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetNumArgs(qf, &num_input_fields, &num_output_fields));
265eaf62fffSJeremy L Thompson   CeedVector          assembled_qf;
266eaf62fffSJeremy L Thompson   CeedElemRestriction rstr;
2672b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr, request));
268eaf62fffSJeremy L Thompson   CeedInt layout[3];
2692b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr, &layout));
2702b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr));
271eaf62fffSJeremy L Thompson 
272ed9e99e6SJeremy L Thompson   // Get assembly data
273ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
2742b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
275ed9e99e6SJeremy L Thompson   const CeedEvalMode *eval_mode_in, *eval_mode_out;
276ed9e99e6SJeremy L Thompson   CeedInt             num_eval_mode_in, num_eval_mode_out;
2772b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out));
278ed9e99e6SJeremy L Thompson   CeedBasis basis_in, basis_out;
2792b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL));
280ed9e99e6SJeremy L Thompson   CeedInt num_comp;
2812b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_in, &num_comp));
282eaf62fffSJeremy L Thompson 
283eaf62fffSJeremy L Thompson   // Assemble point block diagonal restriction, if needed
284ed9e99e6SJeremy L Thompson   CeedElemRestriction diag_rstr;
2852b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &diag_rstr));
286eaf62fffSJeremy L Thompson   if (is_pointblock) {
287ed9e99e6SJeremy L Thompson     CeedElemRestriction point_block_rstr;
2882b730f8bSJeremy L Thompson     CeedCall(CeedOperatorCreateActivePointBlockRestriction(diag_rstr, &point_block_rstr));
289ed9e99e6SJeremy L Thompson     diag_rstr = point_block_rstr;
290eaf62fffSJeremy L Thompson   }
291eaf62fffSJeremy L Thompson 
292eaf62fffSJeremy L Thompson   // Create diagonal vector
293eaf62fffSJeremy L Thompson   CeedVector elem_diag;
2942b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateVector(diag_rstr, NULL, &elem_diag));
295eaf62fffSJeremy L Thompson 
296eaf62fffSJeremy L Thompson   // Assemble element operator diagonals
2979c774eddSJeremy L Thompson   CeedScalar       *elem_diag_array;
2989c774eddSJeremy L Thompson   const CeedScalar *assembled_qf_array;
2992b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_diag, 0.0));
3002b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArray(elem_diag, CEED_MEM_HOST, &elem_diag_array));
3012b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
302eaf62fffSJeremy L Thompson   CeedInt num_elem, num_nodes, num_qpts;
3032b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(diag_rstr, &num_elem));
3042b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes(basis_in, &num_nodes));
3052b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
306ed9e99e6SJeremy L Thompson 
307eaf62fffSJeremy L Thompson   // Basis matrices
308eaf62fffSJeremy L Thompson   const CeedScalar *interp_in, *interp_out, *grad_in, *grad_out;
309eaf62fffSJeremy L Thompson   CeedScalar       *identity      = NULL;
310ed9e99e6SJeremy L Thompson   bool              has_eval_none = false;
311ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_eval_mode_in; i++) {
312ed9e99e6SJeremy L Thompson     has_eval_none = has_eval_none || (eval_mode_in[i] == CEED_EVAL_NONE);
313ed9e99e6SJeremy L Thompson   }
314ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_eval_mode_out; i++) {
315ed9e99e6SJeremy L Thompson     has_eval_none = has_eval_none || (eval_mode_out[i] == CEED_EVAL_NONE);
316ed9e99e6SJeremy L Thompson   }
317ed9e99e6SJeremy L Thompson   if (has_eval_none) {
3182b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * num_nodes, &identity));
3192b730f8bSJeremy L Thompson     for (CeedInt i = 0; i < (num_nodes < num_qpts ? num_nodes : num_qpts); i++) identity[i * num_nodes + i] = 1.0;
320eaf62fffSJeremy L Thompson   }
3212b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_in, &interp_in));
3222b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_out, &interp_out));
3232b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_in, &grad_in));
3242b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_out, &grad_out));
325eaf62fffSJeremy L Thompson   // Compute the diagonal of B^T D B
326eaf62fffSJeremy L Thompson   // Each element
327eaf62fffSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
328eaf62fffSJeremy L Thompson     CeedInt d_out = -1;
329eaf62fffSJeremy L Thompson     // Each basis eval mode pair
330eaf62fffSJeremy L Thompson     for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) {
331eaf62fffSJeremy L Thompson       const CeedScalar *bt = NULL;
3322b730f8bSJeremy L Thompson       if (eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out += 1;
3332b730f8bSJeremy L Thompson       CeedOperatorGetBasisPointer(eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * num_nodes], &bt);
334eaf62fffSJeremy L Thompson       CeedInt d_in = -1;
335eaf62fffSJeremy L Thompson       for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) {
336eaf62fffSJeremy L Thompson         const CeedScalar *b = NULL;
3372b730f8bSJeremy L Thompson         if (eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in += 1;
3382b730f8bSJeremy L Thompson         CeedOperatorGetBasisPointer(eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * num_nodes], &b);
339eaf62fffSJeremy L Thompson         // Each component
3402b730f8bSJeremy L Thompson         for (CeedInt c_out = 0; c_out < num_comp; c_out++) {
341eaf62fffSJeremy L Thompson           // Each qpoint/node pair
3422b730f8bSJeremy L Thompson           for (CeedInt q = 0; q < num_qpts; q++) {
343eaf62fffSJeremy L Thompson             if (is_pointblock) {
344eaf62fffSJeremy L Thompson               // Point Block Diagonal
345eaf62fffSJeremy L Thompson               for (CeedInt c_in = 0; c_in < num_comp; c_in++) {
346eaf62fffSJeremy L Thompson                 const CeedScalar qf_value =
3472b730f8bSJeremy L Thompson                     assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_in) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] +
3482b730f8bSJeremy L Thompson                                        e * layout[2]];
3492b730f8bSJeremy L Thompson                 for (CeedInt n = 0; n < num_nodes; n++) {
350eaf62fffSJeremy L Thompson                   elem_diag_array[((e * num_comp + c_out) * num_comp + c_in) * num_nodes + n] +=
351eaf62fffSJeremy L Thompson                       bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n];
352eaf62fffSJeremy L Thompson                 }
3532b730f8bSJeremy L Thompson               }
354eaf62fffSJeremy L Thompson             } else {
355eaf62fffSJeremy L Thompson               // Diagonal Only
356eaf62fffSJeremy L Thompson               const CeedScalar qf_value =
3572b730f8bSJeremy L Thompson                   assembled_qf_array[q * layout[0] + (((e_in * num_comp + c_out) * num_eval_mode_out + e_out) * num_comp + c_out) * layout[1] +
3582b730f8bSJeremy L Thompson                                      e * layout[2]];
3592b730f8bSJeremy L Thompson               for (CeedInt n = 0; n < num_nodes; n++) {
3602b730f8bSJeremy L Thompson                 elem_diag_array[(e * num_comp + c_out) * num_nodes + n] += bt[q * num_nodes + n] * qf_value * b[q * num_nodes + n];
361eaf62fffSJeremy L Thompson               }
362eaf62fffSJeremy L Thompson             }
363eaf62fffSJeremy L Thompson           }
364eaf62fffSJeremy L Thompson         }
3652b730f8bSJeremy L Thompson       }
3662b730f8bSJeremy L Thompson     }
3672b730f8bSJeremy L Thompson   }
3682b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(elem_diag, &elem_diag_array));
3692b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
370eaf62fffSJeremy L Thompson 
371eaf62fffSJeremy L Thompson   // Assemble local operator diagonal
3722b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(diag_rstr, CEED_TRANSPOSE, elem_diag, assembled, request));
373eaf62fffSJeremy L Thompson 
374eaf62fffSJeremy L Thompson   // Cleanup
375eaf62fffSJeremy L Thompson   if (is_pointblock) {
3762b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&diag_rstr));
377eaf62fffSJeremy L Thompson   }
3782b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
3792b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_diag));
3802b730f8bSJeremy L Thompson   CeedCall(CeedFree(&identity));
381eaf62fffSJeremy L Thompson 
382eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
383eaf62fffSJeremy L Thompson }
384eaf62fffSJeremy L Thompson 
385eaf62fffSJeremy L Thompson /**
386eaf62fffSJeremy L Thompson   @brief Core logic for assembling composite operator diagonal
387eaf62fffSJeremy L Thompson 
388eaf62fffSJeremy L Thompson   @param[in]  op            CeedOperator to assemble point block diagonal
389ea61e9acSJeremy L Thompson   @param[in]  request       Address of CeedRequest for non-blocking completion, else CEED_REQUEST_IMMEDIATE
390eaf62fffSJeremy L Thompson   @param[in]  is_pointblock Boolean flag to assemble diagonal or point block diagonal
391eaf62fffSJeremy L Thompson   @param[out] assembled     CeedVector to store assembled diagonal
392eaf62fffSJeremy L Thompson 
393eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
394eaf62fffSJeremy L Thompson 
395eaf62fffSJeremy L Thompson   @ref Developer
396eaf62fffSJeremy L Thompson **/
3972b730f8bSJeremy L Thompson static inline int CeedCompositeOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedRequest *request, const bool is_pointblock,
398eaf62fffSJeremy L Thompson                                                                  CeedVector assembled) {
399eaf62fffSJeremy L Thompson   CeedInt       num_sub;
400eaf62fffSJeremy L Thompson   CeedOperator *suboperators;
401c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub));
402c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &suboperators));
403eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_sub; i++) {
4046aa95790SJeremy L Thompson     if (is_pointblock) {
4052b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(suboperators[i], assembled, request));
4066aa95790SJeremy L Thompson     } else {
4072b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(suboperators[i], assembled, request));
4086aa95790SJeremy L Thompson     }
409eaf62fffSJeremy L Thompson   }
410eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
411eaf62fffSJeremy L Thompson }
412eaf62fffSJeremy L Thompson 
413eaf62fffSJeremy L Thompson /**
414eaf62fffSJeremy L Thompson   @brief Build nonzero pattern for non-composite operator
415eaf62fffSJeremy L Thompson 
416eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssembleSymbolic()
417eaf62fffSJeremy L Thompson 
418eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble nonzero pattern
419eaf62fffSJeremy L Thompson   @param[in]  offset Offset for number of entries
420eaf62fffSJeremy L Thompson   @param[out] rows   Row number for each entry
421eaf62fffSJeremy L Thompson   @param[out] cols   Column number for each entry
422eaf62fffSJeremy L Thompson 
423eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
424eaf62fffSJeremy L Thompson 
425eaf62fffSJeremy L Thompson   @ref Developer
426eaf62fffSJeremy L Thompson **/
4272b730f8bSJeremy L Thompson static int CeedSingleOperatorAssembleSymbolic(CeedOperator op, CeedInt offset, CeedInt *rows, CeedInt *cols) {
428*f3d47e36SJeremy L Thompson   Ceed ceed;
429*f3d47e36SJeremy L Thompson   bool is_composite;
430*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
431*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
432*f3d47e36SJeremy L Thompson 
4332b730f8bSJeremy L Thompson   if (op->is_composite) {
434eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
4352b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
436eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
4372b730f8bSJeremy L Thompson   }
438eaf62fffSJeremy L Thompson 
439c9366a6bSJeremy L Thompson   CeedSize num_nodes;
4402b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &num_nodes, NULL));
441eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_in;
4422b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr_in));
443e79b91d9SJeremy L Thompson   CeedInt num_elem, elem_size, num_comp;
4442b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr_in, &num_elem));
4452b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr_in, &elem_size));
4462b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr_in, &num_comp));
447eaf62fffSJeremy L Thompson   CeedInt layout_er[3];
4482b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_in, &layout_er));
449eaf62fffSJeremy L Thompson 
450eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
451eaf62fffSJeremy L Thompson 
452eaf62fffSJeremy L Thompson   // Determine elem_dof relation
453eaf62fffSJeremy L Thompson   CeedVector index_vec;
4542b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_nodes, &index_vec));
455eaf62fffSJeremy L Thompson   CeedScalar *array;
4562b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(index_vec, CEED_MEM_HOST, &array));
457ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_nodes; i++) array[i] = i;
4582b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(index_vec, &array));
459eaf62fffSJeremy L Thompson   CeedVector elem_dof;
4602b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, num_elem * elem_size * num_comp, &elem_dof));
4612b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(elem_dof, 0.0));
4622b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_in, CEED_NOTRANSPOSE, index_vec, elem_dof, CEED_REQUEST_IMMEDIATE));
463eaf62fffSJeremy L Thompson   const CeedScalar *elem_dof_a;
4642b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(elem_dof, CEED_MEM_HOST, &elem_dof_a));
4652b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&index_vec));
466eaf62fffSJeremy L Thompson 
467eaf62fffSJeremy L Thompson   // Determine i, j locations for element matrices
468eaf62fffSJeremy L Thompson   CeedInt count = 0;
469ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
470ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
471ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
472ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
473ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
4742b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_row = i * layout_er[0] + (comp_out)*layout_er[1] + e * layout_er[2];
4752b730f8bSJeremy L Thompson             const CeedInt elem_dof_index_col = j * layout_er[0] + comp_in * layout_er[1] + e * layout_er[2];
476eaf62fffSJeremy L Thompson 
477eaf62fffSJeremy L Thompson             const CeedInt row = elem_dof_a[elem_dof_index_row];
478eaf62fffSJeremy L Thompson             const CeedInt col = elem_dof_a[elem_dof_index_col];
479eaf62fffSJeremy L Thompson 
480eaf62fffSJeremy L Thompson             rows[offset + count] = row;
481eaf62fffSJeremy L Thompson             cols[offset + count] = col;
482eaf62fffSJeremy L Thompson             count++;
483eaf62fffSJeremy L Thompson           }
484eaf62fffSJeremy L Thompson         }
485eaf62fffSJeremy L Thompson       }
486eaf62fffSJeremy L Thompson     }
487eaf62fffSJeremy L Thompson   }
4882b730f8bSJeremy L Thompson   if (count != local_num_entries) {
489eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
490eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing assembled entries");
491eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
4922b730f8bSJeremy L Thompson   }
4932b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(elem_dof, &elem_dof_a));
4942b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&elem_dof));
495eaf62fffSJeremy L Thompson 
496eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
497eaf62fffSJeremy L Thompson }
498eaf62fffSJeremy L Thompson 
499eaf62fffSJeremy L Thompson /**
500eaf62fffSJeremy L Thompson   @brief Assemble nonzero entries for non-composite operator
501eaf62fffSJeremy L Thompson 
502eaf62fffSJeremy L Thompson   Users should generally use CeedOperatorLinearAssemble()
503eaf62fffSJeremy L Thompson 
504eaf62fffSJeremy L Thompson   @param[in]  op     CeedOperator to assemble
505ea61e9acSJeremy L Thompson   @param[in]  offset Offset for number of entries
506eaf62fffSJeremy L Thompson   @param[out] values Values to assemble into matrix
507eaf62fffSJeremy L Thompson 
508eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
509eaf62fffSJeremy L Thompson 
510eaf62fffSJeremy L Thompson   @ref Developer
511eaf62fffSJeremy L Thompson **/
5122b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemble(CeedOperator op, CeedInt offset, CeedVector values) {
513*f3d47e36SJeremy L Thompson   Ceed ceed;
514*f3d47e36SJeremy L Thompson   bool is_composite;
515*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
516*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
517*f3d47e36SJeremy L Thompson 
518*f3d47e36SJeremy L Thompson   if (is_composite) {
519eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
5202b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
521eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
5222b730f8bSJeremy L Thompson   }
523*f3d47e36SJeremy L Thompson 
524*f3d47e36SJeremy L Thompson   // Early exit for empty operator
525*f3d47e36SJeremy L Thompson   {
526*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
527*f3d47e36SJeremy L Thompson 
528*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
529*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
530*f3d47e36SJeremy L Thompson   }
531eaf62fffSJeremy L Thompson 
532cefa2673SJeremy L Thompson   if (op->LinearAssembleSingle) {
533cefa2673SJeremy L Thompson     // Backend version
5342b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSingle(op, offset, values));
535cefa2673SJeremy L Thompson     return CEED_ERROR_SUCCESS;
536cefa2673SJeremy L Thompson   } else {
537cefa2673SJeremy L Thompson     // Operator fallback
538cefa2673SJeremy L Thompson     CeedOperator op_fallback;
539cefa2673SJeremy L Thompson 
5402b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
541cefa2673SJeremy L Thompson     if (op_fallback) {
5422b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(op_fallback, offset, values));
543cefa2673SJeremy L Thompson       return CEED_ERROR_SUCCESS;
544cefa2673SJeremy L Thompson     }
545cefa2673SJeremy L Thompson   }
546cefa2673SJeremy L Thompson 
547eaf62fffSJeremy L Thompson   // Assemble QFunction
548eaf62fffSJeremy L Thompson   CeedQFunction qf;
5492b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
550eaf62fffSJeremy L Thompson   CeedVector          assembled_qf;
551eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_q;
5522b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled_qf, &rstr_q, CEED_REQUEST_IMMEDIATE));
5531f9221feSJeremy L Thompson   CeedSize qf_length;
5542b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetLength(assembled_qf, &qf_length));
555eaf62fffSJeremy L Thompson 
5567e7773b5SJeremy L Thompson   CeedInt            num_input_fields, num_output_fields;
557eaf62fffSJeremy L Thompson   CeedOperatorField *input_fields;
558eaf62fffSJeremy L Thompson   CeedOperatorField *output_fields;
5592b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &input_fields, &num_output_fields, &output_fields));
560eaf62fffSJeremy L Thompson 
561ed9e99e6SJeremy L Thompson   // Get assembly data
562ed9e99e6SJeremy L Thompson   CeedOperatorAssemblyData data;
5632b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetOperatorAssemblyData(op, &data));
564ed9e99e6SJeremy L Thompson   const CeedEvalMode *eval_mode_in, *eval_mode_out;
565ed9e99e6SJeremy L Thompson   CeedInt             num_eval_mode_in, num_eval_mode_out;
5662b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetEvalModes(data, &num_eval_mode_in, &eval_mode_in, &num_eval_mode_out, &eval_mode_out));
567ed9e99e6SJeremy L Thompson   CeedBasis basis_in, basis_out;
5682b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, &basis_in, NULL, &basis_out, NULL));
569eaf62fffSJeremy L Thompson 
5702b730f8bSJeremy L Thompson   if (num_eval_mode_in == 0 || num_eval_mode_out == 0) {
571eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
5722b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Cannot assemble operator with out inputs/outputs");
573eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
5742b730f8bSJeremy L Thompson   }
575eaf62fffSJeremy L Thompson 
576ed9e99e6SJeremy L Thompson   CeedElemRestriction active_rstr;
577eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_qpts, num_comp;
5782b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &active_rstr));
5792b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(active_rstr, &num_elem));
5802b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(active_rstr, &elem_size));
5812b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(active_rstr, &num_comp));
5822b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_in, &num_qpts));
583eaf62fffSJeremy L Thompson 
584eaf62fffSJeremy L Thompson   CeedInt local_num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
585eaf62fffSJeremy L Thompson 
586eaf62fffSJeremy L Thompson   // loop over elements and put in data structure
587eaf62fffSJeremy L Thompson   const CeedScalar *interp_in, *grad_in;
5882b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp(basis_in, &interp_in));
5892b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad(basis_in, &grad_in));
590eaf62fffSJeremy L Thompson 
591eaf62fffSJeremy L Thompson   const CeedScalar *assembled_qf_array;
5922b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled_qf, CEED_MEM_HOST, &assembled_qf_array));
593eaf62fffSJeremy L Thompson 
594eaf62fffSJeremy L Thompson   CeedInt layout_qf[3];
5952b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_q, &layout_qf));
5962b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_q));
597eaf62fffSJeremy L Thompson 
598eaf62fffSJeremy L Thompson   // we store B_mat_in, B_mat_out, BTD, elem_mat in row-major order
599ed9e99e6SJeremy L Thompson   const CeedScalar *B_mat_in, *B_mat_out;
6002b730f8bSJeremy L Thompson   CeedCall(CeedOperatorAssemblyDataGetBases(data, NULL, &B_mat_in, NULL, &B_mat_out));
601ed9e99e6SJeremy L Thompson   CeedScalar  BTD_mat[elem_size * num_qpts * num_eval_mode_in];
602eaf62fffSJeremy L Thompson   CeedScalar  elem_mat[elem_size * elem_size];
60392ae7e47SJeremy L Thompson   CeedInt     count = 0;
604eaf62fffSJeremy L Thompson   CeedScalar *vals;
6052b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(values, CEED_MEM_HOST, &vals));
606ed9e99e6SJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
607ed9e99e6SJeremy L Thompson     for (CeedInt comp_in = 0; comp_in < num_comp; comp_in++) {
608ed9e99e6SJeremy L Thompson       for (CeedInt comp_out = 0; comp_out < num_comp; comp_out++) {
609ed9e99e6SJeremy L Thompson         // Compute B^T*D
610ed9e99e6SJeremy L Thompson         for (CeedInt n = 0; n < elem_size; n++) {
611ed9e99e6SJeremy L Thompson           for (CeedInt q = 0; q < num_qpts; q++) {
612ed9e99e6SJeremy L Thompson             for (CeedInt e_in = 0; e_in < num_eval_mode_in; e_in++) {
6132b730f8bSJeremy L Thompson               const CeedInt btd_index = n * (num_qpts * num_eval_mode_in) + (num_eval_mode_in * q + e_in);
614067fd99fSJeremy L Thompson               CeedScalar    sum       = 0.0;
615067fd99fSJeremy L Thompson               for (CeedInt e_out = 0; e_out < num_eval_mode_out; e_out++) {
616ed9e99e6SJeremy L Thompson                 const CeedInt b_out_index     = (num_eval_mode_out * q + e_out) * elem_size + n;
6172b730f8bSJeremy L Thompson                 const CeedInt eval_mode_index = ((e_in * num_comp + comp_in) * num_eval_mode_out + e_out) * num_comp + comp_out;
6182b730f8bSJeremy L Thompson                 const CeedInt qf_index        = q * layout_qf[0] + eval_mode_index * layout_qf[1] + e * layout_qf[2];
619067fd99fSJeremy L Thompson                 sum += B_mat_out[b_out_index] * assembled_qf_array[qf_index];
620eaf62fffSJeremy L Thompson               }
621067fd99fSJeremy L Thompson               BTD_mat[btd_index] = sum;
622ed9e99e6SJeremy L Thompson             }
623ed9e99e6SJeremy L Thompson           }
624eaf62fffSJeremy L Thompson         }
625eaf62fffSJeremy L Thompson         // form element matrix itself (for each block component)
6262b730f8bSJeremy L Thompson         CeedCall(CeedMatrixMatrixMultiply(ceed, BTD_mat, B_mat_in, elem_mat, elem_size, elem_size, num_qpts * num_eval_mode_in));
627eaf62fffSJeremy L Thompson 
628eaf62fffSJeremy L Thompson         // put element matrix in coordinate data structure
629ed9e99e6SJeremy L Thompson         for (CeedInt i = 0; i < elem_size; i++) {
630ed9e99e6SJeremy L Thompson           for (CeedInt j = 0; j < elem_size; j++) {
631eaf62fffSJeremy L Thompson             vals[offset + count] = elem_mat[i * elem_size + j];
632eaf62fffSJeremy L Thompson             count++;
633eaf62fffSJeremy L Thompson           }
634eaf62fffSJeremy L Thompson         }
635eaf62fffSJeremy L Thompson       }
636eaf62fffSJeremy L Thompson     }
637eaf62fffSJeremy L Thompson   }
6382b730f8bSJeremy L Thompson   if (count != local_num_entries) {
639eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
640eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_MAJOR, "Error computing entries");
641eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
6422b730f8bSJeremy L Thompson   }
6432b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(values, &vals));
644eaf62fffSJeremy L Thompson 
6452b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled_qf, &assembled_qf_array));
6462b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled_qf));
647eaf62fffSJeremy L Thompson 
648eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
649eaf62fffSJeremy L Thompson }
650eaf62fffSJeremy L Thompson 
651eaf62fffSJeremy L Thompson /**
652eaf62fffSJeremy L Thompson   @brief Count number of entries for assembled CeedOperator
653eaf62fffSJeremy L Thompson 
654eaf62fffSJeremy L Thompson   @param[in]  op          CeedOperator to assemble
655eaf62fffSJeremy L Thompson   @param[out] num_entries Number of entries in assembled representation
656eaf62fffSJeremy L Thompson 
657eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
658eaf62fffSJeremy L Thompson 
659eaf62fffSJeremy L Thompson   @ref Utility
660eaf62fffSJeremy L Thompson **/
6612b730f8bSJeremy L Thompson static int CeedSingleOperatorAssemblyCountEntries(CeedOperator op, CeedInt *num_entries) {
662eaf62fffSJeremy L Thompson   CeedElemRestriction rstr;
663eaf62fffSJeremy L Thompson   CeedInt             num_elem, elem_size, num_comp;
664eaf62fffSJeremy L Thompson 
6652b730f8bSJeremy L Thompson   if (op->is_composite) {
666eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
6672b730f8bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Composite operator not supported");
668eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
6692b730f8bSJeremy L Thompson   }
6702b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveElemRestriction(op, &rstr));
6712b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
6722b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr, &elem_size));
6732b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumComponents(rstr, &num_comp));
674eaf62fffSJeremy L Thompson   *num_entries = elem_size * num_comp * elem_size * num_comp * num_elem;
675eaf62fffSJeremy L Thompson 
676eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
677eaf62fffSJeremy L Thompson }
678eaf62fffSJeremy L Thompson 
679eaf62fffSJeremy L Thompson /**
680ea61e9acSJeremy L Thompson   @brief Common code for creating a multigrid coarse operator and level transfer operators for a CeedOperator
681eaf62fffSJeremy L Thompson 
682eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
683eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter
684eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
685eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
686eaf62fffSJeremy L Thompson   @param[in]  basis_c_to_f Basis for coarse to fine interpolation
687eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
688eaf62fffSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator
689eaf62fffSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator
690eaf62fffSJeremy L Thompson 
691eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
692eaf62fffSJeremy L Thompson 
693eaf62fffSJeremy L Thompson   @ref Developer
694eaf62fffSJeremy L Thompson **/
6952b730f8bSJeremy L Thompson static int CeedSingleOperatorMultigridLevel(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
6962b730f8bSJeremy L Thompson                                             CeedBasis basis_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
697eaf62fffSJeremy L Thompson   Ceed ceed;
6982b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
699eaf62fffSJeremy L Thompson 
700eaf62fffSJeremy L Thompson   // Check for composite operator
701eaf62fffSJeremy L Thompson   bool is_composite;
7022b730f8bSJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op_fine, &is_composite));
7032b730f8bSJeremy L Thompson   if (is_composite) {
704eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
7052b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_UNSUPPORTED, "Automatic multigrid setup for composite operators not supported");
706eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
7072b730f8bSJeremy L Thompson   }
708eaf62fffSJeremy L Thompson 
709eaf62fffSJeremy L Thompson   // Coarse Grid
7102b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, op_fine->qf, op_fine->dqf, op_fine->dqfT, op_coarse));
711eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_fine = NULL;
712eaf62fffSJeremy L Thompson   // -- Clone input fields
71392ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_input_fields; i++) {
714eaf62fffSJeremy L Thompson     if (op_fine->input_fields[i]->vec == CEED_VECTOR_ACTIVE) {
715eaf62fffSJeremy L Thompson       rstr_fine = op_fine->input_fields[i]->elem_restr;
7162b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
717eaf62fffSJeremy L Thompson     } else {
7182b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->input_fields[i]->field_name, op_fine->input_fields[i]->elem_restr,
7192b730f8bSJeremy L Thompson                                     op_fine->input_fields[i]->basis, op_fine->input_fields[i]->vec));
720eaf62fffSJeremy L Thompson     }
721eaf62fffSJeremy L Thompson   }
722eaf62fffSJeremy L Thompson   // -- Clone output fields
72392ae7e47SJeremy L Thompson   for (CeedInt i = 0; i < op_fine->qf->num_output_fields; i++) {
724eaf62fffSJeremy L Thompson     if (op_fine->output_fields[i]->vec == CEED_VECTOR_ACTIVE) {
7252b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, rstr_coarse, basis_coarse, CEED_VECTOR_ACTIVE));
726eaf62fffSJeremy L Thompson     } else {
7272b730f8bSJeremy L Thompson       CeedCall(CeedOperatorSetField(*op_coarse, op_fine->output_fields[i]->field_name, op_fine->output_fields[i]->elem_restr,
7282b730f8bSJeremy L Thompson                                     op_fine->output_fields[i]->basis, op_fine->output_fields[i]->vec));
729eaf62fffSJeremy L Thompson     }
730eaf62fffSJeremy L Thompson   }
731af99e877SJeremy L Thompson   // -- Clone QFunctionAssemblyData
7322b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReferenceCopy(op_fine->qf_assembled, &(*op_coarse)->qf_assembled));
733eaf62fffSJeremy L Thompson 
734eaf62fffSJeremy L Thompson   // Multiplicity vector
735eaf62fffSJeremy L Thompson   CeedVector mult_vec, mult_e_vec;
7362b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateVector(rstr_fine, &mult_vec, &mult_e_vec));
7372b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(mult_e_vec, 0.0));
7382b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_NOTRANSPOSE, p_mult_fine, mult_e_vec, CEED_REQUEST_IMMEDIATE));
7392b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(mult_vec, 0.0));
7402b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionApply(rstr_fine, CEED_TRANSPOSE, mult_e_vec, mult_vec, CEED_REQUEST_IMMEDIATE));
7412b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_e_vec));
7422b730f8bSJeremy L Thompson   CeedCall(CeedVectorReciprocal(mult_vec));
743eaf62fffSJeremy L Thompson 
744eaf62fffSJeremy L Thompson   // Restriction
745eaf62fffSJeremy L Thompson   CeedInt num_comp;
7462b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_coarse, &num_comp));
747eaf62fffSJeremy L Thompson   CeedQFunction qf_restrict;
7482b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_restrict));
749eaf62fffSJeremy L Thompson   CeedInt *num_comp_r_data;
7502b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, &num_comp_r_data));
751eaf62fffSJeremy L Thompson   num_comp_r_data[0] = num_comp;
752eaf62fffSJeremy L Thompson   CeedQFunctionContext ctx_r;
7532b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextCreate(ceed, &ctx_r));
7542b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextSetData(ctx_r, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_r_data), num_comp_r_data));
7552b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_restrict, ctx_r));
7562b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_r));
7572b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_restrict, "input", num_comp, CEED_EVAL_NONE));
7582b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_restrict, "scale", num_comp, CEED_EVAL_NONE));
7592b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_restrict, "output", num_comp, CEED_EVAL_INTERP));
7602b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_restrict, num_comp));
761eaf62fffSJeremy L Thompson 
7622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, qf_restrict, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_restrict));
7632b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_restrict, "input", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
7642b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_restrict, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec));
7652b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_restrict, "output", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
766eaf62fffSJeremy L Thompson 
767eaf62fffSJeremy L Thompson   // Prolongation
768eaf62fffSJeremy L Thompson   CeedQFunction qf_prolong;
7692b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed, "Scale", &qf_prolong));
770eaf62fffSJeremy L Thompson   CeedInt *num_comp_p_data;
7712b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, &num_comp_p_data));
772eaf62fffSJeremy L Thompson   num_comp_p_data[0] = num_comp;
773eaf62fffSJeremy L Thompson   CeedQFunctionContext ctx_p;
7742b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextCreate(ceed, &ctx_p));
7752b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextSetData(ctx_p, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_p_data), num_comp_p_data));
7762b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_prolong, ctx_p));
7772b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_p));
7782b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_prolong, "input", num_comp, CEED_EVAL_INTERP));
7792b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_prolong, "scale", num_comp, CEED_EVAL_NONE));
7802b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_prolong, "output", num_comp, CEED_EVAL_NONE));
7812b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_prolong, num_comp));
782eaf62fffSJeremy L Thompson 
7832b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed, qf_prolong, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE, op_prolong));
7842b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_prolong, "input", rstr_coarse, basis_c_to_f, CEED_VECTOR_ACTIVE));
7852b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_prolong, "scale", rstr_fine, CEED_BASIS_COLLOCATED, mult_vec));
7862b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*op_prolong, "output", rstr_fine, CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE));
787eaf62fffSJeremy L Thompson 
788ea6b5821SJeremy L Thompson   // Clone name
789ea6b5821SJeremy L Thompson   bool   has_name = op_fine->name;
790ea6b5821SJeremy L Thompson   size_t name_len = op_fine->name ? strlen(op_fine->name) : 0;
7912b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetName(*op_coarse, op_fine->name));
792ea6b5821SJeremy L Thompson   {
793ea6b5821SJeremy L Thompson     char *prolongation_name;
7942b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(18 + name_len, &prolongation_name));
7952b730f8bSJeremy L Thompson     sprintf(prolongation_name, "prolongation%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
7962b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_prolong, prolongation_name));
7972b730f8bSJeremy L Thompson     CeedCall(CeedFree(&prolongation_name));
798ea6b5821SJeremy L Thompson   }
799ea6b5821SJeremy L Thompson   {
800ea6b5821SJeremy L Thompson     char *restriction_name;
8012b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(17 + name_len, &restriction_name));
8022b730f8bSJeremy L Thompson     sprintf(restriction_name, "restriction%s%s", has_name ? " for " : "", has_name ? op_fine->name : "");
8032b730f8bSJeremy L Thompson     CeedCall(CeedOperatorSetName(*op_restrict, restriction_name));
8042b730f8bSJeremy L Thompson     CeedCall(CeedFree(&restriction_name));
805ea6b5821SJeremy L Thompson   }
806ea6b5821SJeremy L Thompson 
80758e4b056SJeremy L Thompson   // Check
80858e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_coarse));
80958e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_prolong));
81058e4b056SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(*op_restrict));
81158e4b056SJeremy L Thompson 
812eaf62fffSJeremy L Thompson   // Cleanup
8132b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&mult_vec));
8142b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&basis_c_to_f));
8152b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_restrict));
8162b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_prolong));
817805fe78eSJeremy L Thompson 
818eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
819eaf62fffSJeremy L Thompson }
820eaf62fffSJeremy L Thompson 
821eaf62fffSJeremy L Thompson /**
822eaf62fffSJeremy L Thompson   @brief Build 1D mass matrix and Laplacian with perturbation
823eaf62fffSJeremy L Thompson 
824eaf62fffSJeremy L Thompson   @param[in]  interp_1d   Interpolation matrix in one dimension
825eaf62fffSJeremy L Thompson   @param[in]  grad_1d     Gradient matrix in one dimension
826eaf62fffSJeremy L Thompson   @param[in]  q_weight_1d Quadrature weights in one dimension
827eaf62fffSJeremy L Thompson   @param[in]  P_1d        Number of basis nodes in one dimension
828eaf62fffSJeremy L Thompson   @param[in]  Q_1d        Number of quadrature points in one dimension
829eaf62fffSJeremy L Thompson   @param[in]  dim         Dimension of basis
830eaf62fffSJeremy L Thompson   @param[out] mass        Assembled mass matrix in one dimension
831eaf62fffSJeremy L Thompson   @param[out] laplace     Assembled perturbed Laplacian in one dimension
832eaf62fffSJeremy L Thompson 
833eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
834eaf62fffSJeremy L Thompson 
835eaf62fffSJeremy L Thompson   @ref Developer
836eaf62fffSJeremy L Thompson **/
8372b730f8bSJeremy L Thompson CeedPragmaOptimizeOff static int CeedBuildMassLaplace(const CeedScalar *interp_1d, const CeedScalar *grad_1d, const CeedScalar *q_weight_1d,
8382b730f8bSJeremy L Thompson                                                       CeedInt P_1d, CeedInt Q_1d, CeedInt dim, CeedScalar *mass, CeedScalar *laplace) {
8392b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
840eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
841eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8422b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += interp_1d[k * P_1d + i] * q_weight_1d[k] * interp_1d[k * P_1d + j];
843eaf62fffSJeremy L Thompson       mass[i + j * P_1d] = sum;
844eaf62fffSJeremy L Thompson     }
8452b730f8bSJeremy L Thompson   }
846eaf62fffSJeremy L Thompson   // -- Laplacian
8472b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
848eaf62fffSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) {
849eaf62fffSJeremy L Thompson       CeedScalar sum = 0.0;
8502b730f8bSJeremy L Thompson       for (CeedInt k = 0; k < Q_1d; k++) sum += grad_1d[k * P_1d + i] * q_weight_1d[k] * grad_1d[k * P_1d + j];
851eaf62fffSJeremy L Thompson       laplace[i + j * P_1d] = sum;
852eaf62fffSJeremy L Thompson     }
8532b730f8bSJeremy L Thompson   }
854eaf62fffSJeremy L Thompson   CeedScalar perturbation = dim > 2 ? 1e-6 : 1e-4;
8552b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) laplace[i + P_1d * i] += perturbation;
856eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
857eaf62fffSJeremy L Thompson }
858ea61e9acSJeremy L Thompson CeedPragmaOptimizeOn;
859eaf62fffSJeremy L Thompson 
860eaf62fffSJeremy L Thompson /// @}
861eaf62fffSJeremy L Thompson 
862eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
863480fae85SJeremy L Thompson /// CeedOperator Backend API
864480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
865480fae85SJeremy L Thompson /// @addtogroup CeedOperatorBackend
866480fae85SJeremy L Thompson /// @{
867480fae85SJeremy L Thompson 
868480fae85SJeremy L Thompson /**
869480fae85SJeremy L Thompson   @brief Create object holding CeedQFunction assembly data for CeedOperator
870480fae85SJeremy L Thompson 
871480fae85SJeremy L Thompson   @param[in]  ceed A Ceed object where the CeedQFunctionAssemblyData will be created
872ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedQFunctionAssemblyData will be stored
873480fae85SJeremy L Thompson 
874480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
875480fae85SJeremy L Thompson 
876480fae85SJeremy L Thompson   @ref Backend
877480fae85SJeremy L Thompson **/
878ea61e9acSJeremy L Thompson int CeedQFunctionAssemblyDataCreate(Ceed ceed, CeedQFunctionAssemblyData *data) {
8792b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
880480fae85SJeremy L Thompson   (*data)->ref_count = 1;
881480fae85SJeremy L Thompson   (*data)->ceed      = ceed;
8822b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
883480fae85SJeremy L Thompson 
884480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
885480fae85SJeremy L Thompson }
886480fae85SJeremy L Thompson 
887480fae85SJeremy L Thompson /**
888480fae85SJeremy L Thompson   @brief Increment the reference counter for a CeedQFunctionAssemblyData
889480fae85SJeremy L Thompson 
890ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to increment the reference counter
891480fae85SJeremy L Thompson 
892480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
893480fae85SJeremy L Thompson 
894480fae85SJeremy L Thompson   @ref Backend
895480fae85SJeremy L Thompson **/
896480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataReference(CeedQFunctionAssemblyData data) {
897480fae85SJeremy L Thompson   data->ref_count++;
898480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
899480fae85SJeremy L Thompson }
900480fae85SJeremy L Thompson 
901480fae85SJeremy L Thompson /**
902beecbf24SJeremy L Thompson   @brief Set re-use of CeedQFunctionAssemblyData
9038b919e6bSJeremy L Thompson 
904ea61e9acSJeremy L Thompson   @param[in,out] data       CeedQFunctionAssemblyData to mark for reuse
905ea61e9acSJeremy L Thompson   @param[in]     reuse_data Boolean flag indicating data re-use
9068b919e6bSJeremy L Thompson 
9078b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9088b919e6bSJeremy L Thompson 
9098b919e6bSJeremy L Thompson   @ref Backend
9108b919e6bSJeremy L Thompson **/
9112b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetReuse(CeedQFunctionAssemblyData data, bool reuse_data) {
912beecbf24SJeremy L Thompson   data->reuse_data        = reuse_data;
913beecbf24SJeremy L Thompson   data->needs_data_update = true;
914beecbf24SJeremy L Thompson   return CEED_ERROR_SUCCESS;
915beecbf24SJeremy L Thompson }
916beecbf24SJeremy L Thompson 
917beecbf24SJeremy L Thompson /**
918beecbf24SJeremy L Thompson   @brief Mark QFunctionAssemblyData as stale
919beecbf24SJeremy L Thompson 
920ea61e9acSJeremy L Thompson   @param[in,out] data              CeedQFunctionAssemblyData to mark as stale
921ea61e9acSJeremy L Thompson   @param[in]     needs_data_update Boolean flag indicating if update is needed or completed
922beecbf24SJeremy L Thompson 
923beecbf24SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
924beecbf24SJeremy L Thompson 
925beecbf24SJeremy L Thompson   @ref Backend
926beecbf24SJeremy L Thompson **/
9272b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetUpdateNeeded(CeedQFunctionAssemblyData data, bool needs_data_update) {
928beecbf24SJeremy L Thompson   data->needs_data_update = needs_data_update;
9298b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9308b919e6bSJeremy L Thompson }
9318b919e6bSJeremy L Thompson 
9328b919e6bSJeremy L Thompson /**
9338b919e6bSJeremy L Thompson   @brief Determine if QFunctionAssemblyData needs update
9348b919e6bSJeremy L Thompson 
9358b919e6bSJeremy L Thompson   @param[in]  data             CeedQFunctionAssemblyData to mark as stale
9368b919e6bSJeremy L Thompson   @param[out] is_update_needed Boolean flag indicating if re-assembly is required
9378b919e6bSJeremy L Thompson 
9388b919e6bSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
9398b919e6bSJeremy L Thompson 
9408b919e6bSJeremy L Thompson   @ref Backend
9418b919e6bSJeremy L Thompson **/
9422b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsUpdateNeeded(CeedQFunctionAssemblyData data, bool *is_update_needed) {
943beecbf24SJeremy L Thompson   *is_update_needed = !data->reuse_data || data->needs_data_update;
9448b919e6bSJeremy L Thompson   return CEED_ERROR_SUCCESS;
9458b919e6bSJeremy L Thompson }
9468b919e6bSJeremy L Thompson 
9478b919e6bSJeremy L Thompson /**
948ea61e9acSJeremy L Thompson   @brief Copy the pointer to a CeedQFunctionAssemblyData.
949ea61e9acSJeremy L Thompson            Both pointers should be destroyed with `CeedCeedQFunctionAssemblyDataDestroy()`.
950ea61e9acSJeremy L Thompson            Note: If `*data_copy` is non-NULL, then it is assumed that `*data_copy` is a pointer to a CeedQFunctionAssemblyData.
951ea61e9acSJeremy L Thompson              This CeedQFunctionAssemblyData will be destroyed if `*data_copy` is the only reference to this CeedQFunctionAssemblyData.
952480fae85SJeremy L Thompson 
953ea61e9acSJeremy L Thompson   @param[in]     data      CeedQFunctionAssemblyData to copy reference to
954ea61e9acSJeremy L Thompson   @param[in,out] data_copy Variable to store copied reference
955480fae85SJeremy L Thompson 
956480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
957480fae85SJeremy L Thompson 
958480fae85SJeremy L Thompson   @ref Backend
959480fae85SJeremy L Thompson **/
9602b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataReferenceCopy(CeedQFunctionAssemblyData data, CeedQFunctionAssemblyData *data_copy) {
9612b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataReference(data));
9622b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAssemblyDataDestroy(data_copy));
963480fae85SJeremy L Thompson   *data_copy = data;
964480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
965480fae85SJeremy L Thompson }
966480fae85SJeremy L Thompson 
967480fae85SJeremy L Thompson /**
968480fae85SJeremy L Thompson   @brief Get setup status for internal objects for CeedQFunctionAssemblyData
969480fae85SJeremy L Thompson 
970ea61e9acSJeremy L Thompson   @param[in]  data     CeedQFunctionAssemblyData to retrieve status
971480fae85SJeremy L Thompson   @param[out] is_setup Boolean flag for setup status
972480fae85SJeremy L Thompson 
973480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
974480fae85SJeremy L Thompson 
975480fae85SJeremy L Thompson   @ref Backend
976480fae85SJeremy L Thompson **/
9772b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataIsSetup(CeedQFunctionAssemblyData data, bool *is_setup) {
978480fae85SJeremy L Thompson   *is_setup = data->is_setup;
979480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
980480fae85SJeremy L Thompson }
981480fae85SJeremy L Thompson 
982480fae85SJeremy L Thompson /**
983480fae85SJeremy L Thompson   @brief Set internal objects for CeedQFunctionAssemblyData
984480fae85SJeremy L Thompson 
985ea61e9acSJeremy L Thompson   @param[in,out] data CeedQFunctionAssemblyData to set objects
986480fae85SJeremy L Thompson   @param[in]     vec  CeedVector to store assembled CeedQFunction at quadrature points
987480fae85SJeremy L Thompson   @param[in]     rstr CeedElemRestriction for CeedVector containing assembled CeedQFunction
988480fae85SJeremy L Thompson 
989480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
990480fae85SJeremy L Thompson 
991480fae85SJeremy L Thompson   @ref Backend
992480fae85SJeremy L Thompson **/
9932b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataSetObjects(CeedQFunctionAssemblyData data, CeedVector vec, CeedElemRestriction rstr) {
9942b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(vec, &data->vec));
9952b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(rstr, &data->rstr));
996480fae85SJeremy L Thompson 
997480fae85SJeremy L Thompson   data->is_setup = true;
998480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
999480fae85SJeremy L Thompson }
1000480fae85SJeremy L Thompson 
10012b730f8bSJeremy L Thompson int CeedQFunctionAssemblyDataGetObjects(CeedQFunctionAssemblyData data, CeedVector *vec, CeedElemRestriction *rstr) {
10022b730f8bSJeremy L Thompson   if (!data->is_setup) {
1003480fae85SJeremy L Thompson     // LCOV_EXCL_START
10042b730f8bSJeremy L Thompson     return CeedError(data->ceed, CEED_ERROR_INCOMPLETE, "Internal objects not set; must call CeedQFunctionAssemblyDataSetObjects first.");
1005480fae85SJeremy L Thompson     // LCOV_EXCL_STOP
10062b730f8bSJeremy L Thompson   }
1007480fae85SJeremy L Thompson 
10082b730f8bSJeremy L Thompson   CeedCall(CeedVectorReferenceCopy(data->vec, vec));
10092b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionReferenceCopy(data->rstr, rstr));
1010480fae85SJeremy L Thompson 
1011480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1012480fae85SJeremy L Thompson }
1013480fae85SJeremy L Thompson 
1014480fae85SJeremy L Thompson /**
1015480fae85SJeremy L Thompson   @brief Destroy CeedQFunctionAssemblyData
1016480fae85SJeremy L Thompson 
1017ea61e9acSJeremy L Thompson   @param[in,out] data  CeedQFunctionAssemblyData to destroy
1018480fae85SJeremy L Thompson 
1019480fae85SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1020480fae85SJeremy L Thompson 
1021480fae85SJeremy L Thompson   @ref Backend
1022480fae85SJeremy L Thompson **/
1023480fae85SJeremy L Thompson int CeedQFunctionAssemblyDataDestroy(CeedQFunctionAssemblyData *data) {
1024480fae85SJeremy L Thompson   if (!*data || --(*data)->ref_count > 0) return CEED_ERROR_SUCCESS;
1025480fae85SJeremy L Thompson 
10262b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
10272b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&(*data)->vec));
10282b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&(*data)->rstr));
1029480fae85SJeremy L Thompson 
10302b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1031480fae85SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1032480fae85SJeremy L Thompson }
1033480fae85SJeremy L Thompson 
1034ed9e99e6SJeremy L Thompson /**
1035ed9e99e6SJeremy L Thompson   @brief Get CeedOperatorAssemblyData
1036ed9e99e6SJeremy L Thompson 
1037ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to assemble
1038ed9e99e6SJeremy L Thompson   @param[out] data CeedQFunctionAssemblyData
1039ed9e99e6SJeremy L Thompson 
1040ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1041ed9e99e6SJeremy L Thompson 
1042ed9e99e6SJeremy L Thompson   @ref Backend
1043ed9e99e6SJeremy L Thompson **/
10442b730f8bSJeremy L Thompson int CeedOperatorGetOperatorAssemblyData(CeedOperator op, CeedOperatorAssemblyData *data) {
1045ed9e99e6SJeremy L Thompson   if (!op->op_assembled) {
1046ed9e99e6SJeremy L Thompson     CeedOperatorAssemblyData data;
1047ed9e99e6SJeremy L Thompson 
10482b730f8bSJeremy L Thompson     CeedCall(CeedOperatorAssemblyDataCreate(op->ceed, op, &data));
1049ed9e99e6SJeremy L Thompson     op->op_assembled = data;
1050ed9e99e6SJeremy L Thompson   }
1051ed9e99e6SJeremy L Thompson   *data = op->op_assembled;
1052ed9e99e6SJeremy L Thompson 
1053ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1054ed9e99e6SJeremy L Thompson }
1055ed9e99e6SJeremy L Thompson 
1056ed9e99e6SJeremy L Thompson /**
1057ed9e99e6SJeremy L Thompson   @brief Create object holding CeedOperator assembly data
1058ed9e99e6SJeremy L Thompson 
1059ea61e9acSJeremy L Thompson   @param[in]  ceed Ceed object where the CeedOperatorAssemblyData will be created
1060ed9e99e6SJeremy L Thompson   @param[in]  op   CeedOperator to be assembled
1061ea61e9acSJeremy L Thompson   @param[out] data Address of the variable where the newly created CeedOperatorAssemblyData will be stored
1062ed9e99e6SJeremy L Thompson 
1063ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1064ed9e99e6SJeremy L Thompson 
1065ed9e99e6SJeremy L Thompson   @ref Backend
1066ed9e99e6SJeremy L Thompson **/
10672b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataCreate(Ceed ceed, CeedOperator op, CeedOperatorAssemblyData *data) {
10682b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, data));
1069ed9e99e6SJeremy L Thompson   (*data)->ceed = ceed;
10702b730f8bSJeremy L Thompson   CeedCall(CeedReference(ceed));
1071ed9e99e6SJeremy L Thompson 
1072ed9e99e6SJeremy L Thompson   // Build OperatorAssembly data
1073ed9e99e6SJeremy L Thompson   CeedQFunction       qf;
1074ed9e99e6SJeremy L Thompson   CeedQFunctionField *qf_fields;
1075ed9e99e6SJeremy L Thompson   CeedOperatorField  *op_fields;
1076ed9e99e6SJeremy L Thompson   CeedInt             num_input_fields;
10772b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
10782b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, &num_input_fields, &qf_fields, NULL, NULL));
10792b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, &op_fields, NULL, NULL));
1080ed9e99e6SJeremy L Thompson 
1081ed9e99e6SJeremy L Thompson   // Determine active input basis
1082ed9e99e6SJeremy L Thompson   CeedInt       num_eval_mode_in = 0, dim = 1;
1083ed9e99e6SJeremy L Thompson   CeedEvalMode *eval_mode_in = NULL;
1084ed9e99e6SJeremy L Thompson   CeedBasis     basis_in     = NULL;
1085ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
1086ed9e99e6SJeremy L Thompson     CeedVector vec;
10872b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1088ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
10892b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_in));
10902b730f8bSJeremy L Thompson       CeedCall(CeedBasisGetDimension(basis_in, &dim));
1091ed9e99e6SJeremy L Thompson       CeedEvalMode eval_mode;
10922b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1093ed9e99e6SJeremy L Thompson       switch (eval_mode) {
1094ed9e99e6SJeremy L Thompson         case CEED_EVAL_NONE:
1095ed9e99e6SJeremy L Thompson         case CEED_EVAL_INTERP:
10962b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_in + 1, &eval_mode_in));
1097ed9e99e6SJeremy L Thompson           eval_mode_in[num_eval_mode_in] = eval_mode;
1098ed9e99e6SJeremy L Thompson           num_eval_mode_in += 1;
1099ed9e99e6SJeremy L Thompson           break;
1100ed9e99e6SJeremy L Thompson         case CEED_EVAL_GRAD:
11012b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_in + dim, &eval_mode_in));
1102ed9e99e6SJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
1103ed9e99e6SJeremy L Thompson             eval_mode_in[num_eval_mode_in + d] = eval_mode;
1104ed9e99e6SJeremy L Thompson           }
1105ed9e99e6SJeremy L Thompson           num_eval_mode_in += dim;
1106ed9e99e6SJeremy L Thompson           break;
1107ed9e99e6SJeremy L Thompson         case CEED_EVAL_WEIGHT:
1108ed9e99e6SJeremy L Thompson         case CEED_EVAL_DIV:
1109ed9e99e6SJeremy L Thompson         case CEED_EVAL_CURL:
1110ed9e99e6SJeremy L Thompson           break;  // Caught by QF Assembly
1111ed9e99e6SJeremy L Thompson       }
1112ed9e99e6SJeremy L Thompson     }
1113ed9e99e6SJeremy L Thompson   }
1114ed9e99e6SJeremy L Thompson   (*data)->num_eval_mode_in = num_eval_mode_in;
1115ed9e99e6SJeremy L Thompson   (*data)->eval_mode_in     = eval_mode_in;
11162b730f8bSJeremy L Thompson   CeedCall(CeedBasisReferenceCopy(basis_in, &(*data)->basis_in));
1117ed9e99e6SJeremy L Thompson 
1118ed9e99e6SJeremy L Thompson   // Determine active output basis
1119ed9e99e6SJeremy L Thompson   CeedInt num_output_fields;
11202b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, NULL, &num_output_fields, &qf_fields));
11212b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, NULL, NULL, NULL, &op_fields));
1122ed9e99e6SJeremy L Thompson   CeedInt       num_eval_mode_out = 0;
1123ed9e99e6SJeremy L Thompson   CeedEvalMode *eval_mode_out     = NULL;
1124ed9e99e6SJeremy L Thompson   CeedBasis     basis_out         = NULL;
1125ed9e99e6SJeremy L Thompson   for (CeedInt i = 0; i < num_output_fields; i++) {
1126ed9e99e6SJeremy L Thompson     CeedVector vec;
11272b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
1128ed9e99e6SJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
11292b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis_out));
1130ed9e99e6SJeremy L Thompson       CeedEvalMode eval_mode;
11312b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
1132ed9e99e6SJeremy L Thompson       switch (eval_mode) {
1133ed9e99e6SJeremy L Thompson         case CEED_EVAL_NONE:
1134ed9e99e6SJeremy L Thompson         case CEED_EVAL_INTERP:
11352b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_out + 1, &eval_mode_out));
1136ed9e99e6SJeremy L Thompson           eval_mode_out[num_eval_mode_out] = eval_mode;
1137ed9e99e6SJeremy L Thompson           num_eval_mode_out += 1;
1138ed9e99e6SJeremy L Thompson           break;
1139ed9e99e6SJeremy L Thompson         case CEED_EVAL_GRAD:
11402b730f8bSJeremy L Thompson           CeedCall(CeedRealloc(num_eval_mode_out + dim, &eval_mode_out));
1141ed9e99e6SJeremy L Thompson           for (CeedInt d = 0; d < dim; d++) {
1142ed9e99e6SJeremy L Thompson             eval_mode_out[num_eval_mode_out + d] = eval_mode;
1143ed9e99e6SJeremy L Thompson           }
1144ed9e99e6SJeremy L Thompson           num_eval_mode_out += dim;
1145ed9e99e6SJeremy L Thompson           break;
1146ed9e99e6SJeremy L Thompson         case CEED_EVAL_WEIGHT:
1147ed9e99e6SJeremy L Thompson         case CEED_EVAL_DIV:
1148ed9e99e6SJeremy L Thompson         case CEED_EVAL_CURL:
1149ed9e99e6SJeremy L Thompson           break;  // Caught by QF Assembly
1150ed9e99e6SJeremy L Thompson       }
1151ed9e99e6SJeremy L Thompson     }
1152ed9e99e6SJeremy L Thompson   }
1153ed9e99e6SJeremy L Thompson   (*data)->num_eval_mode_out = num_eval_mode_out;
1154ed9e99e6SJeremy L Thompson   (*data)->eval_mode_out     = eval_mode_out;
11552b730f8bSJeremy L Thompson   CeedCall(CeedBasisReferenceCopy(basis_out, &(*data)->basis_out));
1156ed9e99e6SJeremy L Thompson 
1157ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1158ed9e99e6SJeremy L Thompson }
1159ed9e99e6SJeremy L Thompson 
1160ed9e99e6SJeremy L Thompson /**
1161ed9e99e6SJeremy L Thompson   @brief Get CeedOperator CeedEvalModes for assembly
1162ed9e99e6SJeremy L Thompson 
1163ed9e99e6SJeremy L Thompson   @param[in]  data              CeedOperatorAssemblyData
1164ed9e99e6SJeremy L Thompson   @param[out] num_eval_mode_in  Pointer to hold number of input CeedEvalModes, or NULL
1165ed9e99e6SJeremy L Thompson   @param[out] eval_mode_in      Pointer to hold input CeedEvalModes, or NULL
1166ed9e99e6SJeremy L Thompson   @param[out] num_eval_mode_out Pointer to hold number of output CeedEvalModes, or NULL
1167ed9e99e6SJeremy L Thompson   @param[out] eval_mode_out     Pointer to hold output CeedEvalModes, or NULL
1168ed9e99e6SJeremy L Thompson 
1169ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1170ed9e99e6SJeremy L Thompson 
1171ed9e99e6SJeremy L Thompson   @ref Backend
1172ed9e99e6SJeremy L Thompson **/
11732b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetEvalModes(CeedOperatorAssemblyData data, CeedInt *num_eval_mode_in, const CeedEvalMode **eval_mode_in,
1174ed9e99e6SJeremy L Thompson                                          CeedInt *num_eval_mode_out, const CeedEvalMode **eval_mode_out) {
1175ed9e99e6SJeremy L Thompson   if (num_eval_mode_in) *num_eval_mode_in = data->num_eval_mode_in;
1176ed9e99e6SJeremy L Thompson   if (eval_mode_in) *eval_mode_in = data->eval_mode_in;
1177ed9e99e6SJeremy L Thompson   if (num_eval_mode_out) *num_eval_mode_out = data->num_eval_mode_out;
1178ed9e99e6SJeremy L Thompson   if (eval_mode_out) *eval_mode_out = data->eval_mode_out;
1179ed9e99e6SJeremy L Thompson 
1180ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1181ed9e99e6SJeremy L Thompson }
1182ed9e99e6SJeremy L Thompson 
1183ed9e99e6SJeremy L Thompson /**
1184ed9e99e6SJeremy L Thompson   @brief Get CeedOperator CeedBasis data for assembly
1185ed9e99e6SJeremy L Thompson 
1186ed9e99e6SJeremy L Thompson   @param[in]  data      CeedOperatorAssemblyData
1187ed9e99e6SJeremy L Thompson   @param[out] basis_in  Pointer to hold active input CeedBasis, or NULL
1188ed9e99e6SJeremy L Thompson   @param[out] B_in      Pointer to hold assembled active input B, or NULL
1189ed9e99e6SJeremy L Thompson   @param[out] basis_out Pointer to hold active output CeedBasis, or NULL
1190ed9e99e6SJeremy L Thompson   @param[out] B_out     Pointer to hold assembled active output B, or NULL
1191ed9e99e6SJeremy L Thompson 
1192ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1193ed9e99e6SJeremy L Thompson 
1194ed9e99e6SJeremy L Thompson   @ref Backend
1195ed9e99e6SJeremy L Thompson **/
11962b730f8bSJeremy L Thompson int CeedOperatorAssemblyDataGetBases(CeedOperatorAssemblyData data, CeedBasis *basis_in, const CeedScalar **B_in, CeedBasis *basis_out,
1197ed9e99e6SJeremy L Thompson                                      const CeedScalar **B_out) {
1198ed9e99e6SJeremy L Thompson   // Assemble B_in, B_out if needed
1199ed9e99e6SJeremy L Thompson   if (B_in && !data->B_in) {
1200ed9e99e6SJeremy L Thompson     CeedInt           num_qpts, elem_size;
1201ed9e99e6SJeremy L Thompson     CeedScalar       *B_in, *identity = NULL;
1202ed9e99e6SJeremy L Thompson     const CeedScalar *interp_in, *grad_in;
1203ed9e99e6SJeremy L Thompson     bool              has_eval_none = false;
1204ed9e99e6SJeremy L Thompson 
12052b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_in, &num_qpts));
12062b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(data->basis_in, &elem_size));
12072b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_in, &B_in));
1208ed9e99e6SJeremy L Thompson 
1209ed9e99e6SJeremy L Thompson     for (CeedInt i = 0; i < data->num_eval_mode_in; i++) {
1210ed9e99e6SJeremy L Thompson       has_eval_none = has_eval_none || (data->eval_mode_in[i] == CEED_EVAL_NONE);
1211ed9e99e6SJeremy L Thompson     }
1212ed9e99e6SJeremy L Thompson     if (has_eval_none) {
12132b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * elem_size, &identity));
1214ed9e99e6SJeremy L Thompson       for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) {
1215ed9e99e6SJeremy L Thompson         identity[i * elem_size + i] = 1.0;
1216ed9e99e6SJeremy L Thompson       }
1217ed9e99e6SJeremy L Thompson     }
12182b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetInterp(data->basis_in, &interp_in));
12192b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetGrad(data->basis_in, &grad_in));
1220ed9e99e6SJeremy L Thompson 
1221ed9e99e6SJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
1222ed9e99e6SJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) {
1223ed9e99e6SJeremy L Thompson         CeedInt d_in = -1;
1224ed9e99e6SJeremy L Thompson         for (CeedInt e_in = 0; e_in < data->num_eval_mode_in; e_in++) {
1225ed9e99e6SJeremy L Thompson           const CeedInt     qq = data->num_eval_mode_in * q;
1226ed9e99e6SJeremy L Thompson           const CeedScalar *b  = NULL;
1227ed9e99e6SJeremy L Thompson 
1228ed9e99e6SJeremy L Thompson           if (data->eval_mode_in[e_in] == CEED_EVAL_GRAD) d_in++;
12292b730f8bSJeremy L Thompson           CeedOperatorGetBasisPointer(data->eval_mode_in[e_in], identity, interp_in, &grad_in[d_in * num_qpts * elem_size], &b);
1230ed9e99e6SJeremy L Thompson           B_in[(qq + e_in) * elem_size + n] = b[q * elem_size + n];
1231ed9e99e6SJeremy L Thompson         }
1232ed9e99e6SJeremy L Thompson       }
1233ed9e99e6SJeremy L Thompson     }
1234ed9e99e6SJeremy L Thompson     data->B_in = B_in;
1235ed9e99e6SJeremy L Thompson   }
1236ed9e99e6SJeremy L Thompson 
1237ed9e99e6SJeremy L Thompson   if (B_out && !data->B_out) {
1238ed9e99e6SJeremy L Thompson     CeedInt           num_qpts, elem_size;
1239ed9e99e6SJeremy L Thompson     CeedScalar       *B_out, *identity = NULL;
1240ed9e99e6SJeremy L Thompson     const CeedScalar *interp_out, *grad_out;
1241ed9e99e6SJeremy L Thompson     bool              has_eval_none = false;
1242ed9e99e6SJeremy L Thompson 
12432b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumQuadraturePoints(data->basis_out, &num_qpts));
12442b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetNumNodes(data->basis_out, &elem_size));
12452b730f8bSJeremy L Thompson     CeedCall(CeedCalloc(num_qpts * elem_size * data->num_eval_mode_out, &B_out));
1246ed9e99e6SJeremy L Thompson 
1247ed9e99e6SJeremy L Thompson     for (CeedInt i = 0; i < data->num_eval_mode_out; i++) {
1248ed9e99e6SJeremy L Thompson       has_eval_none = has_eval_none || (data->eval_mode_out[i] == CEED_EVAL_NONE);
1249ed9e99e6SJeremy L Thompson     }
1250ed9e99e6SJeremy L Thompson     if (has_eval_none) {
12512b730f8bSJeremy L Thompson       CeedCall(CeedCalloc(num_qpts * elem_size, &identity));
1252ed9e99e6SJeremy L Thompson       for (CeedInt i = 0; i < (elem_size < num_qpts ? elem_size : num_qpts); i++) {
1253ed9e99e6SJeremy L Thompson         identity[i * elem_size + i] = 1.0;
1254ed9e99e6SJeremy L Thompson       }
1255ed9e99e6SJeremy L Thompson     }
12562b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetInterp(data->basis_out, &interp_out));
12572b730f8bSJeremy L Thompson     CeedCall(CeedBasisGetGrad(data->basis_out, &grad_out));
1258ed9e99e6SJeremy L Thompson 
1259ed9e99e6SJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
1260ed9e99e6SJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) {
1261ed9e99e6SJeremy L Thompson         CeedInt d_out = -1;
1262ed9e99e6SJeremy L Thompson         for (CeedInt e_out = 0; e_out < data->num_eval_mode_out; e_out++) {
1263ed9e99e6SJeremy L Thompson           const CeedInt     qq = data->num_eval_mode_out * q;
1264ed9e99e6SJeremy L Thompson           const CeedScalar *b  = NULL;
1265ed9e99e6SJeremy L Thompson 
1266ed9e99e6SJeremy L Thompson           if (data->eval_mode_out[e_out] == CEED_EVAL_GRAD) d_out++;
12672b730f8bSJeremy L Thompson           CeedOperatorGetBasisPointer(data->eval_mode_out[e_out], identity, interp_out, &grad_out[d_out * num_qpts * elem_size], &b);
1268ed9e99e6SJeremy L Thompson           B_out[(qq + e_out) * elem_size + n] = b[q * elem_size + n];
1269ed9e99e6SJeremy L Thompson         }
1270ed9e99e6SJeremy L Thompson       }
1271ed9e99e6SJeremy L Thompson     }
1272ed9e99e6SJeremy L Thompson     data->B_out = B_out;
1273ed9e99e6SJeremy L Thompson   }
1274ed9e99e6SJeremy L Thompson 
1275ed9e99e6SJeremy L Thompson   if (basis_in) *basis_in = data->basis_in;
1276ed9e99e6SJeremy L Thompson   if (B_in) *B_in = data->B_in;
1277ed9e99e6SJeremy L Thompson   if (basis_out) *basis_out = data->basis_out;
1278ed9e99e6SJeremy L Thompson   if (B_out) *B_out = data->B_out;
1279ed9e99e6SJeremy L Thompson 
1280ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1281ed9e99e6SJeremy L Thompson }
1282ed9e99e6SJeremy L Thompson 
1283ed9e99e6SJeremy L Thompson /**
1284ed9e99e6SJeremy L Thompson   @brief Destroy CeedOperatorAssemblyData
1285ed9e99e6SJeremy L Thompson 
1286ea61e9acSJeremy L Thompson   @param[in,out] data CeedOperatorAssemblyData to destroy
1287ed9e99e6SJeremy L Thompson 
1288ed9e99e6SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1289ed9e99e6SJeremy L Thompson 
1290ed9e99e6SJeremy L Thompson   @ref Backend
1291ed9e99e6SJeremy L Thompson **/
1292ed9e99e6SJeremy L Thompson int CeedOperatorAssemblyDataDestroy(CeedOperatorAssemblyData *data) {
1293ed9e99e6SJeremy L Thompson   if (!*data) return CEED_ERROR_SUCCESS;
1294ed9e99e6SJeremy L Thompson 
12952b730f8bSJeremy L Thompson   CeedCall(CeedDestroy(&(*data)->ceed));
12962b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&(*data)->basis_in));
12972b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&(*data)->basis_out));
12982b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_in));
12992b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->eval_mode_out));
13002b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->B_in));
13012b730f8bSJeremy L Thompson   CeedCall(CeedFree(&(*data)->B_out));
1302ed9e99e6SJeremy L Thompson 
13032b730f8bSJeremy L Thompson   CeedCall(CeedFree(data));
1304ed9e99e6SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1305ed9e99e6SJeremy L Thompson }
1306ed9e99e6SJeremy L Thompson 
1307480fae85SJeremy L Thompson /// @}
1308480fae85SJeremy L Thompson 
1309480fae85SJeremy L Thompson /// ----------------------------------------------------------------------------
1310eaf62fffSJeremy L Thompson /// CeedOperator Public API
1311eaf62fffSJeremy L Thompson /// ----------------------------------------------------------------------------
1312eaf62fffSJeremy L Thompson /// @addtogroup CeedOperatorUser
1313eaf62fffSJeremy L Thompson /// @{
1314eaf62fffSJeremy L Thompson 
1315eaf62fffSJeremy L Thompson /**
1316eaf62fffSJeremy L Thompson   @brief Assemble a linear CeedQFunction associated with a CeedOperator
1317eaf62fffSJeremy L Thompson 
1318ea61e9acSJeremy L Thompson   This returns a CeedVector containing a matrix at each quadrature point providing the action of the CeedQFunction associated with the CeedOperator.
1319ea61e9acSJeremy L Thompson     The vector 'assembled' is of shape [num_elements, num_input_fields, num_output_fields, num_quad_points] and contains column-major matrices
1320ea61e9acSJeremy L Thompson representing the action of the CeedQFunction for a corresponding quadrature point on an element. Inputs and outputs are in the order provided by the
1321ea61e9acSJeremy L Thompson user when adding CeedOperator fields. For example, a CeedQFunction with inputs 'u' and 'gradu' and outputs 'gradv' and 'v', provided in that order,
1322ea61e9acSJeremy L Thompson would result in an assembled QFunction that consists of (1 + dim) x (dim + 1) matrices at each quadrature point acting on the input [u, du_0, du_1]
1323ea61e9acSJeremy L Thompson and producing the output [dv_0, dv_1, v].
1324eaf62fffSJeremy L Thompson 
1325ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1326f04ea552SJeremy L Thompson 
1327ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1328ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
1329ea61e9acSJeremy L Thompson   @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
1330ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1331eaf62fffSJeremy L Thompson 
1332eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1333eaf62fffSJeremy L Thompson 
1334eaf62fffSJeremy L Thompson   @ref User
1335eaf62fffSJeremy L Thompson **/
13362b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunction(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
13372b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1338eaf62fffSJeremy L Thompson 
1339eaf62fffSJeremy L Thompson   if (op->LinearAssembleQFunction) {
1340d04bbc78SJeremy L Thompson     // Backend version
13412b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleQFunction(op, assembled, rstr, request));
1342eaf62fffSJeremy L Thompson   } else {
1343d04bbc78SJeremy L Thompson     // Operator fallback
1344d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1345d04bbc78SJeremy L Thompson 
13462b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1347d04bbc78SJeremy L Thompson     if (op_fallback) {
13482b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunction(op_fallback, assembled, rstr, request));
1349d04bbc78SJeremy L Thompson     } else {
1350d04bbc78SJeremy L Thompson       // LCOV_EXCL_START
13512b730f8bSJeremy L Thompson       return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunction");
1352d04bbc78SJeremy L Thompson       // LCOV_EXCL_STOP
1353d04bbc78SJeremy L Thompson     }
135470a7ffb3SJeremy L Thompson   }
1355eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1356eaf62fffSJeremy L Thompson }
135770a7ffb3SJeremy L Thompson 
/**
  @brief Assemble CeedQFunction and store result internally.
           Return copied references of stored data to the caller.
           Caller is responsible for ownership and destruction of the copied references.
           See also @ref CeedOperatorLinearAssembleQFunction

  @param[in]  op        CeedOperator to assemble CeedQFunction
  @param[out] assembled CeedVector to store assembled CeedQFunction at quadrature points
  @param[out] rstr      CeedElemRestriction for CeedVector containing assembled CeedQFunction
  @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE

  @return An error code: 0 - success, otherwise - failure

  @ref User
**/
13732b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleQFunctionBuildOrUpdate(CeedOperator op, CeedVector *assembled, CeedElemRestriction *rstr, CeedRequest *request) {
13742b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
137570a7ffb3SJeremy L Thompson 
137670a7ffb3SJeremy L Thompson   if (op->LinearAssembleQFunctionUpdate) {
1377d04bbc78SJeremy L Thompson     // Backend version
1378480fae85SJeremy L Thompson     bool                qf_assembled_is_setup;
13792efa2d85SJeremy L Thompson     CeedVector          assembled_vec  = NULL;
13802efa2d85SJeremy L Thompson     CeedElemRestriction assembled_rstr = NULL;
1381480fae85SJeremy L Thompson 
13822b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataIsSetup(op->qf_assembled, &qf_assembled_is_setup));
1383480fae85SJeremy L Thompson     if (qf_assembled_is_setup) {
1384d04bbc78SJeremy L Thompson       bool update_needed;
1385d04bbc78SJeremy L Thompson 
13862b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataGetObjects(op->qf_assembled, &assembled_vec, &assembled_rstr));
13872b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataIsUpdateNeeded(op->qf_assembled, &update_needed));
13888b919e6bSJeremy L Thompson       if (update_needed) {
13892b730f8bSJeremy L Thompson         CeedCall(op->LinearAssembleQFunctionUpdate(op, assembled_vec, assembled_rstr, request));
13908b919e6bSJeremy L Thompson       }
139170a7ffb3SJeremy L Thompson     } else {
13922b730f8bSJeremy L Thompson       CeedCall(op->LinearAssembleQFunction(op, &assembled_vec, &assembled_rstr, request));
13932b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionAssemblyDataSetObjects(op->qf_assembled, assembled_vec, assembled_rstr));
139470a7ffb3SJeremy L Thompson     }
13952b730f8bSJeremy L Thompson     CeedCall(CeedQFunctionAssemblyDataSetUpdateNeeded(op->qf_assembled, false));
13962efa2d85SJeremy L Thompson 
1397d04bbc78SJeremy L Thompson     // Copy reference from internally held copy
139870a7ffb3SJeremy L Thompson     *assembled = NULL;
139970a7ffb3SJeremy L Thompson     *rstr      = NULL;
14002b730f8bSJeremy L Thompson     CeedCall(CeedVectorReferenceCopy(assembled_vec, assembled));
14012b730f8bSJeremy L Thompson     CeedCall(CeedVectorDestroy(&assembled_vec));
14022b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionReferenceCopy(assembled_rstr, rstr));
14032b730f8bSJeremy L Thompson     CeedCall(CeedElemRestrictionDestroy(&assembled_rstr));
140470a7ffb3SJeremy L Thompson   } else {
1405d04bbc78SJeremy L Thompson     // Operator fallback
1406d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1407d04bbc78SJeremy L Thompson 
14082b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1409d04bbc78SJeremy L Thompson     if (op_fallback) {
14102b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op_fallback, assembled, rstr, request));
1411d04bbc78SJeremy L Thompson     } else {
1412d04bbc78SJeremy L Thompson       // LCOV_EXCL_START
14132b730f8bSJeremy L Thompson       return CeedError(op->ceed, CEED_ERROR_UNSUPPORTED, "Backend does not support CeedOperatorLinearAssembleQFunctionUpdate");
1414d04bbc78SJeremy L Thompson       // LCOV_EXCL_STOP
141570a7ffb3SJeremy L Thompson     }
141670a7ffb3SJeremy L Thompson   }
141770a7ffb3SJeremy L Thompson 
141870a7ffb3SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1419eaf62fffSJeremy L Thompson }
1420eaf62fffSJeremy L Thompson 
1421eaf62fffSJeremy L Thompson /**
1422eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1423eaf62fffSJeremy L Thompson 
1424eaf62fffSJeremy L Thompson   This overwrites a CeedVector with the diagonal of a linear CeedOperator.
1425eaf62fffSJeremy L Thompson 
1426ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1427eaf62fffSJeremy L Thompson 
1428ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1429f04ea552SJeremy L Thompson 
1430ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1431eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1432ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1433eaf62fffSJeremy L Thompson 
1434eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1435eaf62fffSJeremy L Thompson 
1436eaf62fffSJeremy L Thompson   @ref User
1437eaf62fffSJeremy L Thompson **/
14382b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1439*f3d47e36SJeremy L Thompson   bool is_composite;
14402b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1441*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1442eaf62fffSJeremy L Thompson 
1443c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
14442b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
14452b730f8bSJeremy L Thompson   if (input_size != output_size) {
1446c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1447c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1448c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
14492b730f8bSJeremy L Thompson   }
1450c9366a6bSJeremy L Thompson 
1451*f3d47e36SJeremy L Thompson   // Early exit for empty operator
1452*f3d47e36SJeremy L Thompson   if (!is_composite) {
1453*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1454*f3d47e36SJeremy L Thompson 
1455*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1456*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1457*f3d47e36SJeremy L Thompson   }
1458*f3d47e36SJeremy L Thompson 
1459eaf62fffSJeremy L Thompson   if (op->LinearAssembleDiagonal) {
1460d04bbc78SJeremy L Thompson     // Backend version
14612b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleDiagonal(op, assembled, request));
1462eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1463eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddDiagonal) {
1464d04bbc78SJeremy L Thompson     // Backend version with zeroing first
14652b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
14662b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1467eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1468eaf62fffSJeremy L Thompson   } else {
1469d04bbc78SJeremy L Thompson     // Operator fallback
1470d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1471d04bbc78SJeremy L Thompson 
14722b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1473d04bbc78SJeremy L Thompson     if (op_fallback) {
14742b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleDiagonal(op_fallback, assembled, request));
1475eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1476eaf62fffSJeremy L Thompson     }
1477eaf62fffSJeremy L Thompson   }
1478eaf62fffSJeremy L Thompson   // Default interface implementation
14792b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
14802b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddDiagonal(op, assembled, request));
1481d04bbc78SJeremy L Thompson 
1482eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1483eaf62fffSJeremy L Thompson }
1484eaf62fffSJeremy L Thompson 
1485eaf62fffSJeremy L Thompson /**
1486eaf62fffSJeremy L Thompson   @brief Assemble the diagonal of a square linear CeedOperator
1487eaf62fffSJeremy L Thompson 
1488eaf62fffSJeremy L Thompson   This sums into a CeedVector the diagonal of a linear CeedOperator.
1489eaf62fffSJeremy L Thompson 
1490ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1491eaf62fffSJeremy L Thompson 
1492ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1493f04ea552SJeremy L Thompson 
1494ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1495eaf62fffSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator diagonal
1496ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1497eaf62fffSJeremy L Thompson 
1498eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1499eaf62fffSJeremy L Thompson 
1500eaf62fffSJeremy L Thompson   @ref User
1501eaf62fffSJeremy L Thompson **/
15022b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1503*f3d47e36SJeremy L Thompson   bool is_composite;
15042b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1505*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1506eaf62fffSJeremy L Thompson 
1507c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
15082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
15092b730f8bSJeremy L Thompson   if (input_size != output_size) {
1510c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1511c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1512c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
15132b730f8bSJeremy L Thompson   }
1514c9366a6bSJeremy L Thompson 
1515*f3d47e36SJeremy L Thompson   // Early exit for empty operator
1516*f3d47e36SJeremy L Thompson   if (!is_composite) {
1517*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1518*f3d47e36SJeremy L Thompson 
1519*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1520*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1521*f3d47e36SJeremy L Thompson   }
1522*f3d47e36SJeremy L Thompson 
1523eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddDiagonal) {
1524d04bbc78SJeremy L Thompson     // Backend version
15252b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddDiagonal(op, assembled, request));
1526eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1527eaf62fffSJeremy L Thompson   } else {
1528d04bbc78SJeremy L Thompson     // Operator fallback
1529d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1530d04bbc78SJeremy L Thompson 
15312b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1532d04bbc78SJeremy L Thompson     if (op_fallback) {
15332b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddDiagonal(op_fallback, assembled, request));
1534eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1535eaf62fffSJeremy L Thompson     }
1536eaf62fffSJeremy L Thompson   }
1537eaf62fffSJeremy L Thompson   // Default interface implementation
1538eaf62fffSJeremy L Thompson   if (is_composite) {
15392b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, false, assembled));
1540eaf62fffSJeremy L Thompson   } else {
15412b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, false, assembled));
1542eaf62fffSJeremy L Thompson   }
1543d04bbc78SJeremy L Thompson 
1544d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1545eaf62fffSJeremy L Thompson }
1546eaf62fffSJeremy L Thompson 
1547eaf62fffSJeremy L Thompson /**
1548eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1549eaf62fffSJeremy L Thompson 
1550ea61e9acSJeremy L Thompson   This overwrites a CeedVector with the point block diagonal of a linear CeedOperator.
1551eaf62fffSJeremy L Thompson 
1552ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1553eaf62fffSJeremy L Thompson 
1554ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1555f04ea552SJeremy L Thompson 
1556ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1557ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1558ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1559ea61e9acSJeremy L Thompson component in].
1560ea61e9acSJeremy L Thompson   @param[in]  request   Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1561eaf62fffSJeremy L Thompson 
1562eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1563eaf62fffSJeremy L Thompson 
1564eaf62fffSJeremy L Thompson   @ref User
1565eaf62fffSJeremy L Thompson **/
15662b730f8bSJeremy L Thompson int CeedOperatorLinearAssemblePointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1567*f3d47e36SJeremy L Thompson   bool is_composite;
15682b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1569*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1570eaf62fffSJeremy L Thompson 
1571c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
15722b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
15732b730f8bSJeremy L Thompson   if (input_size != output_size) {
1574c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1575c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1576c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
15772b730f8bSJeremy L Thompson   }
1578c9366a6bSJeremy L Thompson 
1579*f3d47e36SJeremy L Thompson   // Early exit for empty operator
1580*f3d47e36SJeremy L Thompson   if (!is_composite) {
1581*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1582*f3d47e36SJeremy L Thompson 
1583*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1584*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1585*f3d47e36SJeremy L Thompson   }
1586*f3d47e36SJeremy L Thompson 
1587eaf62fffSJeremy L Thompson   if (op->LinearAssemblePointBlockDiagonal) {
1588d04bbc78SJeremy L Thompson     // Backend version
15892b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemblePointBlockDiagonal(op, assembled, request));
1590eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1591eaf62fffSJeremy L Thompson   } else if (op->LinearAssembleAddPointBlockDiagonal) {
1592d04bbc78SJeremy L Thompson     // Backend version with zeroing first
15932b730f8bSJeremy L Thompson     CeedCall(CeedVectorSetValue(assembled, 0.0));
15942b730f8bSJeremy L Thompson     CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1595eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1596eaf62fffSJeremy L Thompson   } else {
1597d04bbc78SJeremy L Thompson     // Operator fallback
1598d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1599d04bbc78SJeremy L Thompson 
16002b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1601d04bbc78SJeremy L Thompson     if (op_fallback) {
16022b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemblePointBlockDiagonal(op_fallback, assembled, request));
1603eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1604eaf62fffSJeremy L Thompson     }
1605eaf62fffSJeremy L Thompson   }
1606eaf62fffSJeremy L Thompson   // Default interface implementation
16072b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(assembled, 0.0));
16082b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op, assembled, request));
1609d04bbc78SJeremy L Thompson 
1610eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1611eaf62fffSJeremy L Thompson }
1612eaf62fffSJeremy L Thompson 
1613eaf62fffSJeremy L Thompson /**
1614eaf62fffSJeremy L Thompson   @brief Assemble the point block diagonal of a square linear CeedOperator
1615eaf62fffSJeremy L Thompson 
1616ea61e9acSJeremy L Thompson   This sums into a CeedVector with the point block diagonal of a linear CeedOperator.
1617eaf62fffSJeremy L Thompson 
1618ea61e9acSJeremy L Thompson   Note: Currently only non-composite CeedOperators with a single field and composite CeedOperators with single field sub-operators are supported.
1619eaf62fffSJeremy L Thompson 
1620ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1621f04ea552SJeremy L Thompson 
1622ea61e9acSJeremy L Thompson   @param[in]  op        CeedOperator to assemble CeedQFunction
1623ea61e9acSJeremy L Thompson   @param[out] assembled CeedVector to store assembled CeedOperator point block diagonal, provided in row-major form with an @a num_comp * @a num_comp
1624ea61e9acSJeremy L Thompson block at each node. The dimensions of this vector are derived from the active vector for the CeedOperator. The array has shape [nodes, component out,
1625ea61e9acSJeremy L Thompson component in].
1626ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
1627eaf62fffSJeremy L Thompson 
1628eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1629eaf62fffSJeremy L Thompson 
1630eaf62fffSJeremy L Thompson   @ref User
1631eaf62fffSJeremy L Thompson **/
16322b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleAddPointBlockDiagonal(CeedOperator op, CeedVector assembled, CeedRequest *request) {
1633*f3d47e36SJeremy L Thompson   bool is_composite;
16342b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1635*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1636eaf62fffSJeremy L Thompson 
1637c9366a6bSJeremy L Thompson   CeedSize input_size = 0, output_size = 0;
16382b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveVectorLengths(op, &input_size, &output_size));
16392b730f8bSJeremy L Thompson   if (input_size != output_size) {
1640c9366a6bSJeremy L Thompson     // LCOV_EXCL_START
1641c9366a6bSJeremy L Thompson     return CeedError(op->ceed, CEED_ERROR_DIMENSION, "Operator must be square");
1642c9366a6bSJeremy L Thompson     // LCOV_EXCL_STOP
16432b730f8bSJeremy L Thompson   }
1644c9366a6bSJeremy L Thompson 
1645*f3d47e36SJeremy L Thompson   // Early exit for empty operator
1646*f3d47e36SJeremy L Thompson   if (!is_composite) {
1647*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1648*f3d47e36SJeremy L Thompson 
1649*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1650*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1651*f3d47e36SJeremy L Thompson   }
1652*f3d47e36SJeremy L Thompson 
1653eaf62fffSJeremy L Thompson   if (op->LinearAssembleAddPointBlockDiagonal) {
1654d04bbc78SJeremy L Thompson     // Backend version
16552b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleAddPointBlockDiagonal(op, assembled, request));
1656eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1657eaf62fffSJeremy L Thompson   } else {
1658d04bbc78SJeremy L Thompson     // Operator fallback
1659d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1660d04bbc78SJeremy L Thompson 
16612b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1662d04bbc78SJeremy L Thompson     if (op_fallback) {
16632b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleAddPointBlockDiagonal(op_fallback, assembled, request));
1664eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1665eaf62fffSJeremy L Thompson     }
1666eaf62fffSJeremy L Thompson   }
1667ea61e9acSJeremy L Thompson   // Default interface implementation
1668eaf62fffSJeremy L Thompson   if (is_composite) {
16692b730f8bSJeremy L Thompson     CeedCall(CeedCompositeOperatorLinearAssembleAddDiagonal(op, request, true, assembled));
1670eaf62fffSJeremy L Thompson   } else {
16712b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleAddDiagonal_Core(op, request, true, assembled));
1672eaf62fffSJeremy L Thompson   }
1673d04bbc78SJeremy L Thompson 
1674d04bbc78SJeremy L Thompson   return CEED_ERROR_SUCCESS;
1675eaf62fffSJeremy L Thompson }
1676eaf62fffSJeremy L Thompson 
1677eaf62fffSJeremy L Thompson /**
1678eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero pattern of a linear operator.
1679eaf62fffSJeremy L Thompson 
1680ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssemble().
1681eaf62fffSJeremy L Thompson 
1682ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
1683ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the number of entries and their (i, j)
1684ea61e9acSJeremy L Thompson locations, while CeedOperatorLinearAssemble() provides the values in the same ordering.
1685eaf62fffSJeremy L Thompson 
1686eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1687eaf62fffSJeremy L Thompson 
1688ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1689f04ea552SJeremy L Thompson 
1690eaf62fffSJeremy L Thompson    @param[in]  op          CeedOperator to assemble
1691eaf62fffSJeremy L Thompson    @param[out] num_entries Number of entries in coordinate nonzero pattern
1692eaf62fffSJeremy L Thompson    @param[out] rows        Row number for each entry
1693eaf62fffSJeremy L Thompson    @param[out] cols        Column number for each entry
1694eaf62fffSJeremy L Thompson 
1695eaf62fffSJeremy L Thompson    @ref User
1696eaf62fffSJeremy L Thompson **/
16972b730f8bSJeremy L Thompson int CeedOperatorLinearAssembleSymbolic(CeedOperator op, CeedSize *num_entries, CeedInt **rows, CeedInt **cols) {
1698eaf62fffSJeremy L Thompson   CeedInt       num_suboperators, single_entries;
1699eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1700eaf62fffSJeremy L Thompson   bool          is_composite;
17012b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1702*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1703eaf62fffSJeremy L Thompson 
1704eaf62fffSJeremy L Thompson   if (op->LinearAssembleSymbolic) {
1705d04bbc78SJeremy L Thompson     // Backend version
17062b730f8bSJeremy L Thompson     CeedCall(op->LinearAssembleSymbolic(op, num_entries, rows, cols));
1707eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1708eaf62fffSJeremy L Thompson   } else {
1709d04bbc78SJeremy L Thompson     // Operator fallback
1710d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1711d04bbc78SJeremy L Thompson 
17122b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1713d04bbc78SJeremy L Thompson     if (op_fallback) {
17142b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssembleSymbolic(op_fallback, num_entries, rows, cols));
1715eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1716eaf62fffSJeremy L Thompson     }
1717eaf62fffSJeremy L Thompson   }
1718eaf62fffSJeremy L Thompson 
1719eaf62fffSJeremy L Thompson   // Default interface implementation
1720eaf62fffSJeremy L Thompson 
1721eaf62fffSJeremy L Thompson   // count entries and allocate rows, cols arrays
1722eaf62fffSJeremy L Thompson   *num_entries = 0;
1723eaf62fffSJeremy L Thompson   if (is_composite) {
1724c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1725c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
172692ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
17272b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1728eaf62fffSJeremy L Thompson       *num_entries += single_entries;
1729eaf62fffSJeremy L Thompson     }
1730eaf62fffSJeremy L Thompson   } else {
17312b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemblyCountEntries(op, &single_entries));
1732eaf62fffSJeremy L Thompson     *num_entries += single_entries;
1733eaf62fffSJeremy L Thompson   }
17342b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, rows));
17352b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(*num_entries, cols));
1736eaf62fffSJeremy L Thompson 
1737eaf62fffSJeremy L Thompson   // assemble nonzero locations
1738eaf62fffSJeremy L Thompson   CeedInt offset = 0;
1739eaf62fffSJeremy L Thompson   if (is_composite) {
1740c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1741c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
174292ae7e47SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; ++k) {
17432b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssembleSymbolic(sub_operators[k], offset, *rows, *cols));
17442b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1745eaf62fffSJeremy L Thompson       offset += single_entries;
1746eaf62fffSJeremy L Thompson     }
1747eaf62fffSJeremy L Thompson   } else {
17482b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssembleSymbolic(op, offset, *rows, *cols));
1749eaf62fffSJeremy L Thompson   }
1750eaf62fffSJeremy L Thompson 
1751eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1752eaf62fffSJeremy L Thompson }
1753eaf62fffSJeremy L Thompson 
1754eaf62fffSJeremy L Thompson /**
1755eaf62fffSJeremy L Thompson    @brief Fully assemble the nonzero entries of a linear operator.
1756eaf62fffSJeremy L Thompson 
1757ea61e9acSJeremy L Thompson    Expected to be used in conjunction with CeedOperatorLinearAssembleSymbolic().
1758eaf62fffSJeremy L Thompson 
1759ea61e9acSJeremy L Thompson    The assembly routines use coordinate format, with num_entries tuples of the form (i, j, value) which indicate that value should be added to the
1760ea61e9acSJeremy L Thompson matrix in entry (i, j). Note that the (i, j) pairs are not unique and may repeat. This function returns the values of the nonzero entries to be added,
1761ea61e9acSJeremy L Thompson their (i, j) locations are provided by CeedOperatorLinearAssembleSymbolic()
1762eaf62fffSJeremy L Thompson 
1763eaf62fffSJeremy L Thompson    This will generally be slow unless your operator is low-order.
1764eaf62fffSJeremy L Thompson 
1765ea61e9acSJeremy L Thompson    Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
1766f04ea552SJeremy L Thompson 
1767eaf62fffSJeremy L Thompson    @param[in]  op     CeedOperator to assemble
1768eaf62fffSJeremy L Thompson    @param[out] values Values to assemble into matrix
1769eaf62fffSJeremy L Thompson 
1770eaf62fffSJeremy L Thompson    @ref User
1771eaf62fffSJeremy L Thompson **/
1772eaf62fffSJeremy L Thompson int CeedOperatorLinearAssemble(CeedOperator op, CeedVector values) {
1773eaf62fffSJeremy L Thompson   CeedInt       num_suboperators, single_entries = 0;
1774eaf62fffSJeremy L Thompson   CeedOperator *sub_operators;
1775*f3d47e36SJeremy L Thompson   bool          is_composite;
17762b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
1777*f3d47e36SJeremy L Thompson   CeedCall(CeedOperatorIsComposite(op, &is_composite));
1778*f3d47e36SJeremy L Thompson 
1779*f3d47e36SJeremy L Thompson   // Early exit for empty operator
1780*f3d47e36SJeremy L Thompson   if (!is_composite) {
1781*f3d47e36SJeremy L Thompson     CeedInt num_elem = 0;
1782*f3d47e36SJeremy L Thompson 
1783*f3d47e36SJeremy L Thompson     CeedCall(CeedOperatorGetNumElements(op, &num_elem));
1784*f3d47e36SJeremy L Thompson     if (num_elem == 0) return CEED_ERROR_SUCCESS;
1785*f3d47e36SJeremy L Thompson   }
1786eaf62fffSJeremy L Thompson 
1787eaf62fffSJeremy L Thompson   if (op->LinearAssemble) {
1788d04bbc78SJeremy L Thompson     // Backend version
17892b730f8bSJeremy L Thompson     CeedCall(op->LinearAssemble(op, values));
1790eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
1791eaf62fffSJeremy L Thompson   } else {
1792d04bbc78SJeremy L Thompson     // Operator fallback
1793d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
1794d04bbc78SJeremy L Thompson 
17952b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
1796d04bbc78SJeremy L Thompson     if (op_fallback) {
17972b730f8bSJeremy L Thompson       CeedCall(CeedOperatorLinearAssemble(op_fallback, values));
1798eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
1799eaf62fffSJeremy L Thompson     }
1800eaf62fffSJeremy L Thompson   }
1801eaf62fffSJeremy L Thompson 
1802eaf62fffSJeremy L Thompson   // Default interface implementation
1803eaf62fffSJeremy L Thompson   CeedInt offset = 0;
1804eaf62fffSJeremy L Thompson   if (is_composite) {
1805c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetNumSub(op, &num_suboperators));
1806c6ebc35dSJeremy L Thompson     CeedCall(CeedCompositeOperatorGetSubList(op, &sub_operators));
1807cefa2673SJeremy L Thompson     for (CeedInt k = 0; k < num_suboperators; k++) {
18082b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemble(sub_operators[k], offset, values));
18092b730f8bSJeremy L Thompson       CeedCall(CeedSingleOperatorAssemblyCountEntries(sub_operators[k], &single_entries));
1810eaf62fffSJeremy L Thompson       offset += single_entries;
1811eaf62fffSJeremy L Thompson     }
1812eaf62fffSJeremy L Thompson   } else {
18132b730f8bSJeremy L Thompson     CeedCall(CeedSingleOperatorAssemble(op, offset, values));
1814eaf62fffSJeremy L Thompson   }
1815eaf62fffSJeremy L Thompson 
1816eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1817eaf62fffSJeremy L Thompson }
1818eaf62fffSJeremy L Thompson 
1819eaf62fffSJeremy L Thompson /**
182075f0d5a4SJeremy L Thompson   @brief Get the multiplicity of nodes across suboperators in a composite CeedOperator
182175f0d5a4SJeremy L Thompson 
182275f0d5a4SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
182375f0d5a4SJeremy L Thompson 
182475f0d5a4SJeremy L Thompson   @param[in]  op               Composite CeedOperator
182575f0d5a4SJeremy L Thompson   @param[in]  num_skip_indices Number of suboperators to skip
182675f0d5a4SJeremy L Thompson   @param[in]  skip_indices     Array of indices of suboperators to skip
182775f0d5a4SJeremy L Thompson   @param[out] mult             Vector to store multiplicity (of size l_size)
182875f0d5a4SJeremy L Thompson 
182975f0d5a4SJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
183075f0d5a4SJeremy L Thompson 
183175f0d5a4SJeremy L Thompson   @ref User
183275f0d5a4SJeremy L Thompson **/
183375f0d5a4SJeremy L Thompson int CeedCompositeOperatorGetMultiplicity(CeedOperator op, CeedInt num_skip_indices, CeedInt *skip_indices, CeedVector mult) {
183475f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
183575f0d5a4SJeremy L Thompson 
183675f0d5a4SJeremy L Thompson   Ceed                ceed;
183775f0d5a4SJeremy L Thompson   CeedInt             num_sub_ops;
183875f0d5a4SJeremy L Thompson   CeedSize            l_vec_len;
183975f0d5a4SJeremy L Thompson   CeedScalar         *mult_array;
184075f0d5a4SJeremy L Thompson   CeedVector          ones_l_vec;
184175f0d5a4SJeremy L Thompson   CeedElemRestriction elem_restr;
184275f0d5a4SJeremy L Thompson   CeedOperator       *sub_ops;
184375f0d5a4SJeremy L Thompson 
184475f0d5a4SJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
184575f0d5a4SJeremy L Thompson 
184675f0d5a4SJeremy L Thompson   // Zero mult vector
184775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(mult, 0.0));
184875f0d5a4SJeremy L Thompson 
184975f0d5a4SJeremy L Thompson   // Get suboperators
1850c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetNumSub(op, &num_sub_ops));
1851c6ebc35dSJeremy L Thompson   CeedCall(CeedCompositeOperatorGetSubList(op, &sub_ops));
185275f0d5a4SJeremy L Thompson   if (num_sub_ops == 0) return CEED_ERROR_SUCCESS;
185375f0d5a4SJeremy L Thompson 
185475f0d5a4SJeremy L Thompson   // Work vector
185575f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetLength(mult, &l_vec_len));
185675f0d5a4SJeremy L Thompson   CeedCall(CeedVectorCreate(ceed, l_vec_len, &ones_l_vec));
185775f0d5a4SJeremy L Thompson   CeedCall(CeedVectorSetValue(ones_l_vec, 1.0));
185875f0d5a4SJeremy L Thompson   CeedCall(CeedVectorGetArray(mult, CEED_MEM_HOST, &mult_array));
185975f0d5a4SJeremy L Thompson 
186075f0d5a4SJeremy L Thompson   // Compute multiplicity across suboperators
186175f0d5a4SJeremy L Thompson   for (CeedInt i = 0; i < num_sub_ops; i++) {
186275f0d5a4SJeremy L Thompson     const CeedScalar *sub_mult_array;
186375f0d5a4SJeremy L Thompson     CeedVector        sub_mult_l_vec, ones_e_vec;
186475f0d5a4SJeremy L Thompson 
186575f0d5a4SJeremy L Thompson     // -- Check for suboperator to skip
186675f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < num_skip_indices; j++) {
186775f0d5a4SJeremy L Thompson       if (skip_indices[j] == i) continue;
186875f0d5a4SJeremy L Thompson     }
186975f0d5a4SJeremy L Thompson 
187075f0d5a4SJeremy L Thompson     // -- Sub operator multiplicity
187175f0d5a4SJeremy L Thompson     CeedCall(CeedOperatorGetActiveElemRestriction(sub_ops[i], &elem_restr));
187275f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionCreateVector(elem_restr, &sub_mult_l_vec, &ones_e_vec));
187375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorSetValue(sub_mult_l_vec, 0.0));
187475f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_restr, CEED_NOTRANSPOSE, ones_l_vec, ones_e_vec, CEED_REQUEST_IMMEDIATE));
187575f0d5a4SJeremy L Thompson     CeedCall(CeedElemRestrictionApply(elem_restr, CEED_TRANSPOSE, ones_e_vec, sub_mult_l_vec, CEED_REQUEST_IMMEDIATE));
187675f0d5a4SJeremy L Thompson     CeedCall(CeedVectorGetArrayRead(sub_mult_l_vec, CEED_MEM_HOST, &sub_mult_array));
187775f0d5a4SJeremy L Thompson     // ---- Flag every node present in the current suboperator
187875f0d5a4SJeremy L Thompson     for (CeedInt j = 0; j < l_vec_len; j++) {
187975f0d5a4SJeremy L Thompson       if (sub_mult_array[j] > 0.0) mult_array[j] += 1.0;
188075f0d5a4SJeremy L Thompson     }
188175f0d5a4SJeremy L Thompson     CeedCall(CeedVectorRestoreArrayRead(sub_mult_l_vec, &sub_mult_array));
188275f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&sub_mult_l_vec));
188375f0d5a4SJeremy L Thompson     CeedCall(CeedVectorDestroy(&ones_e_vec));
188475f0d5a4SJeremy L Thompson   }
188575f0d5a4SJeremy L Thompson   CeedCall(CeedVectorRestoreArray(mult, &mult_array));
1886811d0ccfSJeremy L Thompson   CeedCall(CeedVectorDestroy(&ones_l_vec));
188775f0d5a4SJeremy L Thompson 
188875f0d5a4SJeremy L Thompson   return CEED_ERROR_SUCCESS;
188975f0d5a4SJeremy L Thompson }
189075f0d5a4SJeremy L Thompson 
189175f0d5a4SJeremy L Thompson /**
1892ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator, creating the prolongation basis from the fine and coarse
1893ea61e9acSJeremy L Thompson grid interpolation
1894eaf62fffSJeremy L Thompson 
189558e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
1896f04ea552SJeremy L Thompson 
1897eaf62fffSJeremy L Thompson   @param[in]  op_fine      Fine grid operator
1898eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine  L-vector multiplicity in parallel gather/scatter
1899eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse  Coarse grid restriction
1900eaf62fffSJeremy L Thompson   @param[in]  basis_coarse Coarse grid active vector basis
1901eaf62fffSJeremy L Thompson   @param[out] op_coarse    Coarse grid operator
1902eaf62fffSJeremy L Thompson   @param[out] op_prolong   Coarse to fine operator
1903eaf62fffSJeremy L Thompson   @param[out] op_restrict  Fine to coarse operator
1904eaf62fffSJeremy L Thompson 
1905eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1906eaf62fffSJeremy L Thompson 
1907eaf62fffSJeremy L Thompson   @ref User
1908eaf62fffSJeremy L Thompson **/
19092b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreate(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
19102b730f8bSJeremy L Thompson                                      CeedOperator *op_coarse, CeedOperator *op_prolong, CeedOperator *op_restrict) {
19112b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
1912eaf62fffSJeremy L Thompson 
1913f113e5dcSJeremy L Thompson   // Build prolongation matrix
1914f113e5dcSJeremy L Thompson   CeedBasis basis_fine, basis_c_to_f;
19152b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
19162b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateProjection(basis_coarse, basis_fine, &basis_c_to_f));
1917eaf62fffSJeremy L Thompson 
1918f113e5dcSJeremy L Thompson   // Core code
19192b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
1920f113e5dcSJeremy L Thompson 
1921eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1922eaf62fffSJeremy L Thompson }
1923eaf62fffSJeremy L Thompson 
1924eaf62fffSJeremy L Thompson /**
1925ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a tensor basis for the active basis
1926eaf62fffSJeremy L Thompson 
192758e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
1928f04ea552SJeremy L Thompson 
1929eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
1930eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter
1931eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
1932eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
1933eaf62fffSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation
1934eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
1935eaf62fffSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator
1936eaf62fffSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator
1937eaf62fffSJeremy L Thompson 
1938eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1939eaf62fffSJeremy L Thompson 
1940eaf62fffSJeremy L Thompson   @ref User
1941eaf62fffSJeremy L Thompson **/
19422b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateTensorH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
19432b730f8bSJeremy L Thompson                                              const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
19442b730f8bSJeremy L Thompson                                              CeedOperator *op_restrict) {
19452b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
1946eaf62fffSJeremy L Thompson   Ceed ceed;
19472b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
1948eaf62fffSJeremy L Thompson 
1949eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
1950eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
19512b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
1952eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
19532b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
19542b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
19552b730f8bSJeremy L Thompson   if (Q_f != Q_c) {
1956eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
19572b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
1958eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
19592b730f8bSJeremy L Thompson   }
1960eaf62fffSJeremy L Thompson 
1961eaf62fffSJeremy L Thompson   // Coarse to fine basis
1962eaf62fffSJeremy L Thompson   CeedInt dim, num_comp, num_nodes_c, P_1d_f, P_1d_c;
19632b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis_fine, &dim));
19642b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
19652b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis_fine, &P_1d_f));
19662b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
19672b730f8bSJeremy L Thompson   P_1d_c = dim == 1 ? num_nodes_c : dim == 2 ? sqrt(num_nodes_c) : cbrt(num_nodes_c);
1968eaf62fffSJeremy L Thompson   CeedScalar *q_ref, *q_weight, *grad;
19692b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d_f, &q_ref));
19702b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d_f, &q_weight));
19712b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d_f * P_1d_c * dim, &grad));
1972eaf62fffSJeremy L Thompson   CeedBasis basis_c_to_f;
19732b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateTensorH1(ceed, dim, num_comp, P_1d_c, P_1d_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
19742b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_ref));
19752b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_weight));
19762b730f8bSJeremy L Thompson   CeedCall(CeedFree(&grad));
1977eaf62fffSJeremy L Thompson 
1978eaf62fffSJeremy L Thompson   // Core code
19792b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
1980eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
1981eaf62fffSJeremy L Thompson }
1982eaf62fffSJeremy L Thompson 
1983eaf62fffSJeremy L Thompson /**
1984ea61e9acSJeremy L Thompson   @brief Create a multigrid coarse operator and level transfer operators for a CeedOperator with a non-tensor basis for the active vector
1985eaf62fffSJeremy L Thompson 
198658e4b056SJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets all four CeedOperators as immutable.
1987f04ea552SJeremy L Thompson 
1988eaf62fffSJeremy L Thompson   @param[in]  op_fine       Fine grid operator
1989eaf62fffSJeremy L Thompson   @param[in]  p_mult_fine   L-vector multiplicity in parallel gather/scatter
1990eaf62fffSJeremy L Thompson   @param[in]  rstr_coarse   Coarse grid restriction
1991eaf62fffSJeremy L Thompson   @param[in]  basis_coarse  Coarse grid active vector basis
1992eaf62fffSJeremy L Thompson   @param[in]  interp_c_to_f Matrix for coarse to fine interpolation
1993eaf62fffSJeremy L Thompson   @param[out] op_coarse     Coarse grid operator
1994eaf62fffSJeremy L Thompson   @param[out] op_prolong    Coarse to fine operator
1995eaf62fffSJeremy L Thompson   @param[out] op_restrict   Fine to coarse operator
1996eaf62fffSJeremy L Thompson 
1997eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
1998eaf62fffSJeremy L Thompson 
1999eaf62fffSJeremy L Thompson   @ref User
2000eaf62fffSJeremy L Thompson **/
20012b730f8bSJeremy L Thompson int CeedOperatorMultigridLevelCreateH1(CeedOperator op_fine, CeedVector p_mult_fine, CeedElemRestriction rstr_coarse, CeedBasis basis_coarse,
20022b730f8bSJeremy L Thompson                                        const CeedScalar *interp_c_to_f, CeedOperator *op_coarse, CeedOperator *op_prolong,
2003eaf62fffSJeremy L Thompson                                        CeedOperator *op_restrict) {
20042b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op_fine));
2005eaf62fffSJeremy L Thompson   Ceed ceed;
20062b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op_fine, &ceed));
2007eaf62fffSJeremy L Thompson 
2008eaf62fffSJeremy L Thompson   // Check for compatible quadrature spaces
2009eaf62fffSJeremy L Thompson   CeedBasis basis_fine;
20102b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetActiveBasis(op_fine, &basis_fine));
2011eaf62fffSJeremy L Thompson   CeedInt Q_f, Q_c;
20122b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_fine, &Q_f));
20132b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis_coarse, &Q_c));
20142b730f8bSJeremy L Thompson   if (Q_f != Q_c) {
2015eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
20162b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_DIMENSION, "Bases must have compatible quadrature spaces");
2017eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
20182b730f8bSJeremy L Thompson   }
2019eaf62fffSJeremy L Thompson 
2020eaf62fffSJeremy L Thompson   // Coarse to fine basis
2021eaf62fffSJeremy L Thompson   CeedElemTopology topo;
20222b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetTopology(basis_fine, &topo));
2023eaf62fffSJeremy L Thompson   CeedInt dim, num_comp, num_nodes_c, num_nodes_f;
20242b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis_fine, &dim));
20252b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis_fine, &num_comp));
20262b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes(basis_fine, &num_nodes_f));
20272b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetElementSize(rstr_coarse, &num_nodes_c));
2028eaf62fffSJeremy L Thompson   CeedScalar *q_ref, *q_weight, *grad;
20292b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_nodes_f * dim, &q_ref));
20302b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_nodes_f, &q_weight));
20312b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_nodes_f * num_nodes_c * dim, &grad));
2032eaf62fffSJeremy L Thompson   CeedBasis basis_c_to_f;
20332b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateH1(ceed, topo, num_comp, num_nodes_c, num_nodes_f, interp_c_to_f, grad, q_ref, q_weight, &basis_c_to_f));
20342b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_ref));
20352b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_weight));
20362b730f8bSJeremy L Thompson   CeedCall(CeedFree(&grad));
2037eaf62fffSJeremy L Thompson 
2038eaf62fffSJeremy L Thompson   // Core code
20392b730f8bSJeremy L Thompson   CeedCall(CeedSingleOperatorMultigridLevel(op_fine, p_mult_fine, rstr_coarse, basis_coarse, basis_c_to_f, op_coarse, op_prolong, op_restrict));
2040eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2041eaf62fffSJeremy L Thompson }
2042eaf62fffSJeremy L Thompson 
2043eaf62fffSJeremy L Thompson /**
2044ea61e9acSJeremy L Thompson   @brief Build a FDM based approximate inverse for each element for a CeedOperator
2045eaf62fffSJeremy L Thompson 
2046ea61e9acSJeremy L Thompson   This returns a CeedOperator and CeedVector to apply a Fast Diagonalization Method based approximate inverse.
2047ea61e9acSJeremy L Thompson     This function obtains the simultaneous diagonalization for the 1D mass and Laplacian operators, M = V^T V, K = V^T S V.
2048ea61e9acSJeremy L Thompson     The assembled QFunction is used to modify the eigenvalues from simultaneous diagonalization and obtain an approximate inverse of the form V^T
2049ea61e9acSJeremy L Thompson S^hat V. The CeedOperator must be linear and non-composite. The associated CeedQFunction must therefore also be linear.
2050eaf62fffSJeremy L Thompson 
2051ea61e9acSJeremy L Thompson   Note: Calling this function asserts that setup is complete and sets the CeedOperator as immutable.
2052f04ea552SJeremy L Thompson 
2053ea61e9acSJeremy L Thompson   @param[in]  op      CeedOperator to create element inverses
2054ea61e9acSJeremy L Thompson   @param[out] fdm_inv CeedOperator to apply the action of a FDM based inverse for each element
2055ea61e9acSJeremy L Thompson   @param[in]  request Address of CeedRequest for non-blocking completion, else @ref CEED_REQUEST_IMMEDIATE
2056eaf62fffSJeremy L Thompson 
2057eaf62fffSJeremy L Thompson   @return An error code: 0 - success, otherwise - failure
2058eaf62fffSJeremy L Thompson 
2059480fae85SJeremy L Thompson   @ref User
2060eaf62fffSJeremy L Thompson **/
20612b730f8bSJeremy L Thompson int CeedOperatorCreateFDMElementInverse(CeedOperator op, CeedOperator *fdm_inv, CeedRequest *request) {
20622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCheckReady(op));
2063eaf62fffSJeremy L Thompson 
2064eaf62fffSJeremy L Thompson   if (op->CreateFDMElementInverse) {
2065d04bbc78SJeremy L Thompson     // Backend version
20662b730f8bSJeremy L Thompson     CeedCall(op->CreateFDMElementInverse(op, fdm_inv, request));
2067eaf62fffSJeremy L Thompson     return CEED_ERROR_SUCCESS;
2068eaf62fffSJeremy L Thompson   } else {
2069d04bbc78SJeremy L Thompson     // Operator fallback
2070d04bbc78SJeremy L Thompson     CeedOperator op_fallback;
2071d04bbc78SJeremy L Thompson 
20722b730f8bSJeremy L Thompson     CeedCall(CeedOperatorGetFallback(op, &op_fallback));
2073d04bbc78SJeremy L Thompson     if (op_fallback) {
20742b730f8bSJeremy L Thompson       CeedCall(CeedOperatorCreateFDMElementInverse(op_fallback, fdm_inv, request));
2075eaf62fffSJeremy L Thompson       return CEED_ERROR_SUCCESS;
2076eaf62fffSJeremy L Thompson     }
2077eaf62fffSJeremy L Thompson   }
2078eaf62fffSJeremy L Thompson 
2079d04bbc78SJeremy L Thompson   // Default interface implementation
2080eaf62fffSJeremy L Thompson   Ceed ceed, ceed_parent;
20812b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetCeed(op, &ceed));
20822b730f8bSJeremy L Thompson   CeedCall(CeedGetOperatorFallbackParentCeed(ceed, &ceed_parent));
2083eaf62fffSJeremy L Thompson   ceed_parent = ceed_parent ? ceed_parent : ceed;
2084eaf62fffSJeremy L Thompson   CeedQFunction qf;
20852b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetQFunction(op, &qf));
2086eaf62fffSJeremy L Thompson 
2087eaf62fffSJeremy L Thompson   // Determine active input basis
2088eaf62fffSJeremy L Thompson   bool                interp = false, grad = false;
2089eaf62fffSJeremy L Thompson   CeedBasis           basis = NULL;
2090eaf62fffSJeremy L Thompson   CeedElemRestriction rstr  = NULL;
2091eaf62fffSJeremy L Thompson   CeedOperatorField  *op_fields;
2092eaf62fffSJeremy L Thompson   CeedQFunctionField *qf_fields;
2093eaf62fffSJeremy L Thompson   CeedInt             num_input_fields;
20942b730f8bSJeremy L Thompson   CeedCall(CeedOperatorGetFields(op, &num_input_fields, &op_fields, NULL, NULL));
20952b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionGetFields(qf, NULL, &qf_fields, NULL, NULL));
2096eaf62fffSJeremy L Thompson   for (CeedInt i = 0; i < num_input_fields; i++) {
2097eaf62fffSJeremy L Thompson     CeedVector vec;
20982b730f8bSJeremy L Thompson     CeedCall(CeedOperatorFieldGetVector(op_fields[i], &vec));
2099eaf62fffSJeremy L Thompson     if (vec == CEED_VECTOR_ACTIVE) {
2100eaf62fffSJeremy L Thompson       CeedEvalMode eval_mode;
21012b730f8bSJeremy L Thompson       CeedCall(CeedQFunctionFieldGetEvalMode(qf_fields[i], &eval_mode));
2102eaf62fffSJeremy L Thompson       interp = interp || eval_mode == CEED_EVAL_INTERP;
2103eaf62fffSJeremy L Thompson       grad   = grad || eval_mode == CEED_EVAL_GRAD;
21042b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetBasis(op_fields[i], &basis));
21052b730f8bSJeremy L Thompson       CeedCall(CeedOperatorFieldGetElemRestriction(op_fields[i], &rstr));
2106eaf62fffSJeremy L Thompson     }
2107eaf62fffSJeremy L Thompson   }
21082b730f8bSJeremy L Thompson   if (!basis) {
2109eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
2110eaf62fffSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_BACKEND, "No active field set");
2111eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
21122b730f8bSJeremy L Thompson   }
2113e79b91d9SJeremy L Thompson   CeedSize l_size = 1;
2114e79b91d9SJeremy L Thompson   CeedInt  P_1d, Q_1d, elem_size, num_qpts, dim, num_comp = 1, num_elem = 1;
21152b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes1D(basis, &P_1d));
21162b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumNodes(basis, &elem_size));
21172b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints1D(basis, &Q_1d));
21182b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumQuadraturePoints(basis, &num_qpts));
21192b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetDimension(basis, &dim));
21202b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetNumComponents(basis, &num_comp));
21212b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetNumElements(rstr, &num_elem));
21222b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetLVectorSize(rstr, &l_size));
2123eaf62fffSJeremy L Thompson 
2124eaf62fffSJeremy L Thompson   // Build and diagonalize 1D Mass and Laplacian
2125eaf62fffSJeremy L Thompson   bool tensor_basis;
21262b730f8bSJeremy L Thompson   CeedCall(CeedBasisIsTensor(basis, &tensor_basis));
21272b730f8bSJeremy L Thompson   if (!tensor_basis) {
2128eaf62fffSJeremy L Thompson     // LCOV_EXCL_START
21292b730f8bSJeremy L Thompson     return CeedError(ceed, CEED_ERROR_BACKEND, "FDMElementInverse only supported for tensor bases");
2130eaf62fffSJeremy L Thompson     // LCOV_EXCL_STOP
21312b730f8bSJeremy L Thompson   }
2132eaf62fffSJeremy L Thompson   CeedScalar *mass, *laplace, *x, *fdm_interp, *lambda;
21332b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &mass));
21342b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &laplace));
21352b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &x));
21362b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &fdm_interp));
21372b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &lambda));
2138eaf62fffSJeremy L Thompson   // -- Build matrices
2139eaf62fffSJeremy L Thompson   const CeedScalar *interp_1d, *grad_1d, *q_weight_1d;
21402b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetInterp1D(basis, &interp_1d));
21412b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetGrad1D(basis, &grad_1d));
21422b730f8bSJeremy L Thompson   CeedCall(CeedBasisGetQWeights(basis, &q_weight_1d));
21432b730f8bSJeremy L Thompson   CeedCall(CeedBuildMassLaplace(interp_1d, grad_1d, q_weight_1d, P_1d, Q_1d, dim, mass, laplace));
2144eaf62fffSJeremy L Thompson 
2145eaf62fffSJeremy L Thompson   // -- Diagonalize
21462b730f8bSJeremy L Thompson   CeedCall(CeedSimultaneousDiagonalization(ceed, laplace, mass, x, lambda, P_1d));
21472b730f8bSJeremy L Thompson   CeedCall(CeedFree(&mass));
21482b730f8bSJeremy L Thompson   CeedCall(CeedFree(&laplace));
21492b730f8bSJeremy L Thompson   for (CeedInt i = 0; i < P_1d; i++) {
21502b730f8bSJeremy L Thompson     for (CeedInt j = 0; j < P_1d; j++) fdm_interp[i + j * P_1d] = x[j + i * P_1d];
21512b730f8bSJeremy L Thompson   }
21522b730f8bSJeremy L Thompson   CeedCall(CeedFree(&x));
2153eaf62fffSJeremy L Thompson 
2154eaf62fffSJeremy L Thompson   // Assemble QFunction
2155eaf62fffSJeremy L Thompson   CeedVector          assembled;
2156eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_qf;
21572b730f8bSJeremy L Thompson   CeedCall(CeedOperatorLinearAssembleQFunctionBuildOrUpdate(op, &assembled, &rstr_qf, request));
2158eaf62fffSJeremy L Thompson   CeedInt layout[3];
21592b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionGetELayout(rstr_qf, &layout));
21602b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qf));
2161eaf62fffSJeremy L Thompson   CeedScalar max_norm = 0;
21622b730f8bSJeremy L Thompson   CeedCall(CeedVectorNorm(assembled, CEED_NORM_MAX, &max_norm));
2163eaf62fffSJeremy L Thompson 
2164eaf62fffSJeremy L Thompson   // Calculate element averages
2165eaf62fffSJeremy L Thompson   CeedInt           num_modes = (interp ? 1 : 0) + (grad ? dim : 0);
2166eaf62fffSJeremy L Thompson   CeedScalar       *elem_avg;
2167eaf62fffSJeremy L Thompson   const CeedScalar *assembled_array, *q_weight_array;
2168eaf62fffSJeremy L Thompson   CeedVector        q_weight;
21692b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed_parent, num_qpts, &q_weight));
21702b730f8bSJeremy L Thompson   CeedCall(CeedBasisApply(basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT, CEED_VECTOR_NONE, q_weight));
21712b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(assembled, CEED_MEM_HOST, &assembled_array));
21722b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayRead(q_weight, CEED_MEM_HOST, &q_weight_array));
21732b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_elem, &elem_avg));
2174eaf62fffSJeremy L Thompson   const CeedScalar qf_value_bound = max_norm * 100 * CEED_EPSILON;
2175eaf62fffSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
2176eaf62fffSJeremy L Thompson     CeedInt count = 0;
21772b730f8bSJeremy L Thompson     for (CeedInt q = 0; q < num_qpts; q++) {
21782b730f8bSJeremy L Thompson       for (CeedInt i = 0; i < num_comp * num_comp * num_modes * num_modes; i++) {
21792b730f8bSJeremy L Thompson         if (fabs(assembled_array[q * layout[0] + i * layout[1] + e * layout[2]]) > qf_value_bound) {
21802b730f8bSJeremy L Thompson           elem_avg[e] += assembled_array[q * layout[0] + i * layout[1] + e * layout[2]] / q_weight_array[q];
2181eaf62fffSJeremy L Thompson           count++;
2182eaf62fffSJeremy L Thompson         }
21832b730f8bSJeremy L Thompson       }
21842b730f8bSJeremy L Thompson     }
2185eaf62fffSJeremy L Thompson     if (count) {
2186eaf62fffSJeremy L Thompson       elem_avg[e] /= count;
2187eaf62fffSJeremy L Thompson     } else {
2188eaf62fffSJeremy L Thompson       elem_avg[e] = 1.0;
2189eaf62fffSJeremy L Thompson     }
2190eaf62fffSJeremy L Thompson   }
21912b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(assembled, &assembled_array));
21922b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&assembled));
21932b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArrayRead(q_weight, &q_weight_array));
21942b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_weight));
2195eaf62fffSJeremy L Thompson 
2196eaf62fffSJeremy L Thompson   // Build FDM diagonal
2197eaf62fffSJeremy L Thompson   CeedVector  q_data;
2198eaf62fffSJeremy L Thompson   CeedScalar *q_data_array, *fdm_diagonal;
21992b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(num_comp * elem_size, &fdm_diagonal));
2200eaf62fffSJeremy L Thompson   const CeedScalar fdm_diagonal_bound = elem_size * CEED_EPSILON;
22012b730f8bSJeremy L Thompson   for (CeedInt c = 0; c < num_comp; c++) {
2202eaf62fffSJeremy L Thompson     for (CeedInt n = 0; n < elem_size; n++) {
22032b730f8bSJeremy L Thompson       if (interp) fdm_diagonal[c * elem_size + n] = 1.0;
22042b730f8bSJeremy L Thompson       if (grad) {
2205eaf62fffSJeremy L Thompson         for (CeedInt d = 0; d < dim; d++) {
2206eaf62fffSJeremy L Thompson           CeedInt i = (n / CeedIntPow(P_1d, d)) % P_1d;
2207eaf62fffSJeremy L Thompson           fdm_diagonal[c * elem_size + n] += lambda[i];
2208eaf62fffSJeremy L Thompson         }
2209eaf62fffSJeremy L Thompson       }
22102b730f8bSJeremy L Thompson       if (fabs(fdm_diagonal[c * elem_size + n]) < fdm_diagonal_bound) fdm_diagonal[c * elem_size + n] = fdm_diagonal_bound;
22112b730f8bSJeremy L Thompson     }
22122b730f8bSJeremy L Thompson   }
22132b730f8bSJeremy L Thompson   CeedCall(CeedVectorCreate(ceed_parent, num_elem * num_comp * elem_size, &q_data));
22142b730f8bSJeremy L Thompson   CeedCall(CeedVectorSetValue(q_data, 0.0));
22152b730f8bSJeremy L Thompson   CeedCall(CeedVectorGetArrayWrite(q_data, CEED_MEM_HOST, &q_data_array));
22162b730f8bSJeremy L Thompson   for (CeedInt e = 0; e < num_elem; e++) {
22172b730f8bSJeremy L Thompson     for (CeedInt c = 0; c < num_comp; c++) {
22182b730f8bSJeremy L Thompson       for (CeedInt n = 0; n < elem_size; n++) q_data_array[(e * num_comp + c) * elem_size + n] = 1. / (elem_avg[e] * fdm_diagonal[c * elem_size + n]);
22192b730f8bSJeremy L Thompson     }
22202b730f8bSJeremy L Thompson   }
22212b730f8bSJeremy L Thompson   CeedCall(CeedFree(&elem_avg));
22222b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_diagonal));
22232b730f8bSJeremy L Thompson   CeedCall(CeedVectorRestoreArray(q_data, &q_data_array));
2224eaf62fffSJeremy L Thompson 
2225eaf62fffSJeremy L Thompson   // Setup FDM operator
2226eaf62fffSJeremy L Thompson   // -- Basis
2227eaf62fffSJeremy L Thompson   CeedBasis   fdm_basis;
2228eaf62fffSJeremy L Thompson   CeedScalar *grad_dummy, *q_ref_dummy, *q_weight_dummy;
22292b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d * P_1d, &grad_dummy));
22302b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_ref_dummy));
22312b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(P_1d, &q_weight_dummy));
22322b730f8bSJeremy L Thompson   CeedCall(CeedBasisCreateTensorH1(ceed_parent, dim, num_comp, P_1d, P_1d, fdm_interp, grad_dummy, q_ref_dummy, q_weight_dummy, &fdm_basis));
22332b730f8bSJeremy L Thompson   CeedCall(CeedFree(&fdm_interp));
22342b730f8bSJeremy L Thompson   CeedCall(CeedFree(&grad_dummy));
22352b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_ref_dummy));
22362b730f8bSJeremy L Thompson   CeedCall(CeedFree(&q_weight_dummy));
22372b730f8bSJeremy L Thompson   CeedCall(CeedFree(&lambda));
2238eaf62fffSJeremy L Thompson 
2239eaf62fffSJeremy L Thompson   // -- Restriction
2240eaf62fffSJeremy L Thompson   CeedElemRestriction rstr_qd_i;
2241eaf62fffSJeremy L Thompson   CeedInt             strides[3] = {1, elem_size, elem_size * num_comp};
22422b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionCreateStrided(ceed_parent, num_elem, elem_size, num_comp, num_elem * num_comp * elem_size, strides, &rstr_qd_i));
2243eaf62fffSJeremy L Thompson   // -- QFunction
2244eaf62fffSJeremy L Thompson   CeedQFunction qf_fdm;
22452b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionCreateInteriorByName(ceed_parent, "Scale", &qf_fdm));
22462b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "input", num_comp, CEED_EVAL_INTERP));
22472b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddInput(qf_fdm, "scale", num_comp, CEED_EVAL_NONE));
22482b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionAddOutput(qf_fdm, "output", num_comp, CEED_EVAL_INTERP));
22492b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetUserFlopsEstimate(qf_fdm, num_comp));
2250eaf62fffSJeremy L Thompson   // -- QFunction context
2251eaf62fffSJeremy L Thompson   CeedInt *num_comp_data;
22522b730f8bSJeremy L Thompson   CeedCall(CeedCalloc(1, &num_comp_data));
2253eaf62fffSJeremy L Thompson   num_comp_data[0] = num_comp;
2254eaf62fffSJeremy L Thompson   CeedQFunctionContext ctx_fdm;
22552b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextCreate(ceed, &ctx_fdm));
22562b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextSetData(ctx_fdm, CEED_MEM_HOST, CEED_OWN_POINTER, sizeof(*num_comp_data), num_comp_data));
22572b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionSetContext(qf_fdm, ctx_fdm));
22582b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionContextDestroy(&ctx_fdm));
2259eaf62fffSJeremy L Thompson   // -- Operator
22602b730f8bSJeremy L Thompson   CeedCall(CeedOperatorCreate(ceed_parent, qf_fdm, NULL, NULL, fdm_inv));
22612b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "input", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
22622b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "scale", rstr_qd_i, CEED_BASIS_COLLOCATED, q_data));
22632b730f8bSJeremy L Thompson   CeedCall(CeedOperatorSetField(*fdm_inv, "output", rstr, fdm_basis, CEED_VECTOR_ACTIVE));
2264eaf62fffSJeremy L Thompson 
2265eaf62fffSJeremy L Thompson   // Cleanup
22662b730f8bSJeremy L Thompson   CeedCall(CeedVectorDestroy(&q_data));
22672b730f8bSJeremy L Thompson   CeedCall(CeedBasisDestroy(&fdm_basis));
22682b730f8bSJeremy L Thompson   CeedCall(CeedElemRestrictionDestroy(&rstr_qd_i));
22692b730f8bSJeremy L Thompson   CeedCall(CeedQFunctionDestroy(&qf_fdm));
2270eaf62fffSJeremy L Thompson 
2271eaf62fffSJeremy L Thompson   return CEED_ERROR_SUCCESS;
2272eaf62fffSJeremy L Thompson }
2273eaf62fffSJeremy L Thompson 
2274eaf62fffSJeremy L Thompson /// @}
2275