xref: /honee/src/spanstats/spanstats.c (revision dae7673a5083879fe11419a8756d38cb937fd63d) !
1*dae7673aSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors.
2*dae7673aSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause
3*dae7673aSJames Wright /// @file
4*dae7673aSJames Wright /// Functions for setting up and performing spanwise-statistics collection
5*dae7673aSJames Wright ///
6*dae7673aSJames Wright /// "Parent" refers to the 2D plane on which statistics are collected *onto*.
7*dae7673aSJames Wright /// "Child" refers to the 3D domain where statistics are gathered *from*.
8*dae7673aSJames Wright /// Each quadrature point on the parent plane has several children in the child domain that it performs spanwise averaging with.
9*dae7673aSJames Wright 
10*dae7673aSJames Wright #include <ceed.h>
11*dae7673aSJames Wright #include <petscdmplex.h>
12*dae7673aSJames Wright #include <petscsf.h>
13*dae7673aSJames Wright #include <spanstats.h>
14*dae7673aSJames Wright 
15*dae7673aSJames Wright #include <navierstokes.h>
16*dae7673aSJames Wright #include <petsc_ops.h>
17*dae7673aSJames Wright 
18*dae7673aSJames Wright PetscErrorCode SpanStatsCtxDestroy(void **ctx) {
19*dae7673aSJames Wright   SpanStatsCtx spanstats = *(SpanStatsCtx *)ctx;
20*dae7673aSJames Wright 
21*dae7673aSJames Wright   PetscFunctionBeginUser;
22*dae7673aSJames Wright   if (spanstats == NULL) PetscFunctionReturn(PETSC_SUCCESS);
23*dae7673aSJames Wright   PetscCall(VecDestroy(&spanstats->Child_Stats_loc));
24*dae7673aSJames Wright   PetscCall(VecDestroy(&spanstats->Parent_Stats_loc));
25*dae7673aSJames Wright 
26*dae7673aSJames Wright   PetscCall(OperatorApplyContextDestroy(spanstats->op_stats_collect_ctx));
27*dae7673aSJames Wright   PetscCall(OperatorApplyContextDestroy(spanstats->op_proj_rhs_ctx));
28*dae7673aSJames Wright   PetscCall(OperatorApplyContextDestroy(spanstats->mms_error_ctx));
29*dae7673aSJames Wright 
30*dae7673aSJames Wright   PetscCall(KSPDestroy(&spanstats->ksp));
31*dae7673aSJames Wright   PetscCall(PetscSFDestroy(&spanstats->sf));
32*dae7673aSJames Wright   PetscCall(DMDestroy(&spanstats->dm));
33*dae7673aSJames Wright   PetscCall(PetscFree(spanstats->prefix));
34*dae7673aSJames Wright   PetscCall(PetscFree(spanstats));
35*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
36*dae7673aSJames Wright }
37*dae7673aSJames Wright 
38*dae7673aSJames Wright static PetscErrorCode SpanwiseStatisticssCreateDM(Honee honee, SpanStatsCtx spanstats, PetscInt degree, PetscInt num_comps) {
39*dae7673aSJames Wright   PetscReal     domain_min[3], domain_max[3];
40*dae7673aSJames Wright   PetscLogStage stage_stats_setup;
41*dae7673aSJames Wright   MPI_Comm      comm = PetscObjectComm((PetscObject)honee->dm);
42*dae7673aSJames Wright 
43*dae7673aSJames Wright   PetscFunctionBeginUser;
44*dae7673aSJames Wright   PetscCall(PetscLogStageGetId("Stats Setup", &stage_stats_setup));
45*dae7673aSJames Wright   if (stage_stats_setup == -1) PetscCall(PetscLogStageRegister("Stats Setup", &stage_stats_setup));
46*dae7673aSJames Wright   PetscCall(PetscLogStagePush(stage_stats_setup));
47*dae7673aSJames Wright 
48*dae7673aSJames Wright   spanstats->num_comp_stats = num_comps;
49*dae7673aSJames Wright 
50*dae7673aSJames Wright   // Get spanwise length
51*dae7673aSJames Wright   PetscCall(DMGetBoundingBox(honee->dm, domain_min, domain_max));
52*dae7673aSJames Wright   spanstats->span_width = domain_max[2] - domain_min[2];
53*dae7673aSJames Wright 
54*dae7673aSJames Wright   {  // Get DM from surface
55*dae7673aSJames Wright     DM             parent_distributed_dm;
56*dae7673aSJames Wright     const PetscSF *isoperiodicface;
57*dae7673aSJames Wright     PetscInt       num_isoperiodicface;
58*dae7673aSJames Wright     DMLabel        label;
59*dae7673aSJames Wright     PetscMPIInt    size;
60*dae7673aSJames Wright 
61*dae7673aSJames Wright     PetscCall(DMPlexGetIsoperiodicFaceSF(honee->dm, &num_isoperiodicface, &isoperiodicface));
62*dae7673aSJames Wright 
63*dae7673aSJames Wright     if (isoperiodicface) {
64*dae7673aSJames Wright       PetscSF         inv_isoperiodicface;
65*dae7673aSJames Wright       PetscInt        nleaves, isoperiodicface_index = -1;
66*dae7673aSJames Wright       const PetscInt *ilocal;
67*dae7673aSJames Wright       char            isoperiodicface_key[1024];
68*dae7673aSJames Wright 
69*dae7673aSJames Wright       PetscCall(PetscSNPrintf(isoperiodicface_key, sizeof isoperiodicface_key, "-%sisoperiodic_facesf", spanstats->prefix));
70*dae7673aSJames Wright       PetscCall(PetscOptionsGetInt(NULL, NULL, isoperiodicface_key, &isoperiodicface_index, NULL));
71*dae7673aSJames Wright       isoperiodicface_index = isoperiodicface_index == -1 ? num_isoperiodicface - 1 : isoperiodicface_index;
72*dae7673aSJames Wright       PetscCall(PetscSFCreateInverseSF(isoperiodicface[isoperiodicface_index], &inv_isoperiodicface));
73*dae7673aSJames Wright       PetscCall(PetscSFGetGraph(inv_isoperiodicface, NULL, &nleaves, &ilocal, NULL));
74*dae7673aSJames Wright       PetscCall(DMCreateLabel(honee->dm, "Periodic Face"));
75*dae7673aSJames Wright       PetscCall(DMGetLabel(honee->dm, "Periodic Face", &label));
76*dae7673aSJames Wright       for (PetscInt i = 0; i < nleaves; i++) {
77*dae7673aSJames Wright         PetscCall(DMLabelSetValue(label, ilocal[i], 1));
78*dae7673aSJames Wright       }
79*dae7673aSJames Wright       PetscCall(PetscSFDestroy(&inv_isoperiodicface));
80*dae7673aSJames Wright     } else {
81*dae7673aSJames Wright       PetscCall(DMGetLabel(honee->dm, "Face Sets", &label));
82*dae7673aSJames Wright     }
83*dae7673aSJames Wright 
84*dae7673aSJames Wright     PetscCall(DMPlexLabelComplete(honee->dm, label));
85*dae7673aSJames Wright     PetscCall(DMPlexFilter(honee->dm, label, 1, PETSC_FALSE, PETSC_FALSE, NULL, &spanstats->dm));
86*dae7673aSJames Wright     PetscCall(DMSetCoordinateDisc(spanstats->dm, NULL, PETSC_FALSE, PETSC_TRUE));  // Ensure that a coordinate FE exists
87*dae7673aSJames Wright 
88*dae7673aSJames Wright     PetscCall(DMPlexDistribute(spanstats->dm, 0, NULL, &parent_distributed_dm));
89*dae7673aSJames Wright     PetscCallMPI(MPI_Comm_size(comm, &size));
90*dae7673aSJames Wright     if (parent_distributed_dm) {
91*dae7673aSJames Wright       PetscCall(DMDestroy(&spanstats->dm));
92*dae7673aSJames Wright       spanstats->dm = parent_distributed_dm;
93*dae7673aSJames Wright     } else if (size > 1) {
94*dae7673aSJames Wright       PetscCall(PetscPrintf(comm, "WARNING: Spanwise statistics: parent DM could not be distributed accross %d ranks.\n", size));
95*dae7673aSJames Wright     }
96*dae7673aSJames Wright   }
97*dae7673aSJames Wright   {
98*dae7673aSJames Wright     PetscBool is_simplex = PETSC_FALSE;
99*dae7673aSJames Wright     PetscCall(DMPlexIsSimplex(spanstats->dm, &is_simplex));
100*dae7673aSJames Wright     PetscCheck(is_simplex != PETSC_TRUE, comm, PETSC_ERR_ARG_WRONGSTATE, "Spanwise statistics is not implemented for non-tensor product grids");
101*dae7673aSJames Wright   }
102*dae7673aSJames Wright 
103*dae7673aSJames Wright   PetscCall(PetscObjectSetName((PetscObject)spanstats->dm, "Spanwise_Stats"));
104*dae7673aSJames Wright   PetscCall(DMSetOptionsPrefix(spanstats->dm, spanstats->prefix));
105*dae7673aSJames Wright   PetscCall(DMSetFromOptions(spanstats->dm));
106*dae7673aSJames Wright   PetscCall(DMViewFromOptions(spanstats->dm, NULL, "-dm_view"));
107*dae7673aSJames Wright 
108*dae7673aSJames Wright   // Create FE space for parent DM
109*dae7673aSJames Wright   PetscCall(
110*dae7673aSJames Wright       DMSetupByOrder_FEM(PETSC_TRUE, PETSC_TRUE, honee->app_ctx->degree, 1, honee->app_ctx->q_extra, 1, &spanstats->num_comp_stats, spanstats->dm));
111*dae7673aSJames Wright 
112*dae7673aSJames Wright   PetscCall(PetscLogStagePop());
113*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
114*dae7673aSJames Wright }
115*dae7673aSJames Wright 
116*dae7673aSJames Wright /** @brief Create CeedElemRestriction for collocated data in component-major order.
117*dae7673aSJames Wright a. Sets the strides of the restriction to component-major order
118*dae7673aSJames Wright  Number of quadrature points is used from the CeedBasis, and number of elements is used from the CeedElemRestriction.
119*dae7673aSJames Wright */
120*dae7673aSJames Wright static PetscErrorCode CreateElemRestrColloc_CompMajor(Ceed ceed, CeedInt num_comp, CeedBasis basis, CeedElemRestriction elem_restr_base,
121*dae7673aSJames Wright                                                       CeedElemRestriction *elem_restr_collocated) {
122*dae7673aSJames Wright   CeedInt num_elem_qpts, loc_num_elem;
123*dae7673aSJames Wright 
124*dae7673aSJames Wright   PetscFunctionBeginUser;
125*dae7673aSJames Wright   PetscCallCeed(ceed, CeedBasisGetNumQuadraturePoints(basis, &num_elem_qpts));
126*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionGetNumElements(elem_restr_base, &loc_num_elem));
127*dae7673aSJames Wright 
128*dae7673aSJames Wright   const CeedInt strides[] = {num_comp, 1, num_elem_qpts * num_comp};
129*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionCreateStrided(ceed, loc_num_elem, num_elem_qpts, num_comp, num_comp * loc_num_elem * num_elem_qpts, strides,
130*dae7673aSJames Wright                                                        elem_restr_collocated));
131*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
132*dae7673aSJames Wright }
133*dae7673aSJames Wright 
134*dae7673aSJames Wright // Get coordinates of quadrature points
135*dae7673aSJames Wright static PetscErrorCode GetQuadratureCoords(Ceed ceed, DM dm, CeedElemRestriction elem_restr_x, CeedBasis basis_x, CeedVector x_coords, Vec *Qx_coords,
136*dae7673aSJames Wright                                           PetscInt *total_nqpnts) {
137*dae7673aSJames Wright   CeedElemRestriction  elem_restr_qx;
138*dae7673aSJames Wright   CeedQFunction        qf_quad_coords;
139*dae7673aSJames Wright   CeedOperator         op_quad_coords;
140*dae7673aSJames Wright   CeedInt              num_comp_x;
141*dae7673aSJames Wright   CeedSize             l_vec_size;
142*dae7673aSJames Wright   OperatorApplyContext op_quad_coords_ctx;
143*dae7673aSJames Wright 
144*dae7673aSJames Wright   PetscFunctionBeginUser;
145*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(elem_restr_x, &num_comp_x));
146*dae7673aSJames Wright   PetscCall(CreateElemRestrColloc_CompMajor(ceed, num_comp_x, basis_x, elem_restr_x, &elem_restr_qx));
147*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionGetLVectorSize(elem_restr_qx, &l_vec_size));
148*dae7673aSJames Wright   *total_nqpnts = l_vec_size / num_comp_x;
149*dae7673aSJames Wright 
150*dae7673aSJames Wright   // Create QFunction
151*dae7673aSJames Wright   PetscCallCeed(ceed, CeedQFunctionCreateIdentity(ceed, num_comp_x, CEED_EVAL_INTERP, CEED_EVAL_NONE, &qf_quad_coords));
152*dae7673aSJames Wright 
153*dae7673aSJames Wright   // Create Operator
154*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_quad_coords, NULL, NULL, &op_quad_coords));
155*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorSetField(op_quad_coords, "input", elem_restr_x, basis_x, x_coords));
156*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorSetField(op_quad_coords, "output", elem_restr_qx, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
157*dae7673aSJames Wright 
158*dae7673aSJames Wright   PetscCall(CeedOperatorCreateLocalVecs(op_quad_coords, DMReturnVecType(dm), PETSC_COMM_SELF, NULL, Qx_coords));
159*dae7673aSJames Wright   PetscCall(OperatorApplyContextCreate(NULL, NULL, ceed, op_quad_coords, CEED_VECTOR_NONE, NULL, NULL, NULL, &op_quad_coords_ctx));
160*dae7673aSJames Wright 
161*dae7673aSJames Wright   PetscCall(ApplyCeedOperatorLocalToLocal(NULL, *Qx_coords, op_quad_coords_ctx));
162*dae7673aSJames Wright 
163*dae7673aSJames Wright   PetscCall(OperatorApplyContextDestroy(op_quad_coords_ctx));
164*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_qx));
165*dae7673aSJames Wright   PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_quad_coords));
166*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorDestroy(&op_quad_coords));
167*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
168*dae7673aSJames Wright }
169*dae7673aSJames Wright 
170*dae7673aSJames Wright static PetscErrorCode SpanwiseStatisticsSetupDataCreate(Honee honee, SpanStatsCtx spanstats, SpanStatsSetupData *stats_setup_data) {
171*dae7673aSJames Wright   Ceed     ceed = honee->ceed;
172*dae7673aSJames Wright   DM       dm   = spanstats->dm;
173*dae7673aSJames Wright   Vec      X_loc;
174*dae7673aSJames Wright   DMLabel  domain_label = NULL;
175*dae7673aSJames Wright   CeedInt  num_comp_x, num_comp_stats = spanstats->num_comp_stats;
176*dae7673aSJames Wright   PetscInt label_value = 0, height = 0, dm_field = 0;
177*dae7673aSJames Wright 
178*dae7673aSJames Wright   PetscFunctionBeginUser;
179*dae7673aSJames Wright   PetscCall(PetscNew(stats_setup_data));
180*dae7673aSJames Wright 
181*dae7673aSJames Wright   PetscCall(DMPlexCeedElemRestrictionCreate(ceed, dm, domain_label, label_value, height, dm_field, &(*stats_setup_data)->elem_restr_parent_stats));
182*dae7673aSJames Wright   PetscCall(DMPlexCeedElemRestrictionCoordinateCreate(ceed, dm, domain_label, label_value, height, &(*stats_setup_data)->elem_restr_parent_x));
183*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents((*stats_setup_data)->elem_restr_parent_x, &num_comp_x));
184*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionCreateVector((*stats_setup_data)->elem_restr_parent_x, &(*stats_setup_data)->x_coord, NULL));
185*dae7673aSJames Wright 
186*dae7673aSJames Wright   {
187*dae7673aSJames Wright     DM dm_coord;
188*dae7673aSJames Wright     PetscCall(DMGetCoordinateDM(dm, &dm_coord));
189*dae7673aSJames Wright     PetscCall(CreateBasisFromPlex(ceed, dm_coord, domain_label, label_value, height, dm_field, &(*stats_setup_data)->basis_x));
190*dae7673aSJames Wright     PetscCall(CreateBasisFromPlex(ceed, dm, domain_label, label_value, height, dm_field, &(*stats_setup_data)->basis_stats));
191*dae7673aSJames Wright   }
192*dae7673aSJames Wright 
193*dae7673aSJames Wright   PetscCall(CreateElemRestrColloc_CompMajor(ceed, num_comp_stats, (*stats_setup_data)->basis_stats, (*stats_setup_data)->elem_restr_parent_stats,
194*dae7673aSJames Wright                                             &(*stats_setup_data)->elem_restr_parent_colloc));
195*dae7673aSJames Wright   PetscCall(
196*dae7673aSJames Wright       CreateElemRestrColloc_CompMajor(ceed, num_comp_stats, honee->basis_q, honee->elem_restr_q, &(*stats_setup_data)->elem_restr_child_colloc));
197*dae7673aSJames Wright 
198*dae7673aSJames Wright   {  // -- Copy DM coordinates into CeedVector
199*dae7673aSJames Wright     DM cdm;
200*dae7673aSJames Wright     PetscCall(DMGetCellCoordinateDM(dm, &cdm));
201*dae7673aSJames Wright     if (cdm) {
202*dae7673aSJames Wright       PetscCall(DMGetCellCoordinatesLocal(dm, &X_loc));
203*dae7673aSJames Wright     } else {
204*dae7673aSJames Wright       PetscCall(DMGetCoordinatesLocal(dm, &X_loc));
205*dae7673aSJames Wright     }
206*dae7673aSJames Wright   }
207*dae7673aSJames Wright   PetscCall(VecScale(X_loc, honee->units->meter));
208*dae7673aSJames Wright   PetscCall(VecCopyPetscToCeed(X_loc, (*stats_setup_data)->x_coord));
209*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
210*dae7673aSJames Wright }
211*dae7673aSJames Wright 
212*dae7673aSJames Wright static PetscErrorCode SpanwiseStatisticsSetupDataDestroy(SpanStatsSetupData data) {
213*dae7673aSJames Wright   Ceed ceed;
214*dae7673aSJames Wright 
215*dae7673aSJames Wright   PetscFunctionBeginUser;
216*dae7673aSJames Wright   PetscCall(CeedElemRestrictionGetCeed(data->elem_restr_parent_x, &ceed));
217*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&data->elem_restr_parent_x));
218*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&data->elem_restr_parent_stats));
219*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&data->elem_restr_parent_colloc));
220*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&data->elem_restr_child_colloc));
221*dae7673aSJames Wright   PetscCallCeed(ceed, CeedBasisDestroy(&data->basis_x));
222*dae7673aSJames Wright   PetscCallCeed(ceed, CeedBasisDestroy(&data->basis_stats));
223*dae7673aSJames Wright   PetscCallCeed(ceed, CeedVectorDestroy(&data->x_coord));
224*dae7673aSJames Wright   PetscCall(PetscFree(data));
225*dae7673aSJames Wright   PetscCheck(CeedDestroy(&ceed) == CEED_ERROR_SUCCESS, PETSC_COMM_SELF, PETSC_ERR_LIB, "Destroying Ceed object failed");
226*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
227*dae7673aSJames Wright }
228*dae7673aSJames Wright 
229*dae7673aSJames Wright // Create PetscSF for child-to-parent communication
230*dae7673aSJames Wright static PetscErrorCode SpanwiseStatisticsCreateSF(Honee honee, SpanStatsSetupData stats_setup_data, DM parentdm, DM childdm, PetscSF *statssf) {
231*dae7673aSJames Wright   Ceed     ceed = honee->ceed;
232*dae7673aSJames Wright   PetscInt child_num_qpnts, parent_num_qpnts;
233*dae7673aSJames Wright   CeedInt  num_comp_x;
234*dae7673aSJames Wright   Vec      Child_qx_coords, Parent_qx_coords;
235*dae7673aSJames Wright 
236*dae7673aSJames Wright   PetscFunctionBeginUser;
237*dae7673aSJames Wright   PetscCall(PetscSFCreate(PetscObjectComm((PetscObject)childdm), statssf));
238*dae7673aSJames Wright 
239*dae7673aSJames Wright   // Assume that child and parent have the same number of components
240*dae7673aSJames Wright   PetscCallCeed(ceed, CeedBasisGetNumComponents(honee->basis_x, &num_comp_x));
241*dae7673aSJames Wright   const PetscInt num_comp_sf = num_comp_x - 1;  // Number of coord components used in the creation of the SF
242*dae7673aSJames Wright 
243*dae7673aSJames Wright   // Get quad_coords for child and parent DM
244*dae7673aSJames Wright   PetscCall(GetQuadratureCoords(ceed, childdm, honee->elem_restr_x, honee->basis_x, honee->x_coord, &Child_qx_coords, &child_num_qpnts));
245*dae7673aSJames Wright   PetscCall(GetQuadratureCoords(ceed, parentdm, stats_setup_data->elem_restr_parent_x, stats_setup_data->basis_x, stats_setup_data->x_coord,
246*dae7673aSJames Wright                                 &Parent_qx_coords, &parent_num_qpnts));
247*dae7673aSJames Wright 
248*dae7673aSJames Wright   {  // Remove z component of coordinates for matching
249*dae7673aSJames Wright     const PetscReal *child_quad_coords, *parent_quad_coords;
250*dae7673aSJames Wright     PetscReal       *child_coords, *parent_coords;
251*dae7673aSJames Wright 
252*dae7673aSJames Wright     PetscCall(VecGetArrayRead(Child_qx_coords, &child_quad_coords));
253*dae7673aSJames Wright     PetscCall(VecGetArrayRead(Parent_qx_coords, &parent_quad_coords));
254*dae7673aSJames Wright 
255*dae7673aSJames Wright     PetscCall(PetscMalloc2(child_num_qpnts * 2, &child_coords, parent_num_qpnts * 2, &parent_coords));
256*dae7673aSJames Wright     for (int i = 0; i < child_num_qpnts; i++) {
257*dae7673aSJames Wright       child_coords[0 + i * num_comp_sf] = child_quad_coords[0 + i * num_comp_x];
258*dae7673aSJames Wright       child_coords[1 + i * num_comp_sf] = child_quad_coords[1 + i * num_comp_x];
259*dae7673aSJames Wright     }
260*dae7673aSJames Wright     for (int i = 0; i < parent_num_qpnts; i++) {
261*dae7673aSJames Wright       parent_coords[0 + i * num_comp_sf] = parent_quad_coords[0 + i * num_comp_x];
262*dae7673aSJames Wright       parent_coords[1 + i * num_comp_sf] = parent_quad_coords[1 + i * num_comp_x];
263*dae7673aSJames Wright     }
264*dae7673aSJames Wright     PetscCall(VecRestoreArrayRead(Child_qx_coords, &child_quad_coords));
265*dae7673aSJames Wright     PetscCall(VecRestoreArrayRead(Parent_qx_coords, &parent_quad_coords));
266*dae7673aSJames Wright 
267*dae7673aSJames Wright     PetscCall(PetscSFSetGraphFromCoordinates(*statssf, parent_num_qpnts, child_num_qpnts, num_comp_sf, 1e-12, parent_coords, child_coords));
268*dae7673aSJames Wright     PetscCall(PetscFree2(child_coords, parent_coords));
269*dae7673aSJames Wright   }
270*dae7673aSJames Wright 
271*dae7673aSJames Wright   PetscCall(PetscSFViewFromOptions(*statssf, NULL, "-spanstats_sf_view"));
272*dae7673aSJames Wright 
273*dae7673aSJames Wright   PetscCall(VecDestroy(&Child_qx_coords));
274*dae7673aSJames Wright   PetscCall(VecDestroy(&Parent_qx_coords));
275*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
276*dae7673aSJames Wright }
277*dae7673aSJames Wright 
278*dae7673aSJames Wright // @brief Setup RHS and LHS for L^2 projection of statistics
279*dae7673aSJames Wright static PetscErrorCode SpanwiseStatisticsSetupL2Projection(Honee honee, SpanStatsCtx spanstats, SpanStatsSetupData stats_setup_data) {
280*dae7673aSJames Wright   Ceed                ceed = honee->ceed;
281*dae7673aSJames Wright   CeedOperator        op_mass, op_proj_rhs;
282*dae7673aSJames Wright   CeedQFunction       qf_mass, qf_stats_proj;
283*dae7673aSJames Wright   CeedInt             q_data_size, num_comp_stats = spanstats->num_comp_stats;
284*dae7673aSJames Wright   CeedElemRestriction elem_restr_qd;
285*dae7673aSJames Wright   CeedVector          q_data;
286*dae7673aSJames Wright   DMLabel             domain_label = NULL;
287*dae7673aSJames Wright   PetscInt            label_value  = 0;
288*dae7673aSJames Wright 
289*dae7673aSJames Wright   PetscFunctionBeginUser;
290*dae7673aSJames Wright   // -- Create Operator for RHS of L^2 projection of statistics
291*dae7673aSJames Wright   // Simply take collocated parent data (with quadrature weight already applied) and multiply by weight function.
292*dae7673aSJames Wright   // Therefore, an Identity QF is sufficient
293*dae7673aSJames Wright   PetscCallCeed(ceed, CeedQFunctionCreateIdentity(ceed, num_comp_stats, CEED_EVAL_NONE, CEED_EVAL_INTERP, &qf_stats_proj));
294*dae7673aSJames Wright 
295*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_stats_proj, NULL, NULL, &op_proj_rhs));
296*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorSetField(op_proj_rhs, "input", stats_setup_data->elem_restr_parent_colloc, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
297*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorSetField(op_proj_rhs, "output", stats_setup_data->elem_restr_parent_stats, stats_setup_data->basis_stats,
298*dae7673aSJames Wright                                            CEED_VECTOR_ACTIVE));
299*dae7673aSJames Wright 
300*dae7673aSJames Wright   PetscCall(OperatorApplyContextCreate(NULL, spanstats->dm, ceed, op_proj_rhs, NULL, NULL, NULL, NULL, &spanstats->op_proj_rhs_ctx));
301*dae7673aSJames Wright   PetscCall(CeedOperatorCreateLocalVecs(op_proj_rhs, DMReturnVecType(spanstats->dm), PETSC_COMM_SELF, &spanstats->Parent_Stats_loc, NULL));
302*dae7673aSJames Wright   PetscCall(QDataGet(ceed, spanstats->dm, domain_label, label_value, stats_setup_data->elem_restr_parent_x, stats_setup_data->basis_x,
303*dae7673aSJames Wright                      stats_setup_data->x_coord, &elem_restr_qd, &q_data, &q_data_size));
304*dae7673aSJames Wright 
305*dae7673aSJames Wright   // Create Mass CeedOperator
306*dae7673aSJames Wright   PetscCall(HoneeMassQFunctionCreate(ceed, num_comp_stats, q_data_size, &qf_mass));
307*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_mass, NULL, NULL, &op_mass));
308*dae7673aSJames Wright   PetscCallCeed(ceed,
309*dae7673aSJames Wright                 CeedOperatorSetField(op_mass, "u", stats_setup_data->elem_restr_parent_stats, stats_setup_data->basis_stats, CEED_VECTOR_ACTIVE));
310*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorSetField(op_mass, "qdata", elem_restr_qd, CEED_BASIS_NONE, q_data));
311*dae7673aSJames Wright   PetscCallCeed(ceed,
312*dae7673aSJames Wright                 CeedOperatorSetField(op_mass, "v", stats_setup_data->elem_restr_parent_stats, stats_setup_data->basis_stats, CEED_VECTOR_ACTIVE));
313*dae7673aSJames Wright 
314*dae7673aSJames Wright   {  // Setup KSP for L^2 projection
315*dae7673aSJames Wright     Mat mat_mass;
316*dae7673aSJames Wright     KSP ksp;
317*dae7673aSJames Wright 
318*dae7673aSJames Wright     PetscCall(MatCreateCeed(spanstats->dm, spanstats->dm, op_mass, NULL, &mat_mass));
319*dae7673aSJames Wright 
320*dae7673aSJames Wright     PetscCall(KSPCreate(PetscObjectComm((PetscObject)spanstats->dm), &ksp));
321*dae7673aSJames Wright     PetscCall(KSPSetOptionsPrefix(ksp, spanstats->prefix));
322*dae7673aSJames Wright     {
323*dae7673aSJames Wright       PC pc;
324*dae7673aSJames Wright       PetscCall(KSPGetPC(ksp, &pc));
325*dae7673aSJames Wright       PetscCall(PCSetType(pc, PCJACOBI));
326*dae7673aSJames Wright       PetscCall(PCJacobiSetType(pc, PC_JACOBI_DIAGONAL));
327*dae7673aSJames Wright       PetscCall(KSPSetType(ksp, KSPCG));
328*dae7673aSJames Wright       PetscCall(KSPSetNormType(ksp, KSP_NORM_NATURAL));
329*dae7673aSJames Wright       PetscCall(KSPSetTolerances(ksp, 1e-10, PETSC_DEFAULT, PETSC_DEFAULT, PETSC_DEFAULT));
330*dae7673aSJames Wright     }
331*dae7673aSJames Wright     PetscCall(KSPSetFromOptions_WithMatCeed(ksp, mat_mass));
332*dae7673aSJames Wright     spanstats->ksp = ksp;
333*dae7673aSJames Wright     PetscCall(MatDestroy(&mat_mass));
334*dae7673aSJames Wright   }
335*dae7673aSJames Wright 
336*dae7673aSJames Wright   PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_qd));
337*dae7673aSJames Wright   PetscCallCeed(ceed, CeedVectorDestroy(&q_data));
338*dae7673aSJames Wright   PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_mass));
339*dae7673aSJames Wright   PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_stats_proj));
340*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorDestroy(&op_mass));
341*dae7673aSJames Wright   PetscCallCeed(ceed, CeedOperatorDestroy(&op_proj_rhs));
342*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
343*dae7673aSJames Wright }
344*dae7673aSJames Wright 
345*dae7673aSJames Wright PetscErrorCode SpanwiseStatisticsSetupInitialize(Honee honee, PetscInt degree, PetscInt num_comps, const char *prefix,
346*dae7673aSJames Wright                                                  SpanStatsSetupData *stats_setup_data, SpanStatsCtx *spanstats_new) {
347*dae7673aSJames Wright   PetscLogStage stage_stats_setup;
348*dae7673aSJames Wright   SpanStatsCtx  spanstats;
349*dae7673aSJames Wright 
350*dae7673aSJames Wright   PetscFunctionBeginUser;
351*dae7673aSJames Wright   PetscCall(PetscLogStageGetId("Stats Setup", &stage_stats_setup));
352*dae7673aSJames Wright   if (stage_stats_setup == -1) PetscCall(PetscLogStageRegister("Stats Setup", &stage_stats_setup));
353*dae7673aSJames Wright   PetscCall(PetscLogStagePush(stage_stats_setup));
354*dae7673aSJames Wright 
355*dae7673aSJames Wright   PetscCall(PetscNew(&spanstats));
356*dae7673aSJames Wright   PetscCall(PetscStrallocpy(prefix, &spanstats->prefix));
357*dae7673aSJames Wright 
358*dae7673aSJames Wright   spanstats->collect_interval = 1;
359*dae7673aSJames Wright   PetscCall(PetscOptionsGetInt(NULL, prefix, "-collect_interval", &spanstats->collect_interval, NULL));
360*dae7673aSJames Wright 
361*dae7673aSJames Wright   // Create parent DM
362*dae7673aSJames Wright   PetscCall(SpanwiseStatisticssCreateDM(honee, spanstats, degree, num_comps));
363*dae7673aSJames Wright 
364*dae7673aSJames Wright   // Create necessary CeedObjects for setting up statistics
365*dae7673aSJames Wright   PetscCall(SpanwiseStatisticsSetupDataCreate(honee, spanstats, stats_setup_data));
366*dae7673aSJames Wright   //
367*dae7673aSJames Wright   // Create SF for communicating child data back their respective parents
368*dae7673aSJames Wright   PetscCall(SpanwiseStatisticsCreateSF(honee, *stats_setup_data, honee->dm, spanstats->dm, &spanstats->sf));
369*dae7673aSJames Wright 
370*dae7673aSJames Wright   *spanstats_new = spanstats;
371*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
372*dae7673aSJames Wright }
373*dae7673aSJames Wright 
374*dae7673aSJames Wright PetscErrorCode SpanwiseStatisticsSetupFinalize(TS ts, Honee honee, SpanStatsCtx spanstats, PetscViewerAndFormat *ctx,
375*dae7673aSJames Wright                                                SpanStatsSetupData *stats_setup_data) {
376*dae7673aSJames Wright   PetscFunctionBeginUser;
377*dae7673aSJames Wright   // Setup KSP and Mat for L^2 projection of statistics
378*dae7673aSJames Wright   PetscCall(SpanwiseStatisticsSetupL2Projection(honee, spanstats, *stats_setup_data));
379*dae7673aSJames Wright 
380*dae7673aSJames Wright   PetscCall(PetscViewerSetOptionsPrefix(ctx->viewer, spanstats->prefix));
381*dae7673aSJames Wright   PetscCall(PetscViewerSetFromOptions(ctx->viewer));
382*dae7673aSJames Wright 
383*dae7673aSJames Wright   PetscCall(TSGetTime(ts, &spanstats->initial_solution_time));
384*dae7673aSJames Wright   PetscCall(TSGetStepNumber(ts, &spanstats->initial_solution_step));
385*dae7673aSJames Wright   CeedScalar initial_solution_time = spanstats->initial_solution_time;  // done for type conversion
386*dae7673aSJames Wright   PetscCallCeed(honee->ceed,
387*dae7673aSJames Wright                 CeedOperatorSetContextDouble(spanstats->op_stats_collect_ctx->op, spanstats->previous_time_label, &initial_solution_time));
388*dae7673aSJames Wright 
389*dae7673aSJames Wright   PetscCall(SpanwiseStatisticsSetupDataDestroy(*stats_setup_data));
390*dae7673aSJames Wright   PetscCall(PetscLogStagePop());
391*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
392*dae7673aSJames Wright }
393*dae7673aSJames Wright 
394*dae7673aSJames Wright // Collect statistics based on the solution Q
395*dae7673aSJames Wright PetscErrorCode SpanwiseStatisticsCollect(Honee honee, SpanStatsCtx spanstats, PetscScalar solution_time, Vec Q) {
396*dae7673aSJames Wright   PetscFunctionBeginUser;
397*dae7673aSJames Wright   PetscLogStage stage_stats_collect;
398*dae7673aSJames Wright   PetscCall(PetscLogStageGetId("Stats Collect", &stage_stats_collect));
399*dae7673aSJames Wright   if (stage_stats_collect == -1) PetscCall(PetscLogStageRegister("Stats Collect", &stage_stats_collect));
400*dae7673aSJames Wright   PetscCall(PetscLogStagePush(stage_stats_collect));
401*dae7673aSJames Wright 
402*dae7673aSJames Wright   PetscCall(UpdateBoundaryValues(honee, honee->Q_loc, solution_time));
403*dae7673aSJames Wright   PetscCallCeed(honee->ceed, CeedOperatorSetContextDouble(spanstats->op_stats_collect_ctx->op, spanstats->solution_time_label, &solution_time));
404*dae7673aSJames Wright   PetscCall(DMGlobalToLocal(honee->dm, Q, INSERT_VALUES, honee->Q_loc));
405*dae7673aSJames Wright   PetscCall(ApplyAddCeedOperatorLocalToLocal(honee->Q_loc, spanstats->Child_Stats_loc, spanstats->op_stats_collect_ctx));
406*dae7673aSJames Wright 
407*dae7673aSJames Wright   PetscCallCeed(honee->ceed, CeedOperatorSetContextDouble(spanstats->op_stats_collect_ctx->op, spanstats->previous_time_label, &solution_time));
408*dae7673aSJames Wright 
409*dae7673aSJames Wright   PetscCall(PetscLogStagePop());
410*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
411*dae7673aSJames Wright }
412*dae7673aSJames Wright 
413*dae7673aSJames Wright // Process the child statistics into parent statistics and project them onto stats
414*dae7673aSJames Wright PetscErrorCode SpanwiseStatisticsProcess(Honee honee, SpanStatsCtx spanstats, Vec stats) {
415*dae7673aSJames Wright   const PetscScalar *child_stats;
416*dae7673aSJames Wright   PetscScalar       *parent_stats;
417*dae7673aSJames Wright   MPI_Datatype       unit;
418*dae7673aSJames Wright   Vec                RHS;
419*dae7673aSJames Wright 
420*dae7673aSJames Wright   PetscFunctionBeginUser;
421*dae7673aSJames Wright   PetscLogStage stage_stats_process;
422*dae7673aSJames Wright   PetscCall(PetscLogStageGetId("Stats Process", &stage_stats_process));
423*dae7673aSJames Wright   if (stage_stats_process == -1) PetscCall(PetscLogStageRegister("Stats Process", &stage_stats_process));
424*dae7673aSJames Wright   PetscCall(PetscLogStagePush(stage_stats_process));
425*dae7673aSJames Wright 
426*dae7673aSJames Wright   PetscCall(VecZeroEntries(spanstats->Parent_Stats_loc));
427*dae7673aSJames Wright 
428*dae7673aSJames Wright   PetscCall(VecGetArrayRead(spanstats->Child_Stats_loc, &child_stats));
429*dae7673aSJames Wright   PetscCall(VecGetArray(spanstats->Parent_Stats_loc, &parent_stats));
430*dae7673aSJames Wright 
431*dae7673aSJames Wright   if (spanstats->num_comp_stats == 1) unit = MPIU_REAL;
432*dae7673aSJames Wright   else {
433*dae7673aSJames Wright     PetscCallMPI(MPI_Type_contiguous(spanstats->num_comp_stats, MPIU_REAL, &unit));
434*dae7673aSJames Wright     PetscCallMPI(MPI_Type_commit(&unit));
435*dae7673aSJames Wright   }
436*dae7673aSJames Wright 
437*dae7673aSJames Wright   PetscCall(PetscSFReduceBegin(spanstats->sf, unit, child_stats, parent_stats, MPI_SUM));
438*dae7673aSJames Wright   PetscCall(PetscSFReduceEnd(spanstats->sf, unit, child_stats, parent_stats, MPI_SUM));
439*dae7673aSJames Wright 
440*dae7673aSJames Wright   PetscCall(VecRestoreArrayRead(spanstats->Child_Stats_loc, &child_stats));
441*dae7673aSJames Wright   PetscCall(VecRestoreArray(spanstats->Parent_Stats_loc, &parent_stats));
442*dae7673aSJames Wright   PetscCallMPI(MPI_Type_free(&unit));
443*dae7673aSJames Wright 
444*dae7673aSJames Wright   PetscReal solution_time;
445*dae7673aSJames Wright   PetscCall(DMGetOutputSequenceNumber(spanstats->dm, NULL, &solution_time));
446*dae7673aSJames Wright   PetscReal summing_duration = solution_time - honee->app_ctx->cont_time;
447*dae7673aSJames Wright   PetscCall(VecScale(spanstats->Parent_Stats_loc, 1 / (summing_duration * spanstats->span_width)));
448*dae7673aSJames Wright 
449*dae7673aSJames Wright   // L^2 projection with the parent_data
450*dae7673aSJames Wright   PetscCall(DMGetGlobalVector(spanstats->dm, &RHS));
451*dae7673aSJames Wright   PetscCall(ApplyCeedOperatorLocalToGlobal(spanstats->Parent_Stats_loc, RHS, spanstats->op_proj_rhs_ctx));
452*dae7673aSJames Wright 
453*dae7673aSJames Wright   PetscCall(KSPSolve(spanstats->ksp, RHS, stats));
454*dae7673aSJames Wright 
455*dae7673aSJames Wright   PetscCall(DMRestoreGlobalVector(spanstats->dm, &RHS));
456*dae7673aSJames Wright   PetscCall(PetscLogStagePop());
457*dae7673aSJames Wright   PetscFunctionReturn(PETSC_SUCCESS);
458*dae7673aSJames Wright }
459