1ae2b091fSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors.
2ae2b091fSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause
362b7942eSJames Wright
462b7942eSJames Wright #include "../qfunctions/sgs_dd_model.h"
562b7942eSJames Wright
662b7942eSJames Wright #include <petscdmplex.h>
762b7942eSJames Wright
8149fb536SJames Wright #include <navierstokes.h>
94c07ec22SJames Wright #include <sgs_model_torch.h>
1062b7942eSJames Wright
1182baf964SJames Wright typedef PetscErrorCode (*SgsDDNodalStressEval)(Honee honee, Vec Q_loc, Vec VelocityGradient, Vec SGSNodal_loc);
1282baf964SJames Wright typedef PetscErrorCode (*SgsDDNodalStressInference)(Vec DD_Inputs_loc, Vec DD_Outputs_loc, void *ctx);
1382baf964SJames Wright typedef struct {
1482baf964SJames Wright DM dm_sgs, dm_dd_inputs, dm_dd_outputs;
1582baf964SJames Wright PetscInt num_comp_sgs, num_comp_inputs, num_comp_outputs;
1682baf964SJames Wright OperatorApplyContext op_nodal_evaluation_ctx, op_nodal_dd_inputs_ctx, op_nodal_dd_outputs_ctx, op_sgs_apply_ctx;
1782baf964SJames Wright CeedVector sgs_nodal_ceed, grad_velo_ceed;
1882baf964SJames Wright SgsDDNodalStressEval sgs_nodal_eval;
1982baf964SJames Wright SgsDDNodalStressInference sgs_nodal_inference;
2082baf964SJames Wright void *sgs_nodal_inference_ctx;
21*26d401f3SJames Wright PetscCtxDestroyFn *sgs_nodal_inference_ctx_destroy;
2282baf964SJames Wright } *SgsDDData;
2382baf964SJames Wright
2482baf964SJames Wright // @brief Destroy `SgsDDData` object
SgsDDDataDestroy(SgsDDData * sgs_dd_data)2582baf964SJames Wright static PetscErrorCode SgsDDDataDestroy(SgsDDData *sgs_dd_data) {
2682baf964SJames Wright SgsDDData sgs_dd_data_ = *sgs_dd_data;
2714bd2a07SJames Wright
2882baf964SJames Wright PetscFunctionBeginUser;
2982baf964SJames Wright if (!sgs_dd_data_) PetscFunctionReturn(PETSC_SUCCESS);
3082baf964SJames Wright Ceed ceed = sgs_dd_data_->op_sgs_apply_ctx->ceed;
3182baf964SJames Wright
3282baf964SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&sgs_dd_data_->sgs_nodal_ceed));
3382baf964SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&sgs_dd_data_->grad_velo_ceed));
3482baf964SJames Wright PetscCall(OperatorApplyContextDestroy(sgs_dd_data_->op_nodal_evaluation_ctx));
3582baf964SJames Wright PetscCall(OperatorApplyContextDestroy(sgs_dd_data_->op_sgs_apply_ctx));
3682baf964SJames Wright PetscCall(OperatorApplyContextDestroy(sgs_dd_data_->op_nodal_dd_inputs_ctx));
3782baf964SJames Wright PetscCall(OperatorApplyContextDestroy(sgs_dd_data_->op_nodal_dd_outputs_ctx));
3882baf964SJames Wright PetscCall(DMDestroy(&sgs_dd_data_->dm_sgs));
3982baf964SJames Wright PetscCall(DMDestroy(&sgs_dd_data_->dm_dd_inputs));
4082baf964SJames Wright PetscCall(DMDestroy(&sgs_dd_data_->dm_dd_outputs));
4182baf964SJames Wright if (sgs_dd_data_->sgs_nodal_inference_ctx) PetscCall(sgs_dd_data_->sgs_nodal_inference_ctx_destroy(sgs_dd_data_->sgs_nodal_inference_ctx));
4282baf964SJames Wright PetscCall(PetscFree(sgs_dd_data_));
4382baf964SJames Wright *sgs_dd_data = NULL;
4482baf964SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
4582baf964SJames Wright }
4682baf964SJames Wright
47c38c977aSJames Wright typedef struct {
48c38c977aSJames Wright CeedElemRestriction elem_restr_grid_aniso, elem_restr_sgs;
49c38c977aSJames Wright CeedVector grid_aniso_ceed;
5040816385SJames Wright CeedQFunctionContext sgsdd_qfctx, ifunction_qfctx;
514c07ec22SJames Wright SGSModelDDImplementation sgs_dd_model_implementation;
52ad494f68SJames Wright } *SgsDDSetupData;
53c38c977aSJames Wright
548340219bSJames Wright #define GRAD_VELO_PROJ_KEY "Gradient of Velocity Projection"
5582baf964SJames Wright #define SGS_DD_DATA_KEY "SGS Data Driven Data"
568340219bSJames Wright
SgsDDSetupDataDestroy(SgsDDSetupData sgs_dd_setup_data)57ad494f68SJames Wright PetscErrorCode SgsDDSetupDataDestroy(SgsDDSetupData sgs_dd_setup_data) {
58b4c37c5cSJames Wright Ceed ceed;
59ad494f68SJames Wright
60c38c977aSJames Wright PetscFunctionBeginUser;
61b4c37c5cSJames Wright PetscCall(CeedElemRestrictionGetCeed(sgs_dd_setup_data->elem_restr_sgs, &ceed));
62ad494f68SJames Wright
63b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&sgs_dd_setup_data->elem_restr_grid_aniso));
64b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&sgs_dd_setup_data->elem_restr_sgs));
65b4c37c5cSJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&sgs_dd_setup_data->grid_aniso_ceed));
66b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&sgs_dd_setup_data->sgsdd_qfctx));
6740816385SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&sgs_dd_setup_data->ifunction_qfctx));
68c38c977aSJames Wright PetscCall(PetscFree(sgs_dd_setup_data));
69519781aeSJames Wright PetscCheck(CeedDestroy(&ceed) == CEED_ERROR_SUCCESS, PETSC_COMM_SELF, PETSC_ERR_LIB, "Destroying Ceed object failed");
70d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
71c38c977aSJames Wright }
72c38c977aSJames Wright
73ee1455b7SJames Wright // @brief Create DM for storing subgrid stress at nodes
SgsDDCreateDM(DM dm_source,DM * dm_sgs,PetscInt degree,PetscInt q_extra,PetscInt * num_components)74ad494f68SJames Wright static PetscErrorCode SgsDDCreateDM(DM dm_source, DM *dm_sgs, PetscInt degree, PetscInt q_extra, PetscInt *num_components) {
75ee1455b7SJames Wright PetscSection section;
76ee1455b7SJames Wright
77ee1455b7SJames Wright PetscFunctionBeginUser;
78ee1455b7SJames Wright *num_components = 6;
79ee1455b7SJames Wright
80ee1455b7SJames Wright PetscCall(DMClone(dm_source, dm_sgs));
810dee9b8eSJames Wright PetscCall(DMSetMatrixPreallocateSkip(*dm_sgs, PETSC_TRUE));
82ee1455b7SJames Wright PetscCall(PetscObjectSetName((PetscObject)*dm_sgs, "Subgrid Stress Projection"));
83ee1455b7SJames Wright
84da4ca0cfSJames Wright PetscCall(DMSetupByOrder_FEM(PETSC_TRUE, PETSC_TRUE, degree, 1, q_extra, 1, num_components, *dm_sgs));
85ee1455b7SJames Wright
86ee1455b7SJames Wright PetscCall(DMGetLocalSection(*dm_sgs, §ion));
87ee1455b7SJames Wright PetscCall(PetscSectionSetFieldName(section, 0, ""));
88ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 0, "KMSubgridStressXX"));
89ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 1, "KMSubgridStressYY"));
90ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 2, "KMSubgridStressZZ"));
91ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 3, "KMSubgridStressYZ"));
92ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 4, "KMSubgridStressXZ"));
93ee1455b7SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, 5, "KMSubgridStressXY"));
94d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
95ee1455b7SJames Wright };
96ee1455b7SJames Wright
97ad494f68SJames Wright // @brief Evaluate data-driven SGS using fused method
SgsDDNodalStressEval_Fused(Honee honee,Vec Q_loc,Vec VelocityGradient,Vec SGSNodal_loc)980c373b74SJames Wright static PetscErrorCode SgsDDNodalStressEval_Fused(Honee honee, Vec Q_loc, Vec VelocityGradient, Vec SGSNodal_loc) {
9982baf964SJames Wright SgsDDData sgs_dd_data;
100cceb3143SJames Wright PetscMemType q_mem_type;
101cceb3143SJames Wright
102cceb3143SJames Wright PetscFunctionBeginUser;
1030c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
1040c373b74SJames Wright PetscCall(VecPetscToCeed(Q_loc, &q_mem_type, honee->q_ceed)); // q_ceed is an implicit input
105cceb3143SJames Wright
106cceb3143SJames Wright PetscCall(ApplyCeedOperatorGlobalToLocal(VelocityGradient, SGSNodal_loc, sgs_dd_data->op_nodal_evaluation_ctx));
107cceb3143SJames Wright
1080c373b74SJames Wright PetscCall(VecCeedToPetsc(honee->q_ceed, q_mem_type, Q_loc));
109cceb3143SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
110cceb3143SJames Wright }
111cceb3143SJames Wright
112b87d60b3SJames Wright // @brief Create CeedOperator to calculate data-drive SGS at nodes using fused operator
SgsDDSetupNodalEvaluation_Fused(Ceed ceed,Honee honee,SgsDDSetupData sgs_dd_setup_data)113e3663b90SJames Wright static PetscErrorCode SgsDDSetupNodalEvaluation_Fused(Ceed ceed, Honee honee, SgsDDSetupData sgs_dd_setup_data) {
11482baf964SJames Wright SgsDDData sgs_dd_data;
1155930f037SJames Wright CeedQFunction qf_sgs_dd_nodal;
1165930f037SJames Wright CeedOperator op_sgs_dd_nodal;
1174fe35dceSJames Wright CeedInt num_comp_q, num_comp_grad_velo, num_comp_grid_aniso;
1184fe35dceSJames Wright PetscInt num_comp_x;
1194fe35dceSJames Wright CeedVector inv_multiplicity, x_coord;
1204fe35dceSJames Wright CeedElemRestriction elem_restr_inv_multiplicity, elem_restr_grad_velo, elem_restr_sgs, elem_restr_q, elem_restr_x;
1214fe35dceSJames Wright CeedBasis basis_x;
122e3db12f8SJames Wright PetscInt height = 0, dm_field = 0;
1238340219bSJames Wright NodalProjectionData grad_velo_proj;
124ee1455b7SJames Wright
125ee1455b7SJames Wright PetscFunctionBeginUser;
126cf8f12c8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &elem_restr_q));
1274fe35dceSJames Wright PetscCall(DMGetCoordinateNumComps(honee->dm, &num_comp_x));
128cf8f12c8SJames Wright PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(elem_restr_q, &num_comp_q));
129b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(sgs_dd_setup_data->elem_restr_grid_aniso, &num_comp_grid_aniso));
1300c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
1310c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, GRAD_VELO_PROJ_KEY, &grad_velo_proj));
132ee1455b7SJames Wright
133ee1455b7SJames Wright { // Get velocity gradient information
134ee1455b7SJames Wright CeedOperatorField op_field;
1358340219bSJames Wright PetscCallCeed(ceed, CeedOperatorGetFieldByName(grad_velo_proj->l2_rhs_ctx->op, "velocity gradient", &op_field));
136b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorFieldGetElemRestriction(op_field, &elem_restr_grad_velo));
137b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(elem_restr_grad_velo, &num_comp_grad_velo));
138ee1455b7SJames Wright }
1394fe35dceSJames Wright PetscCall(DMPlexCeedCoordinateCreateField(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, &elem_restr_x, &basis_x, &x_coord));
140e3db12f8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field, &elem_restr_sgs));
141b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionCreateVector(elem_restr_sgs, &sgs_dd_data->sgs_nodal_ceed, NULL));
142ee1455b7SJames Wright
143e3db12f8SJames Wright PetscCall(GetInverseMultiplicity(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field, PETSC_FALSE,
144e3db12f8SJames Wright &elem_restr_inv_multiplicity, &inv_multiplicity));
145ee1455b7SJames Wright
146ee1455b7SJames Wright // -- Create operator for SGS DD model nodal evaluation
1470c373b74SJames Wright switch (honee->phys->state_var) {
148ee1455b7SJames Wright case STATEVAR_PRIMITIVE:
149ad494f68SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Prim, ComputeSgsDDNodal_Prim_loc, &qf_sgs_dd_nodal));
150ee1455b7SJames Wright break;
151ee1455b7SJames Wright case STATEVAR_CONSERVATIVE:
152ad494f68SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Conserv, ComputeSgsDDNodal_Conserv_loc, &qf_sgs_dd_nodal));
153ee1455b7SJames Wright break;
1549b103f75SJames Wright case STATEVAR_ENTROPY:
1559b103f75SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Entropy, ComputeSgsDDNodal_Entropy_loc, &qf_sgs_dd_nodal));
1569b103f75SJames Wright break;
157ee1455b7SJames Wright }
158ee1455b7SJames Wright
159ee1455b7SJames Wright // Mesh/geometry order and solution basis order may differ, therefore must interpolate
160cf8f12c8SJames Wright CeedBasis basis_x_to_q, basis_q;
161cf8f12c8SJames Wright PetscCall(DMPlexCeedBasisCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &basis_q));
1624fe35dceSJames Wright PetscCallCeed(ceed, CeedBasisCreateProjection(basis_x, basis_q, &basis_x_to_q));
163ee1455b7SJames Wright
164b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionSetContext(qf_sgs_dd_nodal, sgs_dd_setup_data->sgsdd_qfctx));
165b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_nodal, "q", num_comp_q, CEED_EVAL_NONE));
166b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_nodal, "x", num_comp_x, CEED_EVAL_INTERP));
167b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_nodal, "gradient velocity", num_comp_grad_velo, CEED_EVAL_NONE));
168b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_nodal, "anisotropy tensor", num_comp_grid_aniso, CEED_EVAL_NONE));
169b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_nodal, "inverse multiplicity", 1, CEED_EVAL_NONE));
170b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_dd_nodal, "km_sgs", sgs_dd_data->num_comp_sgs, CEED_EVAL_NONE));
171ee1455b7SJames Wright
172b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_sgs_dd_nodal, NULL, NULL, &op_sgs_dd_nodal));
173cf8f12c8SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "q", elem_restr_q, CEED_BASIS_NONE, honee->q_ceed));
1744fe35dceSJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "x", elem_restr_x, basis_x_to_q, x_coord));
17558e1cbfdSJeremy L Thompson PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "gradient velocity", elem_restr_grad_velo, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
17658e1cbfdSJeremy L Thompson PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "anisotropy tensor", sgs_dd_setup_data->elem_restr_grid_aniso, CEED_BASIS_NONE,
177b4c37c5cSJames Wright sgs_dd_setup_data->grid_aniso_ceed));
17858e1cbfdSJeremy L Thompson PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "inverse multiplicity", elem_restr_inv_multiplicity, CEED_BASIS_NONE, inv_multiplicity));
17958e1cbfdSJeremy L Thompson PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_nodal, "km_sgs", elem_restr_sgs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
180ee1455b7SJames Wright
1818340219bSJames Wright PetscCall(OperatorApplyContextCreate(grad_velo_proj->dm, sgs_dd_data->dm_sgs, ceed, op_sgs_dd_nodal, NULL, sgs_dd_data->sgs_nodal_ceed, NULL, NULL,
1828340219bSJames Wright &sgs_dd_data->op_nodal_evaluation_ctx));
183ee1455b7SJames Wright
184ee1455b7SJames Wright sgs_dd_setup_data->elem_restr_sgs = elem_restr_sgs;
185ad494f68SJames Wright sgs_dd_data->sgs_nodal_eval = SgsDDNodalStressEval_Fused;
186ee1455b7SJames Wright
187b4c37c5cSJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&inv_multiplicity));
1884fe35dceSJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&x_coord));
189b4c37c5cSJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_x_to_q));
190cf8f12c8SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_q));
1914fe35dceSJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_x));
192cf8f12c8SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_q));
1934fe35dceSJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_x));
194b4c37c5cSJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_inv_multiplicity));
195fff85bd3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_grad_velo));
196b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_sgs_dd_nodal));
197b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&op_sgs_dd_nodal));
198d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
199ee1455b7SJames Wright }
200ee1455b7SJames Wright
2014c07ec22SJames Wright // @brief Setup data-driven model inference using libCEED native implementation
SgsDDSetupNodalEvaluation_Sequential_Ceed(Ceed ceed,SgsDDData sgs_dd_data,SgsDDSetupData sgs_dd_setup_data,CeedElemRestriction elem_restr_dd_inputs,CeedElemRestriction elem_restr_dd_outputs,CeedElemRestriction elem_restr_inv_multiplicity,CeedVector inv_multiplicity,void ** ctx)2024c07ec22SJames Wright static PetscErrorCode SgsDDSetupNodalEvaluation_Sequential_Ceed(Ceed ceed, SgsDDData sgs_dd_data, SgsDDSetupData sgs_dd_setup_data,
2034c07ec22SJames Wright CeedElemRestriction elem_restr_dd_inputs, CeedElemRestriction elem_restr_dd_outputs,
204b87d60b3SJames Wright CeedElemRestriction elem_restr_inv_multiplicity, CeedVector inv_multiplicity,
205b87d60b3SJames Wright void **ctx) {
206b87d60b3SJames Wright CeedQFunction qf_sgs_dd_inference;
207b87d60b3SJames Wright CeedOperator op_sgs_dd_inference;
208b87d60b3SJames Wright OperatorApplyContext *op_context = (OperatorApplyContext *)ctx;
209b87d60b3SJames Wright
210b87d60b3SJames Wright PetscFunctionBeginUser;
211b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Sequential_Inference, ComputeSgsDDNodal_Sequential_Inference_loc,
212b87d60b3SJames Wright &qf_sgs_dd_inference));
213b87d60b3SJames Wright
214b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionSetContext(qf_sgs_dd_inference, sgs_dd_setup_data->sgsdd_qfctx));
215b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inference, "model inputs", sgs_dd_data->num_comp_inputs, CEED_EVAL_NONE));
216b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inference, "inverse multiplicity", 1, CEED_EVAL_NONE));
217b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_dd_inference, "model outputs", sgs_dd_data->num_comp_outputs, CEED_EVAL_NONE));
218b87d60b3SJames Wright
219b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_sgs_dd_inference, NULL, NULL, &op_sgs_dd_inference));
220b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inference, "model inputs", elem_restr_dd_inputs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
221b87d60b3SJames Wright PetscCallCeed(ceed,
222b87d60b3SJames Wright CeedOperatorSetField(op_sgs_dd_inference, "inverse multiplicity", elem_restr_inv_multiplicity, CEED_BASIS_NONE, inv_multiplicity));
223b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inference, "model outputs", elem_restr_dd_outputs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
224b87d60b3SJames Wright
225b87d60b3SJames Wright PetscCall(OperatorApplyContextCreate(sgs_dd_data->dm_dd_inputs, sgs_dd_data->dm_dd_outputs, ceed, op_sgs_dd_inference, NULL, NULL, NULL, NULL,
226b87d60b3SJames Wright op_context));
227*26d401f3SJames Wright sgs_dd_data->sgs_nodal_inference_ctx_destroy = (PetscCtxDestroyFn *)OperatorApplyContextDestroy;
228b87d60b3SJames Wright
229b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&op_sgs_dd_inference));
230b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_sgs_dd_inference));
231b87d60b3SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
232b87d60b3SJames Wright }
233b87d60b3SJames Wright
2344c07ec22SJames Wright // @brief Perform data-driven model inference using libCEED native implementation
SgsDDNodalStressEval_Sequential_Ceed(Vec DD_Inputs_loc,Vec DD_Outputs_loc,void * ctx)2354c07ec22SJames Wright PetscErrorCode SgsDDNodalStressEval_Sequential_Ceed(Vec DD_Inputs_loc, Vec DD_Outputs_loc, void *ctx) {
236b87d60b3SJames Wright OperatorApplyContext op_context = *(OperatorApplyContext *)ctx;
237b87d60b3SJames Wright
238b87d60b3SJames Wright PetscFunctionBeginUser;
239ea615d4cSJames Wright PetscCall(PetscLogEventBegin(HONEE_SgsModelDDData, DD_Inputs_loc, DD_Outputs_loc, NULL, NULL));
240ea615d4cSJames Wright PetscCall(PetscLogEventBegin(HONEE_SgsModelDDInference, DD_Inputs_loc, DD_Outputs_loc, NULL, NULL));
241b40a7e63SJames Wright PetscCall(PetscLogGpuTimeBegin());
242b87d60b3SJames Wright PetscCall(ApplyCeedOperatorLocalToLocal(DD_Inputs_loc, DD_Outputs_loc, op_context));
243b40a7e63SJames Wright PetscCall(PetscLogGpuTimeEnd());
244ea615d4cSJames Wright PetscCall(PetscLogEventEnd(HONEE_SgsModelDDInference, DD_Inputs_loc, DD_Outputs_loc, NULL, NULL));
245ea615d4cSJames Wright PetscCall(PetscLogEventEnd(HONEE_SgsModelDDData, DD_Inputs_loc, DD_Outputs_loc, NULL, NULL));
246b87d60b3SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
247b87d60b3SJames Wright }
248b87d60b3SJames Wright
2494c07ec22SJames Wright // @brief Setup data-driven model inference using libtorch
SgsDDSetupNodalEvaluation_Sequential_Torch(Ceed ceed,SgsDDData sgs_dd_data,SgsDDSetupData sgs_dd_setup_data,CeedElemRestriction elem_restr_dd_inputs,CeedElemRestriction elem_restr_dd_outputs,CeedElemRestriction elem_restr_inv_multiplicity,CeedVector inv_multiplicity,void ** ctx)2504c07ec22SJames Wright static PetscErrorCode SgsDDSetupNodalEvaluation_Sequential_Torch(Ceed ceed, SgsDDData sgs_dd_data, SgsDDSetupData sgs_dd_setup_data,
2514c07ec22SJames Wright CeedElemRestriction elem_restr_dd_inputs, CeedElemRestriction elem_restr_dd_outputs,
2524c07ec22SJames Wright CeedElemRestriction elem_restr_inv_multiplicity, CeedVector inv_multiplicity,
2534c07ec22SJames Wright void **ctx) {
2544c07ec22SJames Wright const char *ceed_resource;
2554c07ec22SJames Wright char model_path[PETSC_MAX_PATH_LEN] = "";
2564c07ec22SJames Wright TorchDeviceType model_device_type;
2574c07ec22SJames Wright
2584c07ec22SJames Wright PetscFunctionBeginUser;
2594c07ec22SJames Wright PetscCallCeed(ceed, CeedGetResource(ceed, &ceed_resource));
2604c07ec22SJames Wright if (strstr(ceed_resource, "/gpu/cuda")) model_device_type = TORCH_DEVICE_CUDA;
2614c07ec22SJames Wright else if (strstr(ceed_resource, "/gpu/hip")) model_device_type = TORCH_DEVICE_HIP;
2627ffa0ff8SJames Wright // On-device XPU is not working reliably currently, default to CPU inference evaluation
2637ffa0ff8SJames Wright // else if (strstr(ceed_resource, "/gpu/sycl")) model_device_type = TORCH_DEVICE_XPU;
2644c07ec22SJames Wright else model_device_type = TORCH_DEVICE_CPU;
2654c07ec22SJames Wright PetscCall(PetscOptionsGetEnum(NULL, NULL, "-sgs_model_dd_torch_model_device", TorchDeviceTypes, (PetscEnum *)&model_device_type, NULL));
2664c07ec22SJames Wright PetscCall(PetscOptionsGetString(NULL, NULL, "-sgs_model_dd_torch_model_path", model_path, sizeof(model_path), NULL));
2674c07ec22SJames Wright
2684c07ec22SJames Wright PetscCall(LoadModel_Torch(model_path, model_device_type));
2694c07ec22SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
2704c07ec22SJames Wright }
2714c07ec22SJames Wright
2724c07ec22SJames Wright // @brief Perform data-driven model inference using libtorch
SgsDDNodalStressEval_Sequential_Torch(Vec DD_Inputs_loc,Vec DD_Outputs_loc,void * ctx)2734c07ec22SJames Wright static PetscErrorCode SgsDDNodalStressEval_Sequential_Torch(Vec DD_Inputs_loc, Vec DD_Outputs_loc, void *ctx) {
2744c07ec22SJames Wright static PetscBool run_through = PETSC_FALSE;
27514bd2a07SJames Wright
2764c07ec22SJames Wright PetscFunctionBeginUser;
2774c07ec22SJames Wright if (!run_through) {
2784c07ec22SJames Wright PetscCall(VecViewFromOptions(DD_Inputs_loc, NULL, "-dd_inputs_loc_view"));
2794c07ec22SJames Wright }
2804c07ec22SJames Wright PetscCall(ModelInference_Torch(DD_Inputs_loc, DD_Outputs_loc));
2814c07ec22SJames Wright if (!run_through) {
2824c07ec22SJames Wright PetscCall(VecViewFromOptions(DD_Outputs_loc, NULL, "-dd_outputs_loc_view"));
2834c07ec22SJames Wright run_through = PETSC_TRUE;
2844c07ec22SJames Wright }
2854c07ec22SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
2864c07ec22SJames Wright }
2874c07ec22SJames Wright
288b87d60b3SJames Wright // @brief Evaluate data-driven SGS using sequential method
SgsDDNodalStressEval_Sequential(Honee honee,Vec Q_loc,Vec VelocityGradient,Vec SGSNodal_loc)2890c373b74SJames Wright PetscErrorCode SgsDDNodalStressEval_Sequential(Honee honee, Vec Q_loc, Vec VelocityGradient, Vec SGSNodal_loc) {
29082baf964SJames Wright SgsDDData sgs_dd_data;
291b87d60b3SJames Wright PetscMemType q_mem_type;
292b87d60b3SJames Wright Vec DD_Inputs_loc, DD_Outputs_loc;
293b87d60b3SJames Wright
294b87d60b3SJames Wright PetscFunctionBeginUser;
2950c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
296b87d60b3SJames Wright PetscCall(DMGetLocalVector(sgs_dd_data->dm_dd_inputs, &DD_Inputs_loc));
297b87d60b3SJames Wright PetscCall(DMGetLocalVector(sgs_dd_data->dm_dd_outputs, &DD_Outputs_loc));
2980c373b74SJames Wright PetscCall(VecPetscToCeed(Q_loc, &q_mem_type, honee->q_ceed)); // q_ceed is an implicit input
299b87d60b3SJames Wright
300b87d60b3SJames Wright PetscCall(ApplyCeedOperatorGlobalToLocal(VelocityGradient, DD_Inputs_loc, sgs_dd_data->op_nodal_dd_inputs_ctx));
301b87d60b3SJames Wright PetscCall(sgs_dd_data->sgs_nodal_inference(DD_Inputs_loc, DD_Outputs_loc, &sgs_dd_data->sgs_nodal_inference_ctx));
302b87d60b3SJames Wright PetscCall(ApplyCeedOperatorLocalToLocal(DD_Outputs_loc, SGSNodal_loc, sgs_dd_data->op_nodal_dd_outputs_ctx));
303b87d60b3SJames Wright
3040c373b74SJames Wright PetscCall(VecCeedToPetsc(honee->q_ceed, q_mem_type, Q_loc));
305b87d60b3SJames Wright PetscCall(DMRestoreLocalVector(sgs_dd_data->dm_dd_inputs, &DD_Inputs_loc));
306b87d60b3SJames Wright PetscCall(DMRestoreLocalVector(sgs_dd_data->dm_dd_outputs, &DD_Outputs_loc));
307b87d60b3SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
308b87d60b3SJames Wright }
309b87d60b3SJames Wright
// @brief Create CeedOperator to calculate data-driven SGS at nodes using sequentially-applied operators
SgsDDSetupNodalEvaluation_Sequential(Ceed ceed,Honee honee,SgsDDSetupData sgs_dd_setup_data)311e3663b90SJames Wright static PetscErrorCode SgsDDSetupNodalEvaluation_Sequential(Ceed ceed, Honee honee, SgsDDSetupData sgs_dd_setup_data) {
31282baf964SJames Wright SgsDDData sgs_dd_data;
3134fe35dceSJames Wright CeedInt num_comp_grad_velo, num_comp_grid_aniso, num_comp_eigvec = 9 + 1;
3144fe35dceSJames Wright PetscInt num_comp_x, num_comp_q;
315b87d60b3SJames Wright CeedVector inv_multiplicity, eigvec;
3168340219bSJames Wright NodalProjectionData grad_velo_proj;
317b87d60b3SJames Wright CeedElemRestriction elem_restr_inv_multiplicity, elem_restr_grad_velo, elem_restr_sgs, elem_restr_eigvec, elem_restr_dd_inputs,
318cf8f12c8SJames Wright elem_restr_dd_outputs, elem_restr_q;
319e3db12f8SJames Wright PetscInt height = 0, dm_field = 0;
320b87d60b3SJames Wright
321b87d60b3SJames Wright PetscFunctionBeginUser;
3220c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
323b87d60b3SJames Wright { // Create DMs for data-driven input and output values
324b87d60b3SJames Wright PetscSection section;
325b87d60b3SJames Wright PetscInt degree, q_extra;
326b87d60b3SJames Wright { // Get degree and number of quadrature points from dm_sgs
327b87d60b3SJames Wright PetscFE fe;
328b87d60b3SJames Wright PetscSpace basis;
329b87d60b3SJames Wright PetscQuadrature quadrature;
330b87d60b3SJames Wright PetscInt num_qpnts;
331b87d60b3SJames Wright PetscCall(DMGetField(sgs_dd_data->dm_sgs, 0, NULL, (PetscObject *)&fe));
332b87d60b3SJames Wright PetscCall(PetscFEGetBasisSpace(fe, &basis));
333b87d60b3SJames Wright PetscCall(PetscSpaceGetDegree(basis, °ree, NULL));
334b87d60b3SJames Wright PetscCall(PetscFEGetQuadrature(fe, &quadrature));
335b87d60b3SJames Wright PetscCall(PetscQuadratureGetOrder(quadrature, &num_qpnts));
336b87d60b3SJames Wright q_extra = degree - num_qpnts;
337b87d60b3SJames Wright }
338b87d60b3SJames Wright
339b87d60b3SJames Wright PetscCall(DMClone(sgs_dd_data->dm_sgs, &sgs_dd_data->dm_dd_inputs));
3400dee9b8eSJames Wright PetscCall(DMSetMatrixPreallocateSkip(sgs_dd_data->dm_dd_inputs, PETSC_TRUE));
341b87d60b3SJames Wright PetscCall(PetscObjectSetName((PetscObject)sgs_dd_data->dm_dd_inputs, "Data-Driven Model Inputs"));
342b87d60b3SJames Wright PetscCall(DMSetupByOrder_FEM(PETSC_TRUE, PETSC_TRUE, degree, 1, q_extra, 1, &sgs_dd_data->num_comp_inputs, sgs_dd_data->dm_dd_inputs));
343b87d60b3SJames Wright PetscCall(DMGetLocalSection(sgs_dd_data->dm_dd_inputs, §ion));
344b87d60b3SJames Wright PetscCall(PetscSectionSetFieldName(section, 0, ""));
345b87d60b3SJames Wright for (CeedInt i = 0; i < sgs_dd_data->num_comp_inputs; i++) {
346b87d60b3SJames Wright char component_name[PETSC_MAX_PATH_LEN];
347b87d60b3SJames Wright
348b87d60b3SJames Wright PetscCall(PetscSNPrintf(component_name, sizeof component_name, "DataDrivenInput%" CeedInt_FMT, i + 1));
349b87d60b3SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, i, component_name));
350b87d60b3SJames Wright }
351b87d60b3SJames Wright
352b87d60b3SJames Wright PetscCall(DMClone(sgs_dd_data->dm_sgs, &sgs_dd_data->dm_dd_outputs));
3530dee9b8eSJames Wright PetscCall(DMSetMatrixPreallocateSkip(sgs_dd_data->dm_dd_outputs, PETSC_TRUE));
354b87d60b3SJames Wright PetscCall(PetscObjectSetName((PetscObject)sgs_dd_data->dm_dd_outputs, "Data-Driven Model Outputs"));
355b87d60b3SJames Wright PetscCall(DMSetupByOrder_FEM(PETSC_TRUE, PETSC_TRUE, degree, 1, q_extra, 1, &sgs_dd_data->num_comp_outputs, sgs_dd_data->dm_dd_outputs));
356b87d60b3SJames Wright PetscCall(DMGetLocalSection(sgs_dd_data->dm_dd_outputs, §ion));
357b87d60b3SJames Wright PetscCall(PetscSectionSetFieldName(section, 0, ""));
358b87d60b3SJames Wright for (CeedInt i = 0; i < sgs_dd_data->num_comp_outputs; i++) {
359b87d60b3SJames Wright char component_name[PETSC_MAX_PATH_LEN];
360b87d60b3SJames Wright
361b87d60b3SJames Wright PetscCall(PetscSNPrintf(component_name, sizeof component_name, "DataDrivenOutput%" CeedInt_FMT, i + 1));
362b87d60b3SJames Wright PetscCall(PetscSectionSetComponentName(section, 0, i, component_name));
363b87d60b3SJames Wright }
364b87d60b3SJames Wright }
365b87d60b3SJames Wright
3664fe35dceSJames Wright PetscCall(DMGetCoordinateNumComps(honee->dm, &num_comp_x));
3674fe35dceSJames Wright PetscCall(DMGetFieldNumComps(honee->dm, 0, &num_comp_q));
368b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(sgs_dd_setup_data->elem_restr_grid_aniso, &num_comp_grid_aniso));
3690c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, GRAD_VELO_PROJ_KEY, &grad_velo_proj));
370b87d60b3SJames Wright
371b87d60b3SJames Wright { // Get velocity gradient information
372b87d60b3SJames Wright CeedOperatorField op_field;
3738340219bSJames Wright PetscCallCeed(ceed, CeedOperatorGetFieldByName(grad_velo_proj->l2_rhs_ctx->op, "velocity gradient", &op_field));
374b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorFieldGetElemRestriction(op_field, &elem_restr_grad_velo));
375b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionGetNumComponents(elem_restr_grad_velo, &num_comp_grad_velo));
376b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionCreateVector(elem_restr_grad_velo, &sgs_dd_data->grad_velo_ceed, NULL));
377b87d60b3SJames Wright }
3784fe35dceSJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &elem_restr_q));
379e3db12f8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field, &elem_restr_sgs));
380b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionCreateVector(elem_restr_sgs, &sgs_dd_data->sgs_nodal_ceed, NULL));
381e3db12f8SJames Wright PetscCall(DMPlexCeedElemRestrictionCollocatedCreate(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, num_comp_eigvec,
3829eadbee4SJames Wright &elem_restr_eigvec));
383b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionCreateVector(elem_restr_eigvec, &eigvec, NULL));
384b87d60b3SJames Wright
385e3db12f8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, sgs_dd_data->dm_dd_inputs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field,
386e3db12f8SJames Wright &elem_restr_dd_inputs));
387e3db12f8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, sgs_dd_data->dm_dd_outputs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field,
388e3db12f8SJames Wright &elem_restr_dd_outputs));
389b87d60b3SJames Wright
390e3db12f8SJames Wright PetscCall(GetInverseMultiplicity(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field, PETSC_FALSE,
391e3db12f8SJames Wright &elem_restr_inv_multiplicity, &inv_multiplicity));
392b87d60b3SJames Wright
393b87d60b3SJames Wright { // Create operator for data-driven input evaluation
394b87d60b3SJames Wright CeedQFunction qf_sgs_dd_inputs;
395b87d60b3SJames Wright CeedOperator op_sgs_dd_inputs;
396b87d60b3SJames Wright
3970c373b74SJames Wright switch (honee->phys->state_var) {
398b87d60b3SJames Wright case STATEVAR_PRIMITIVE:
399b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Sequential_Inputs_Prim,
400b87d60b3SJames Wright ComputeSgsDDNodal_Sequential_Inputs_Prim_loc, &qf_sgs_dd_inputs));
401b87d60b3SJames Wright break;
402b87d60b3SJames Wright case STATEVAR_CONSERVATIVE:
403b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Sequential_Inputs_Conserv,
404b87d60b3SJames Wright ComputeSgsDDNodal_Sequential_Inputs_Conserv_loc, &qf_sgs_dd_inputs));
405b87d60b3SJames Wright break;
4069b103f75SJames Wright case STATEVAR_ENTROPY:
4079b103f75SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Sequential_Inputs_Entropy,
4089b103f75SJames Wright ComputeSgsDDNodal_Sequential_Inputs_Entropy_loc, &qf_sgs_dd_inputs));
4099b103f75SJames Wright break;
410b87d60b3SJames Wright }
411b87d60b3SJames Wright
412b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionSetContext(qf_sgs_dd_inputs, sgs_dd_setup_data->sgsdd_qfctx));
413b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inputs, "q", num_comp_q, CEED_EVAL_NONE));
414b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inputs, "gradient velocity", num_comp_grad_velo, CEED_EVAL_NONE));
415b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inputs, "anisotropy tensor", num_comp_grid_aniso, CEED_EVAL_NONE));
416b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_inputs, "inverse multiplicity", 1, CEED_EVAL_NONE));
417b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_dd_inputs, "eigenvectors", num_comp_eigvec, CEED_EVAL_NONE));
418b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_dd_inputs, "model inputs", sgs_dd_data->num_comp_inputs, CEED_EVAL_NONE));
419b87d60b3SJames Wright
420b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_sgs_dd_inputs, NULL, NULL, &op_sgs_dd_inputs));
421cf8f12c8SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inputs, "q", elem_restr_q, CEED_BASIS_NONE, honee->q_ceed));
422b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inputs, "gradient velocity", elem_restr_grad_velo, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
423b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inputs, "anisotropy tensor", sgs_dd_setup_data->elem_restr_grid_aniso, CEED_BASIS_NONE,
424b87d60b3SJames Wright sgs_dd_setup_data->grid_aniso_ceed));
425b87d60b3SJames Wright PetscCallCeed(ceed,
426b87d60b3SJames Wright CeedOperatorSetField(op_sgs_dd_inputs, "inverse multiplicity", elem_restr_inv_multiplicity, CEED_BASIS_NONE, inv_multiplicity));
427b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inputs, "eigenvectors", elem_restr_eigvec, CEED_BASIS_NONE, eigvec));
428b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_inputs, "model inputs", elem_restr_dd_inputs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
429b87d60b3SJames Wright
4308340219bSJames Wright PetscCall(OperatorApplyContextCreate(grad_velo_proj->dm, sgs_dd_data->dm_dd_inputs, ceed, op_sgs_dd_inputs, NULL, NULL, NULL, NULL,
431b87d60b3SJames Wright &sgs_dd_data->op_nodal_dd_inputs_ctx));
432b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&op_sgs_dd_inputs));
433b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_sgs_dd_inputs));
434b87d60b3SJames Wright }
435b87d60b3SJames Wright
436b87d60b3SJames Wright { // Create operator for data-driven output handling
437b87d60b3SJames Wright CeedQFunction qf_sgs_dd_outputs;
438b87d60b3SJames Wright CeedOperator op_sgs_dd_outputs;
439b87d60b3SJames Wright
440b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, ComputeSgsDDNodal_Sequential_Outputs, ComputeSgsDDNodal_Sequential_Outputs_loc,
441b87d60b3SJames Wright &qf_sgs_dd_outputs));
442b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionSetContext(qf_sgs_dd_outputs, sgs_dd_setup_data->sgsdd_qfctx));
443b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_outputs, "model outputs", sgs_dd_data->num_comp_outputs, CEED_EVAL_NONE));
444b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_outputs, "anisotropy tensor", num_comp_grid_aniso, CEED_EVAL_NONE));
445b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_outputs, "inverse multiplicity", 1, CEED_EVAL_NONE));
446b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_dd_outputs, "eigenvectors", num_comp_eigvec, CEED_EVAL_NONE));
447b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_dd_outputs, "km_sgs", sgs_dd_data->num_comp_sgs, CEED_EVAL_NONE));
448b87d60b3SJames Wright
449b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_sgs_dd_outputs, NULL, NULL, &op_sgs_dd_outputs));
450b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_outputs, "model outputs", elem_restr_dd_outputs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
451b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_outputs, "anisotropy tensor", sgs_dd_setup_data->elem_restr_grid_aniso, CEED_BASIS_NONE,
452b87d60b3SJames Wright sgs_dd_setup_data->grid_aniso_ceed));
453b87d60b3SJames Wright PetscCallCeed(ceed,
454b87d60b3SJames Wright CeedOperatorSetField(op_sgs_dd_outputs, "inverse multiplicity", elem_restr_inv_multiplicity, CEED_BASIS_NONE, inv_multiplicity));
455b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_outputs, "eigenvectors", elem_restr_eigvec, CEED_BASIS_NONE, eigvec));
456b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_dd_outputs, "km_sgs", elem_restr_sgs, CEED_BASIS_NONE, CEED_VECTOR_ACTIVE));
457b87d60b3SJames Wright
458b87d60b3SJames Wright PetscCall(OperatorApplyContextCreate(sgs_dd_data->dm_dd_outputs, sgs_dd_data->dm_sgs, ceed, op_sgs_dd_outputs, NULL, sgs_dd_data->sgs_nodal_ceed,
459b87d60b3SJames Wright NULL, NULL, &sgs_dd_data->op_nodal_dd_outputs_ctx));
460b87d60b3SJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&op_sgs_dd_outputs));
461b87d60b3SJames Wright PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_sgs_dd_outputs));
462b87d60b3SJames Wright }
463b87d60b3SJames Wright
464b87d60b3SJames Wright sgs_dd_data->sgs_nodal_eval = SgsDDNodalStressEval_Sequential;
4654c07ec22SJames Wright
4664c07ec22SJames Wright if (sgs_dd_setup_data->sgs_dd_model_implementation == SGS_MODEL_DD_SEQENTIAL_CEED) {
4674c07ec22SJames Wright sgs_dd_data->sgs_nodal_inference = SgsDDNodalStressEval_Sequential_Ceed;
4684c07ec22SJames Wright PetscCall(SgsDDSetupNodalEvaluation_Sequential_Ceed(ceed, sgs_dd_data, sgs_dd_setup_data, elem_restr_dd_inputs, elem_restr_dd_outputs,
469b87d60b3SJames Wright elem_restr_inv_multiplicity, inv_multiplicity, &sgs_dd_data->sgs_nodal_inference_ctx));
4704c07ec22SJames Wright } else if (sgs_dd_setup_data->sgs_dd_model_implementation == SGS_MODEL_DD_SEQENTIAL_TORCH) {
4714c07ec22SJames Wright sgs_dd_data->sgs_nodal_inference = SgsDDNodalStressEval_Sequential_Torch;
4724c07ec22SJames Wright PetscCall(SgsDDSetupNodalEvaluation_Sequential_Torch(ceed, sgs_dd_data, sgs_dd_setup_data, elem_restr_dd_inputs, elem_restr_dd_outputs,
4734c07ec22SJames Wright elem_restr_inv_multiplicity, inv_multiplicity, &sgs_dd_data->sgs_nodal_inference_ctx));
4744c07ec22SJames Wright }
475b87d60b3SJames Wright
476b87d60b3SJames Wright sgs_dd_setup_data->elem_restr_sgs = elem_restr_sgs;
477b87d60b3SJames Wright
478b87d60b3SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&inv_multiplicity));
479b87d60b3SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&eigvec));
480b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_inv_multiplicity));
481b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_eigvec));
482b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_dd_inputs));
483b87d60b3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_dd_outputs));
484fff85bd3SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_grad_velo));
485cf8f12c8SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_q));
486b87d60b3SJames Wright PetscFunctionReturn(PETSC_SUCCESS);
487b87d60b3SJames Wright }
488b87d60b3SJames Wright
4899c678832SJames Wright // @brief Create CeedOperator to compute SGS contribution to the residual
SgsSetupNodalIFunction(Ceed ceed,Honee honee,SgsDDSetupData sgs_dd_setup_data)490e3663b90SJames Wright static PetscErrorCode SgsSetupNodalIFunction(Ceed ceed, Honee honee, SgsDDSetupData sgs_dd_setup_data) {
49182baf964SJames Wright SgsDDData sgs_dd_data;
492cf8f12c8SJames Wright CeedInt q_data_size;
493cf8f12c8SJames Wright PetscInt dim, num_comp_q, num_comp_x;
4949c678832SJames Wright CeedQFunction qf_sgs_apply;
4959c678832SJames Wright CeedOperator op_sgs_apply;
496cf8f12c8SJames Wright CeedBasis basis_sgs, basis_q;
497be29160dSJames Wright CeedVector q_data;
498cf8f12c8SJames Wright CeedElemRestriction elem_restr_qd, elem_restr_q;
4999c678832SJames Wright
5009c678832SJames Wright PetscFunctionBeginUser;
5010c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
5020c373b74SJames Wright PetscCall(DMGetDimension(honee->dm, &dim));
503cf8f12c8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &elem_restr_q));
504cf8f12c8SJames Wright PetscCall(DMGetFieldNumComps(honee->dm, 0, &num_comp_q));
505cf8f12c8SJames Wright PetscCall(DMGetCoordinateNumComps(honee->dm, &num_comp_x));
5069c678832SJames Wright
507be29160dSJames Wright {
508e3db12f8SJames Wright PetscInt height = 0, dm_field = 0;
509be29160dSJames Wright
510cf8f12c8SJames Wright PetscCall(DMPlexCeedBasisCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &basis_q));
511e3db12f8SJames Wright PetscCall(DMPlexCeedBasisCreate(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, height, dm_field, &basis_sgs));
5129018c49aSJames Wright PetscCall(QDataGet(ceed, sgs_dd_data->dm_sgs, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, &elem_restr_qd, &q_data, &q_data_size));
513be29160dSJames Wright }
5149c678832SJames Wright
5150c373b74SJames Wright switch (honee->phys->state_var) {
5169c678832SJames Wright case STATEVAR_PRIMITIVE:
51742454adaSJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, IFunction_NodalSgs_Prim, IFunction_NodalSgs_Prim_loc, &qf_sgs_apply));
5189c678832SJames Wright break;
5199c678832SJames Wright case STATEVAR_CONSERVATIVE:
52042454adaSJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, IFunction_NodalSgs_Conserv, IFunction_NodalSgs_Conserv_loc, &qf_sgs_apply));
5219c678832SJames Wright break;
5229b103f75SJames Wright case STATEVAR_ENTROPY:
5239b103f75SJames Wright PetscCallCeed(ceed, CeedQFunctionCreateInterior(ceed, 1, IFunction_NodalSgs_Entropy, IFunction_NodalSgs_Entropy_loc, &qf_sgs_apply));
5249b103f75SJames Wright break;
5259c678832SJames Wright }
5269c678832SJames Wright
52740816385SJames Wright PetscCallCeed(ceed, CeedQFunctionSetContext(qf_sgs_apply, sgs_dd_setup_data->ifunction_qfctx));
528b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_apply, "q", num_comp_q, CEED_EVAL_INTERP));
529be29160dSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_apply, "qdata", q_data_size, CEED_EVAL_NONE));
530b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddInput(qf_sgs_apply, "km_sgs", sgs_dd_data->num_comp_sgs, CEED_EVAL_INTERP));
531b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionAddOutput(qf_sgs_apply, "Grad_v", num_comp_q * dim, CEED_EVAL_GRAD));
5329c678832SJames Wright
533b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorCreate(ceed, qf_sgs_apply, NULL, NULL, &op_sgs_apply));
534cf8f12c8SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_apply, "q", elem_restr_q, basis_q, CEED_VECTOR_ACTIVE));
535be29160dSJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_apply, "qdata", elem_restr_qd, CEED_BASIS_NONE, q_data));
536b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_apply, "km_sgs", sgs_dd_setup_data->elem_restr_sgs, basis_sgs, sgs_dd_data->sgs_nodal_ceed));
537cf8f12c8SJames Wright PetscCallCeed(ceed, CeedOperatorSetField(op_sgs_apply, "Grad_v", elem_restr_q, basis_q, CEED_VECTOR_ACTIVE));
5389c678832SJames Wright
5399eadbee4SJames Wright PetscCall(OperatorApplyContextCreate(honee->dm, honee->dm, ceed, op_sgs_apply, honee->q_ceed, honee->g_ceed, NULL, NULL,
5409eadbee4SJames Wright &sgs_dd_data->op_sgs_apply_ctx));
5419c678832SJames Wright
542be29160dSJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&q_data));
543be29160dSJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_qd));
54487edb941SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_sgs));
545b4c37c5cSJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&op_sgs_apply));
546b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionDestroy(&qf_sgs_apply));
547cf8f12c8SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_q));
548cf8f12c8SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_q));
549d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
5509c678832SJames Wright }
5519c678832SJames Wright
5529c678832SJames Wright // @brief Calculate and add data-driven SGS residual to the global residual
SgsDDApplyIFunction(Honee honee,const Vec Q_loc,Vec G_loc)5530c373b74SJames Wright PetscErrorCode SgsDDApplyIFunction(Honee honee, const Vec Q_loc, Vec G_loc) {
55482baf964SJames Wright SgsDDData sgs_dd_data;
5559c678832SJames Wright Vec VelocityGradient, SGSNodal_loc;
556cceb3143SJames Wright PetscMemType sgs_nodal_mem_type;
5578340219bSJames Wright NodalProjectionData grad_velo_proj;
5589c678832SJames Wright
5599c678832SJames Wright PetscFunctionBeginUser;
560ea615d4cSJames Wright PetscCall(PetscLogEventBegin(HONEE_SgsModel, Q_loc, G_loc, NULL, NULL));
5610c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, SGS_DD_DATA_KEY, &sgs_dd_data));
5620c70a8bcSJames Wright PetscCall(HoneeGetContainer(honee, GRAD_VELO_PROJ_KEY, &grad_velo_proj));
5638340219bSJames Wright PetscCall(DMGetGlobalVector(grad_velo_proj->dm, &VelocityGradient));
5648340219bSJames Wright PetscCall(VelocityGradientProjectionApply(grad_velo_proj, Q_loc, VelocityGradient));
5659c678832SJames Wright
5669c678832SJames Wright // -- Compute Nodal SGS tensor
5679c678832SJames Wright PetscCall(DMGetLocalVector(sgs_dd_data->dm_sgs, &SGSNodal_loc));
5680c373b74SJames Wright PetscCall(sgs_dd_data->sgs_nodal_eval(honee, Q_loc, VelocityGradient, SGSNodal_loc));
5699c678832SJames Wright
5709c678832SJames Wright // -- Compute contribution of the SGS stress
571a7dac1d5SJames Wright PetscCall(VecPetscToCeed(SGSNodal_loc, &sgs_nodal_mem_type, sgs_dd_data->sgs_nodal_ceed)); // sgs_nodal_ceed is an implicit input
5729c678832SJames Wright PetscCall(ApplyAddCeedOperatorLocalToLocal(Q_loc, G_loc, sgs_dd_data->op_sgs_apply_ctx));
5739c678832SJames Wright
5749c678832SJames Wright // -- Return local SGS vector
575a7dac1d5SJames Wright PetscCall(VecCeedToPetsc(sgs_dd_data->sgs_nodal_ceed, sgs_nodal_mem_type, SGSNodal_loc));
5769c678832SJames Wright PetscCall(DMRestoreLocalVector(sgs_dd_data->dm_sgs, &SGSNodal_loc));
5778340219bSJames Wright PetscCall(DMRestoreGlobalVector(grad_velo_proj->dm, &VelocityGradient));
578ea615d4cSJames Wright PetscCall(PetscLogEventEnd(HONEE_SgsModel, Q_loc, G_loc, NULL, NULL));
579d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
5809c678832SJames Wright }
5819c678832SJames Wright
58262b7942eSJames Wright // @brief B = A^T, A is NxM, B is MxN
TransposeMatrix(const PetscScalar * A,PetscScalar * B,const PetscInt N,const PetscInt M)583cceb3143SJames Wright static PetscErrorCode TransposeMatrix(const PetscScalar *A, PetscScalar *B, const PetscInt N, const PetscInt M) {
58462b7942eSJames Wright PetscFunctionBeginUser;
58562b7942eSJames Wright for (PetscInt i = 0; i < N; i++) {
58662b7942eSJames Wright for (PetscInt j = 0; j < M; j++) {
58762b7942eSJames Wright B[j * N + i] = A[i * M + j];
58862b7942eSJames Wright }
58962b7942eSJames Wright }
590d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
59162b7942eSJames Wright }
59262b7942eSJames Wright
59362b7942eSJames Wright // @brief Read neural network coefficients from file and put into context struct
SgsDDContextFill(MPI_Comm comm,char data_dir[PETSC_MAX_PATH_LEN],SgsDDContext * psgsdd_ctx)594ad494f68SJames Wright static PetscErrorCode SgsDDContextFill(MPI_Comm comm, char data_dir[PETSC_MAX_PATH_LEN], SgsDDContext *psgsdd_ctx) {
595ad494f68SJames Wright SgsDDContext sgsdd_ctx;
59662b7942eSJames Wright PetscInt num_inputs = (*psgsdd_ctx)->num_inputs, num_outputs = (*psgsdd_ctx)->num_outputs, num_neurons = (*psgsdd_ctx)->num_neurons;
59762b7942eSJames Wright char file_path[PETSC_MAX_PATH_LEN];
59862b7942eSJames Wright PetscScalar *temp;
59962b7942eSJames Wright
60062b7942eSJames Wright PetscFunctionBeginUser;
60162b7942eSJames Wright {
602ad494f68SJames Wright SgsDDContext sgsdd_temp;
60362b7942eSJames Wright PetscCall(PetscNew(&sgsdd_temp));
60462b7942eSJames Wright *sgsdd_temp = **psgsdd_ctx;
60562b7942eSJames Wright sgsdd_temp->offsets.bias1 = 0;
60662b7942eSJames Wright sgsdd_temp->offsets.bias2 = sgsdd_temp->offsets.bias1 + num_neurons;
60762b7942eSJames Wright sgsdd_temp->offsets.weight1 = sgsdd_temp->offsets.bias2 + num_neurons;
60862b7942eSJames Wright sgsdd_temp->offsets.weight2 = sgsdd_temp->offsets.weight1 + num_neurons * num_inputs;
60962b7942eSJames Wright sgsdd_temp->offsets.out_scaling = sgsdd_temp->offsets.weight2 + num_inputs * num_neurons;
61062b7942eSJames Wright PetscInt total_num_scalars = sgsdd_temp->offsets.out_scaling + 2 * num_outputs;
61162b7942eSJames Wright sgsdd_temp->total_bytes = sizeof(*sgsdd_ctx) + total_num_scalars * sizeof(sgsdd_ctx->data[0]);
61262b7942eSJames Wright PetscCall(PetscMalloc(sgsdd_temp->total_bytes, &sgsdd_ctx));
61362b7942eSJames Wright *sgsdd_ctx = *sgsdd_temp;
61462b7942eSJames Wright PetscCall(PetscFree(sgsdd_temp));
61562b7942eSJames Wright }
61662b7942eSJames Wright
61762b7942eSJames Wright PetscCall(PetscSNPrintf(file_path, sizeof file_path, "%s/%s", data_dir, "b1.dat"));
61842454adaSJames Wright PetscCall(PhastaDatFileReadToArrayReal(comm, file_path, &sgsdd_ctx->data[sgsdd_ctx->offsets.bias1]));
61962b7942eSJames Wright PetscCall(PetscSNPrintf(file_path, sizeof file_path, "%s/%s", data_dir, "b2.dat"));
62042454adaSJames Wright PetscCall(PhastaDatFileReadToArrayReal(comm, file_path, &sgsdd_ctx->data[sgsdd_ctx->offsets.bias2]));
62162b7942eSJames Wright PetscCall(PetscSNPrintf(file_path, sizeof file_path, "%s/%s", data_dir, "OutScaling.dat"));
62242454adaSJames Wright PetscCall(PhastaDatFileReadToArrayReal(comm, file_path, &sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling]));
62362b7942eSJames Wright
62462b7942eSJames Wright {
62562b7942eSJames Wright PetscCall(PetscMalloc1(num_inputs * num_neurons, &temp));
62662b7942eSJames Wright PetscCall(PetscSNPrintf(file_path, sizeof file_path, "%s/%s", data_dir, "w1.dat"));
62742454adaSJames Wright PetscCall(PhastaDatFileReadToArrayReal(comm, file_path, temp));
62862b7942eSJames Wright PetscCall(TransposeMatrix(temp, &sgsdd_ctx->data[sgsdd_ctx->offsets.weight1], num_inputs, num_neurons));
62962b7942eSJames Wright PetscCall(PetscFree(temp));
63062b7942eSJames Wright }
63162b7942eSJames Wright {
63262b7942eSJames Wright PetscCall(PetscMalloc1(num_outputs * num_neurons, &temp));
63362b7942eSJames Wright PetscCall(PetscSNPrintf(file_path, sizeof file_path, "%s/%s", data_dir, "w2.dat"));
63442454adaSJames Wright PetscCall(PhastaDatFileReadToArrayReal(comm, file_path, temp));
63562b7942eSJames Wright PetscCall(TransposeMatrix(temp, &sgsdd_ctx->data[sgsdd_ctx->offsets.weight2], num_neurons, num_outputs));
63662b7942eSJames Wright PetscCall(PetscFree(temp));
63762b7942eSJames Wright }
63862b7942eSJames Wright
63962b7942eSJames Wright PetscCall(PetscFree(*psgsdd_ctx));
64062b7942eSJames Wright *psgsdd_ctx = sgsdd_ctx;
641d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
64262b7942eSJames Wright }
64362b7942eSJames Wright
SgsDDSetup(Ceed ceed,Honee honee,ProblemData problem)644e3663b90SJames Wright PetscErrorCode SgsDDSetup(Ceed ceed, Honee honee, ProblemData problem) {
645ee1455b7SJames Wright PetscReal alpha = 0;
646ad494f68SJames Wright SgsDDContext sgsdd_ctx;
6470c373b74SJames Wright MPI_Comm comm = honee->comm;
648ee1455b7SJames Wright char sgs_dd_dir[PETSC_MAX_PATH_LEN] = "./dd_sgs_parameters";
649ad494f68SJames Wright SgsDDSetupData sgs_dd_setup_data;
650cde3d787SJames Wright NewtonianIdealGasContext newt_ctx;
6518340219bSJames Wright NodalProjectionData grad_velo_proj;
65282baf964SJames Wright SgsDDData sgs_dd_data;
65362b7942eSJames Wright
65406f41313SJames Wright PetscFunctionBeginUser;
655cf8f12c8SJames Wright {
656cf8f12c8SJames Wright CeedElemRestriction elem_restr_q;
657cf8f12c8SJames Wright CeedBasis basis_q;
658cf8f12c8SJames Wright
659cf8f12c8SJames Wright PetscCall(DMPlexCeedElemRestrictionCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &elem_restr_q));
660cf8f12c8SJames Wright PetscCall(DMPlexCeedBasisCreate(ceed, honee->dm, DMLABEL_DEFAULT, DMLABEL_DEFAULT_VALUE, 0, 0, &basis_q));
661cf8f12c8SJames Wright // TODO: Should probably move the elem_restr_q and basis_q creation to inside the velocity gradient projection setup???
662cf8f12c8SJames Wright PetscCall(VelocityGradientProjectionSetup(ceed, honee, problem, honee->phys->state_var, elem_restr_q, basis_q, &grad_velo_proj));
663cf8f12c8SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&elem_restr_q));
664cf8f12c8SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&basis_q));
665cf8f12c8SJames Wright }
6660c70a8bcSJames Wright PetscCall(HoneeSetContainer(honee, GRAD_VELO_PROJ_KEY, grad_velo_proj, (PetscCtxDestroyFn *)NodalProjectionDataDestroy));
6679ab09d51SJames Wright
66882baf964SJames Wright PetscCall(PetscNew(&sgs_dd_data));
66982baf964SJames Wright sgs_dd_data->num_comp_inputs = 6;
67082baf964SJames Wright sgs_dd_data->num_comp_outputs = 6;
6710c70a8bcSJames Wright PetscCall(HoneeSetContainer(honee, SGS_DD_DATA_KEY, sgs_dd_data, (PetscCtxDestroyFn *)SgsDDDataDestroy));
67262b7942eSJames Wright
6734c07ec22SJames Wright PetscCall(PetscNew(&sgs_dd_setup_data));
6744c07ec22SJames Wright
6754b0f6111SJames Wright PetscOptionsBegin(comm, NULL, "SGS Data-Driven Model Options", NULL);
67662b7942eSJames Wright PetscCall(PetscOptionsReal("-sgs_model_dd_leakyrelu_alpha", "Slope parameter for Leaky ReLU activation function", NULL, alpha, &alpha, NULL));
67762b7942eSJames Wright PetscCall(PetscOptionsString("-sgs_model_dd_parameter_dir", "Path to directory with model parameters (weights, biases, etc.)", NULL, sgs_dd_dir,
67862b7942eSJames Wright sgs_dd_dir, sizeof(sgs_dd_dir), NULL));
6794c07ec22SJames Wright PetscCall(PetscOptionsDeprecated("-sgs_model_dd_use_fused", NULL, "libCEED 0.12.0", "Use -sgs_model_dd_type instead"));
6804c07ec22SJames Wright sgs_dd_setup_data->sgs_dd_model_implementation = SGS_MODEL_DD_FUSED;
6814c07ec22SJames Wright PetscCall(PetscOptionsEnum("-sgs_model_dd_implementation", "Data-Driven SGS model implementation", NULL, SGSModelDDImplementations,
6824c07ec22SJames Wright (PetscEnum)sgs_dd_setup_data->sgs_dd_model_implementation, (PetscEnum *)&sgs_dd_setup_data->sgs_dd_model_implementation,
6834c07ec22SJames Wright NULL));
68462b7942eSJames Wright PetscOptionsEnd();
68562b7942eSJames Wright
686b87d60b3SJames Wright PetscCall(PetscNew(&sgsdd_ctx));
687f5dc303cSJames Wright *sgsdd_ctx = (struct SgsDDContext_){
688f5dc303cSJames Wright .num_layers = 1,
689f5dc303cSJames Wright .num_inputs = 6,
690f5dc303cSJames Wright .num_outputs = 6,
691f5dc303cSJames Wright .num_neurons = 20,
692f5dc303cSJames Wright .alpha = alpha,
693f5dc303cSJames Wright };
69462b7942eSJames Wright
695ad494f68SJames Wright PetscCall(SgsDDContextFill(comm, sgs_dd_dir, &sgsdd_ctx));
69662b7942eSJames Wright
697ee1455b7SJames Wright // -- Create DM for storing SGS tensor at nodes
69882baf964SJames Wright PetscCall(SgsDDCreateDM(honee->dm, &sgs_dd_data->dm_sgs, honee->app_ctx->degree, honee->app_ctx->q_extra, &sgs_dd_data->num_comp_sgs));
699ee1455b7SJames Wright
700cde3d787SJames Wright PetscCallCeed(ceed, CeedQFunctionContextGetDataRead(problem->apply_vol_ifunction.qfctx, CEED_MEM_HOST, &newt_ctx));
701cde3d787SJames Wright sgsdd_ctx->newt_ctx = *newt_ctx;
702cde3d787SJames Wright PetscCallCeed(ceed, CeedQFunctionContextRestoreDataRead(problem->apply_vol_ifunction.qfctx, &newt_ctx));
7030c373b74SJames Wright PetscCallCeed(ceed, CeedQFunctionContextCreate(honee->ceed, &sgs_dd_setup_data->sgsdd_qfctx));
704b4c37c5cSJames Wright PetscCallCeed(ceed,
705b4c37c5cSJames Wright CeedQFunctionContextSetData(sgs_dd_setup_data->sgsdd_qfctx, CEED_MEM_HOST, CEED_USE_POINTER, sgsdd_ctx->total_bytes, sgsdd_ctx));
706b4c37c5cSJames Wright PetscCallCeed(ceed, CeedQFunctionContextSetDataDestroy(sgs_dd_setup_data->sgsdd_qfctx, CEED_MEM_HOST, FreeContextPetsc));
707ee1455b7SJames Wright
708e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextReferenceCopy(problem->apply_vol_ifunction.qfctx, &sgs_dd_setup_data->ifunction_qfctx));
70940816385SJames Wright
710c38c977aSJames Wright // -- Compute and store anisotropy tensor
711e3663b90SJames Wright PetscCall(GridAnisotropyTensorProjectionSetupApply(ceed, honee, &sgs_dd_setup_data->elem_restr_grid_aniso, &sgs_dd_setup_data->grid_aniso_ceed));
712c38c977aSJames Wright
713ee1455b7SJames Wright // -- Create Nodal Evaluation Operator
7144c07ec22SJames Wright switch (sgs_dd_setup_data->sgs_dd_model_implementation) {
7154c07ec22SJames Wright case SGS_MODEL_DD_FUSED:
716e3663b90SJames Wright PetscCall(SgsDDSetupNodalEvaluation_Fused(ceed, honee, sgs_dd_setup_data));
7174c07ec22SJames Wright break;
7184c07ec22SJames Wright case SGS_MODEL_DD_SEQENTIAL_CEED:
7194c07ec22SJames Wright case SGS_MODEL_DD_SEQENTIAL_TORCH:
720e3663b90SJames Wright PetscCall(SgsDDSetupNodalEvaluation_Sequential(ceed, honee, sgs_dd_setup_data));
7214c07ec22SJames Wright break;
7224c07ec22SJames Wright }
723ee1455b7SJames Wright
7249c678832SJames Wright // -- Create Operator to evalutate residual of SGS stress
725e3663b90SJames Wright PetscCall(SgsSetupNodalIFunction(ceed, honee, sgs_dd_setup_data));
7269c678832SJames Wright
727ad494f68SJames Wright PetscCall(SgsDDSetupDataDestroy(sgs_dd_setup_data));
728d949ddfcSJames Wright PetscFunctionReturn(PETSC_SUCCESS);
72962b7942eSJames Wright }
730