xref: /libCEED/tests/t524-operator.c (revision d1d35e2f02dc969aee8debf3fd943dd784aa847a)
/// @file
/// Test CeedOperatorApplyAdd for composite operator
/// \test CeedOperatorApplyAdd for composite operator
#include <ceed.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include "t320-basis.h"
#include "t510-operator.h"
9250756a7Sjeremylt 
/* The mesh comprises two rows of 3 quadrilaterals followed by one row
     of 6 triangles:
   _ _ _
  |_|_|_|
  |_|_|_|
  |/|/|/|

*/
18250756a7Sjeremylt 
19250756a7Sjeremylt int main(int argc, char **argv) {
20250756a7Sjeremylt   Ceed ceed;
21*d1d35e2fSjeremylt   CeedElemRestriction elem_restr_x_tet, elem_restr_u_tet,
22*d1d35e2fSjeremylt                       elem_restr_qd_i_tet,
23*d1d35e2fSjeremylt                       elem_restr_x_hex, elem_restr_u_hex,
24*d1d35e2fSjeremylt                       elem_restr_qd_i_hex;
25*d1d35e2fSjeremylt   CeedBasis basis_x_tet, basis_u_tet,
26*d1d35e2fSjeremylt             basis_x_hex, basis_u_hex;
27*d1d35e2fSjeremylt   CeedQFunction qf_setup_tet, qf_mass_tet,
28*d1d35e2fSjeremylt                 qf_setup_hex, qf_mass_hex;
29*d1d35e2fSjeremylt   CeedOperator op_setup_tet, op_mass_tet,
30*d1d35e2fSjeremylt                op_setup_hex, op_mass_hex,
31250756a7Sjeremylt                op_setup, op_mass;
32*d1d35e2fSjeremylt   CeedVector q_data_tet, q_data_hex, X, U, V;
33250756a7Sjeremylt   const CeedScalar *hv;
34*d1d35e2fSjeremylt   CeedInt nelem_tet = 6, P_tet = 6, Q_tet = 4,
35*d1d35e2fSjeremylt           nelem_hex = 6, P_hex = 3, Q_hex = 4, dim = 2;
36250756a7Sjeremylt   CeedInt nx = 3, ny = 3,
37*d1d35e2fSjeremylt           nx_tet = 3, ny_tet = 1, nx_hex = 3;
38250756a7Sjeremylt   CeedInt row, col, offset;
39*d1d35e2fSjeremylt   CeedInt num_dofs = (nx*2+1)*(ny*2+1),
40*d1d35e2fSjeremylt           num_qpts_tet = nelem_tet*Q_tet,
41*d1d35e2fSjeremylt           num_qpts_hex = nelem_hex*Q_hex*Q_hex;
42*d1d35e2fSjeremylt   CeedInt ind_x_tet[nelem_tet*P_tet],
43*d1d35e2fSjeremylt           ind_x_hex[nelem_hex*P_hex*P_hex];
44*d1d35e2fSjeremylt   CeedScalar x[dim*num_dofs];
45*d1d35e2fSjeremylt   CeedScalar q_ref[dim*Q_tet], q_weight[Q_tet];
46*d1d35e2fSjeremylt   CeedScalar interp[P_tet*Q_tet], grad[dim*P_tet*Q_tet];
47250756a7Sjeremylt   CeedScalar sum;
48250756a7Sjeremylt 
49250756a7Sjeremylt   CeedInit(argv[1], &ceed);
50250756a7Sjeremylt 
51250756a7Sjeremylt   // DoF Coordinates
52250756a7Sjeremylt   for (CeedInt i=0; i<ny*2+1; i++)
53250756a7Sjeremylt     for (CeedInt j=0; j<nx*2+1; j++) {
54*d1d35e2fSjeremylt       x[i+j*(ny*2+1)+0*num_dofs] = (CeedScalar) i / (2*ny);
55*d1d35e2fSjeremylt       x[i+j*(ny*2+1)+1*num_dofs] = (CeedScalar) j / (2*nx);
56250756a7Sjeremylt     }
57*d1d35e2fSjeremylt   CeedVectorCreate(ceed, dim*num_dofs, &X);
58250756a7Sjeremylt   CeedVectorSetArray(X, CEED_MEM_HOST, CEED_USE_POINTER, x);
59250756a7Sjeremylt 
60250756a7Sjeremylt   // Qdata Vectors
61*d1d35e2fSjeremylt   CeedVectorCreate(ceed, num_qpts_tet, &q_data_tet);
62*d1d35e2fSjeremylt   CeedVectorCreate(ceed, num_qpts_hex, &q_data_hex);
63250756a7Sjeremylt 
64*d1d35e2fSjeremylt   // _tet Elements
65*d1d35e2fSjeremylt   for (CeedInt i=0; i<nelem_tet/2; i++) {
66*d1d35e2fSjeremylt     col = i % nx_tet;
67*d1d35e2fSjeremylt     row = i / nx_tet;
68*d1d35e2fSjeremylt     offset = col*2 + row*(nx_tet*2+1)*2;
69250756a7Sjeremylt 
70*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  0] =  2 + offset;
71*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  1] =  9 + offset;
72*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  2] = 16 + offset;
73*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  3] =  1 + offset;
74*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  4] =  8 + offset;
75*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  5] =  0 + offset;
76250756a7Sjeremylt 
77*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  6] = 14 + offset;
78*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  7] =  7 + offset;
79*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  8] =  0 + offset;
80*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet +  9] = 15 + offset;
81*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet + 10] =  8 + offset;
82*d1d35e2fSjeremylt     ind_x_tet[i*2*P_tet + 11] = 16 + offset;
83250756a7Sjeremylt   }
84250756a7Sjeremylt 
85250756a7Sjeremylt   // -- Restrictions
86*d1d35e2fSjeremylt   CeedElemRestrictionCreate(ceed, nelem_tet, P_tet, dim, num_dofs, dim*num_dofs,
87*d1d35e2fSjeremylt                             CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet,
88*d1d35e2fSjeremylt                             &elem_restr_x_tet);
89250756a7Sjeremylt 
90*d1d35e2fSjeremylt   CeedElemRestrictionCreate(ceed, nelem_tet, P_tet, 1, 1, num_dofs,
91*d1d35e2fSjeremylt                             CEED_MEM_HOST, CEED_USE_POINTER, ind_x_tet,
92*d1d35e2fSjeremylt                             &elem_restr_u_tet);
93*d1d35e2fSjeremylt   CeedInt strides_qd_tet[3] = {1, Q_tet, Q_tet};
94*d1d35e2fSjeremylt   CeedElemRestrictionCreateStrided(ceed,  nelem_tet, Q_tet, 1, num_qpts_tet,
95*d1d35e2fSjeremylt                                    strides_qd_tet, &elem_restr_qd_i_tet);
96250756a7Sjeremylt 
97250756a7Sjeremylt   // -- Bases
98*d1d35e2fSjeremylt   buildmats(q_ref, q_weight, interp, grad);
99*d1d35e2fSjeremylt   CeedBasisCreateH1(ceed, CEED_TRIANGLE, dim, P_tet, Q_tet, interp, grad, q_ref,
100*d1d35e2fSjeremylt                     q_weight, &basis_x_tet);
101250756a7Sjeremylt 
102*d1d35e2fSjeremylt   buildmats(q_ref, q_weight, interp, grad);
103*d1d35e2fSjeremylt   CeedBasisCreateH1(ceed, CEED_TRIANGLE, 1, P_tet, Q_tet, interp, grad, q_ref,
104*d1d35e2fSjeremylt                     q_weight, &basis_u_tet);
105250756a7Sjeremylt 
106250756a7Sjeremylt   // -- QFunctions
107*d1d35e2fSjeremylt   CeedQFunctionCreateInterior(ceed, 1, setup, setup_loc, &qf_setup_tet);
108*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_setup_tet, "_weight", 1, CEED_EVAL_WEIGHT);
109*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_setup_tet, "dx", dim*dim, CEED_EVAL_GRAD);
110*d1d35e2fSjeremylt   CeedQFunctionAddOutput(qf_setup_tet, "rho", 1, CEED_EVAL_NONE);
111250756a7Sjeremylt 
112*d1d35e2fSjeremylt   CeedQFunctionCreateInterior(ceed, 1, mass, mass_loc, &qf_mass_tet);
113*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_mass_tet, "rho", 1, CEED_EVAL_NONE);
114*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_mass_tet, "u", 1, CEED_EVAL_INTERP);
115*d1d35e2fSjeremylt   CeedQFunctionAddOutput(qf_mass_tet, "v", 1, CEED_EVAL_INTERP);
116250756a7Sjeremylt 
117250756a7Sjeremylt   // -- Operators
118*d1d35e2fSjeremylt   // ---- Setup _tet
119*d1d35e2fSjeremylt   CeedOperatorCreate(ceed, qf_setup_tet, CEED_QFUNCTION_NONE,
120*d1d35e2fSjeremylt                      CEED_QFUNCTION_NONE, &op_setup_tet);
121*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_tet, "_weight", CEED_ELEMRESTRICTION_NONE,
122*d1d35e2fSjeremylt                        basis_x_tet,
123a8d32208Sjeremylt                        CEED_VECTOR_NONE);
124*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_tet, "dx", elem_restr_x_tet, basis_x_tet,
125a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
126*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_tet, "rho", elem_restr_qd_i_tet,
127*d1d35e2fSjeremylt                        CEED_BASIS_COLLOCATED, q_data_tet);
128*d1d35e2fSjeremylt   // ---- Mass _tet
129*d1d35e2fSjeremylt   CeedOperatorCreate(ceed, qf_mass_tet, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE,
130*d1d35e2fSjeremylt                      &op_mass_tet);
131*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_tet, "rho", elem_restr_qd_i_tet,
132*d1d35e2fSjeremylt                        CEED_BASIS_COLLOCATED,
133*d1d35e2fSjeremylt                        q_data_tet);
134*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_tet, "u", elem_restr_u_tet, basis_u_tet,
135a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
136*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_tet, "v", elem_restr_u_tet, basis_u_tet,
137a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
138250756a7Sjeremylt 
139*d1d35e2fSjeremylt   // _hex Elements
140*d1d35e2fSjeremylt   for (CeedInt i=0; i<nelem_hex; i++) {
141*d1d35e2fSjeremylt     col = i % nx_hex;
142*d1d35e2fSjeremylt     row = i / nx_hex;
143*d1d35e2fSjeremylt     offset = (nx_tet*2+1)*(ny_tet*2)*(1+row) + col*2;
144*d1d35e2fSjeremylt     for (CeedInt j=0; j<P_hex; j++)
145*d1d35e2fSjeremylt       for (CeedInt k=0; k<P_hex; k++)
146*d1d35e2fSjeremylt         ind_x_hex[P_hex*(P_hex*i+k)+j] = offset + k*(nx_hex*2+1) + j;
147250756a7Sjeremylt   }
148250756a7Sjeremylt 
149250756a7Sjeremylt   // -- Restrictions
150*d1d35e2fSjeremylt   CeedElemRestrictionCreate(ceed, nelem_hex, P_hex*P_hex, dim, num_dofs,
151*d1d35e2fSjeremylt                             dim*num_dofs,
152*d1d35e2fSjeremylt                             CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex,
153*d1d35e2fSjeremylt                             &elem_restr_x_hex);
154250756a7Sjeremylt 
155*d1d35e2fSjeremylt   CeedElemRestrictionCreate(ceed, nelem_hex, P_hex*P_hex, 1, 1, num_dofs,
156*d1d35e2fSjeremylt                             CEED_MEM_HOST, CEED_USE_POINTER, ind_x_hex,
157*d1d35e2fSjeremylt                             &elem_restr_u_hex);
158*d1d35e2fSjeremylt   CeedInt strides_qd_hex[3] = {1, Q_hex*Q_hex, Q_hex*Q_hex};
159*d1d35e2fSjeremylt   CeedElemRestrictionCreateStrided(ceed, nelem_hex, Q_hex*Q_hex, 1, num_qpts_hex,
160*d1d35e2fSjeremylt                                    strides_qd_hex, &elem_restr_qd_i_hex);
161250756a7Sjeremylt 
162250756a7Sjeremylt   // -- Bases
163*d1d35e2fSjeremylt   CeedBasisCreateTensorH1Lagrange(ceed, dim, dim, P_hex, Q_hex, CEED_GAUSS,
164*d1d35e2fSjeremylt                                   &basis_x_hex);
165*d1d35e2fSjeremylt   CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, P_hex, Q_hex, CEED_GAUSS,
166*d1d35e2fSjeremylt                                   &basis_u_hex);
167250756a7Sjeremylt 
168250756a7Sjeremylt   // -- QFunctions
169*d1d35e2fSjeremylt   CeedQFunctionCreateInterior(ceed, 1, setup, setup_loc, &qf_setup_hex);
170*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_setup_hex, "_weight", 1, CEED_EVAL_WEIGHT);
171*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_setup_hex, "dx", dim*dim, CEED_EVAL_GRAD);
172*d1d35e2fSjeremylt   CeedQFunctionAddOutput(qf_setup_hex, "rho", 1, CEED_EVAL_NONE);
173250756a7Sjeremylt 
174*d1d35e2fSjeremylt   CeedQFunctionCreateInterior(ceed, 1, mass, mass_loc, &qf_mass_hex);
175*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_mass_hex, "rho", 1, CEED_EVAL_NONE);
176*d1d35e2fSjeremylt   CeedQFunctionAddInput(qf_mass_hex, "u", 1, CEED_EVAL_INTERP);
177*d1d35e2fSjeremylt   CeedQFunctionAddOutput(qf_mass_hex, "v", 1, CEED_EVAL_INTERP);
178250756a7Sjeremylt 
179250756a7Sjeremylt   // -- Operators
180*d1d35e2fSjeremylt   CeedOperatorCreate(ceed, qf_setup_hex, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE,
181*d1d35e2fSjeremylt                      &op_setup_hex);
182*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_hex, "_weight", CEED_ELEMRESTRICTION_NONE,
183*d1d35e2fSjeremylt                        basis_x_hex,
184a8d32208Sjeremylt                        CEED_VECTOR_NONE);
185*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_hex, "dx", elem_restr_x_hex, basis_x_hex,
186a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
187*d1d35e2fSjeremylt   CeedOperatorSetField(op_setup_hex, "rho", elem_restr_qd_i_hex,
188*d1d35e2fSjeremylt                        CEED_BASIS_COLLOCATED, q_data_hex);
189250756a7Sjeremylt 
190*d1d35e2fSjeremylt   CeedOperatorCreate(ceed, qf_mass_hex, CEED_QFUNCTION_NONE, CEED_QFUNCTION_NONE,
191*d1d35e2fSjeremylt                      &op_mass_hex);
192*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_hex, "rho", elem_restr_qd_i_hex,
193*d1d35e2fSjeremylt                        CEED_BASIS_COLLOCATED,
194*d1d35e2fSjeremylt                        q_data_hex);
195*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_hex, "u", elem_restr_u_hex, basis_u_hex,
196a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
197*d1d35e2fSjeremylt   CeedOperatorSetField(op_mass_hex, "v", elem_restr_u_hex, basis_u_hex,
198a8d32208Sjeremylt                        CEED_VECTOR_ACTIVE);
199250756a7Sjeremylt 
200250756a7Sjeremylt   // Composite Operators
201250756a7Sjeremylt   CeedCompositeOperatorCreate(ceed, &op_setup);
202*d1d35e2fSjeremylt   CeedCompositeOperatorAddSub(op_setup, op_setup_tet);
203*d1d35e2fSjeremylt   CeedCompositeOperatorAddSub(op_setup, op_setup_hex);
204250756a7Sjeremylt 
205250756a7Sjeremylt   CeedCompositeOperatorCreate(ceed, &op_mass);
206*d1d35e2fSjeremylt   CeedCompositeOperatorAddSub(op_mass, op_mass_tet);
207*d1d35e2fSjeremylt   CeedCompositeOperatorAddSub(op_mass, op_mass_hex);
208250756a7Sjeremylt 
209250756a7Sjeremylt   // Apply Setup Operator
210250756a7Sjeremylt   CeedOperatorApply(op_setup, X, CEED_VECTOR_NONE, CEED_REQUEST_IMMEDIATE);
211250756a7Sjeremylt 
212250756a7Sjeremylt   // Apply Mass Operator
213*d1d35e2fSjeremylt   CeedVectorCreate(ceed, num_dofs, &U);
214250756a7Sjeremylt   CeedVectorSetValue(U, 1.0);
215*d1d35e2fSjeremylt   CeedVectorCreate(ceed, num_dofs, &V);
216250756a7Sjeremylt   CeedVectorSetValue(V, 0.0);
217250756a7Sjeremylt 
218250756a7Sjeremylt   // Apply
219250756a7Sjeremylt   CeedOperatorApplyAdd(op_mass, U, V, CEED_REQUEST_IMMEDIATE);
220250756a7Sjeremylt 
221250756a7Sjeremylt   // Check output
222250756a7Sjeremylt   CeedVectorGetArrayRead(V, CEED_MEM_HOST, &hv);
223250756a7Sjeremylt   sum = 0.;
224*d1d35e2fSjeremylt   for (CeedInt i=0; i<num_dofs; i++)
225250756a7Sjeremylt     sum += hv[i];
226250756a7Sjeremylt   if (fabs(sum-1.)>1e-10) printf("Computed Area: %f != True Area: 1.0\n", sum);
227250756a7Sjeremylt   CeedVectorRestoreArrayRead(V, &hv);
228250756a7Sjeremylt 
229250756a7Sjeremylt   // Apply Add
230250756a7Sjeremylt   CeedVectorSetValue(V, 1.0);
231250756a7Sjeremylt   CeedOperatorApplyAdd(op_mass, U, V, CEED_REQUEST_IMMEDIATE);
232250756a7Sjeremylt 
233250756a7Sjeremylt   // Check output
234250756a7Sjeremylt   CeedVectorGetArrayRead(V, CEED_MEM_HOST, &hv);
235*d1d35e2fSjeremylt   sum = -num_dofs;
236*d1d35e2fSjeremylt   for (CeedInt i=0; i<num_dofs; i++)
237250756a7Sjeremylt     sum += hv[i];
238250756a7Sjeremylt   if (fabs(sum-1.)>1e-10) printf("Computed Area: %f != True Area: 1.0\n", sum);
239250756a7Sjeremylt   CeedVectorRestoreArrayRead(V, &hv);
240250756a7Sjeremylt 
241250756a7Sjeremylt   // Cleanup
242*d1d35e2fSjeremylt   CeedQFunctionDestroy(&qf_setup_tet);
243*d1d35e2fSjeremylt   CeedQFunctionDestroy(&qf_mass_tet);
244*d1d35e2fSjeremylt   CeedOperatorDestroy(&op_setup_tet);
245*d1d35e2fSjeremylt   CeedOperatorDestroy(&op_mass_tet);
246*d1d35e2fSjeremylt   CeedQFunctionDestroy(&qf_setup_hex);
247*d1d35e2fSjeremylt   CeedQFunctionDestroy(&qf_mass_hex);
248*d1d35e2fSjeremylt   CeedOperatorDestroy(&op_setup_hex);
249*d1d35e2fSjeremylt   CeedOperatorDestroy(&op_mass_hex);
250250756a7Sjeremylt   CeedOperatorDestroy(&op_setup);
251250756a7Sjeremylt   CeedOperatorDestroy(&op_mass);
252*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_u_tet);
253*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_x_tet);
254*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_qd_i_tet);
255*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_u_hex);
256*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_x_hex);
257*d1d35e2fSjeremylt   CeedElemRestrictionDestroy(&elem_restr_qd_i_hex);
258*d1d35e2fSjeremylt   CeedBasisDestroy(&basis_u_tet);
259*d1d35e2fSjeremylt   CeedBasisDestroy(&basis_x_tet);
260*d1d35e2fSjeremylt   CeedBasisDestroy(&basis_u_hex);
261*d1d35e2fSjeremylt   CeedBasisDestroy(&basis_x_hex);
262250756a7Sjeremylt   CeedVectorDestroy(&X);
263250756a7Sjeremylt   CeedVectorDestroy(&U);
264250756a7Sjeremylt   CeedVectorDestroy(&V);
265*d1d35e2fSjeremylt   CeedVectorDestroy(&q_data_tet);
266*d1d35e2fSjeremylt   CeedVectorDestroy(&q_data_hex);
267250756a7Sjeremylt   CeedDestroy(&ceed);
268250756a7Sjeremylt   return 0;
269250756a7Sjeremylt }
270