xref: /libCEED/examples/ceed/ex2-surface.c (revision 66087c0803b66a861339d30698fcb9988ebff34d)
1*66087c08SValeria Barra // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
2*66087c08SValeria Barra // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
3*66087c08SValeria Barra // All Rights reserved. See files LICENSE and NOTICE for details.
4*66087c08SValeria Barra //
5*66087c08SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software
6*66087c08SValeria Barra // libraries and APIs for efficient high-order finite element and spectral
7*66087c08SValeria Barra // element discretizations for exascale applications. For more information and
8*66087c08SValeria Barra // source code availability see http://github.com/ceed.
9*66087c08SValeria Barra //
10*66087c08SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11*66087c08SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office
12*66087c08SValeria Barra // of Science and the National Nuclear Security Administration) responsible for
13*66087c08SValeria Barra // the planning and preparation of a capable exascale ecosystem, including
14*66087c08SValeria Barra // software, applications, hardware, advanced system engineering and early
15*66087c08SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative.
16*66087c08SValeria Barra 
17*66087c08SValeria Barra //                             libCEED Example 2
18*66087c08SValeria Barra //
19*66087c08SValeria Barra // This example illustrates a simple usage of libCEED to compute the surface
20*66087c08SValeria Barra // area of a 3D body using matrix-free application of a diffusion operator.
21*66087c08SValeria Barra // Arbitrary mesh and solution orders in 1D, 2D and 3D are supported from the
22*66087c08SValeria Barra // same code.
23*66087c08SValeria Barra //
24*66087c08SValeria Barra // The example has no dependencies, and is designed to be self-contained. For
25*66087c08SValeria Barra // additional examples that use external discretization libraries (MFEM, PETSc,
26*66087c08SValeria Barra // etc.) see the subdirectories in libceed/examples.
27*66087c08SValeria Barra //
28*66087c08SValeria Barra // All libCEED objects use a Ceed device object constructed based on a command
29*66087c08SValeria Barra // line argument (-ceed).
30*66087c08SValeria Barra //
31*66087c08SValeria Barra // Build with:
32*66087c08SValeria Barra //
33*66087c08SValeria Barra //     make ex2-surface [CEED_DIR=</path/to/libceed>]
34*66087c08SValeria Barra //
35*66087c08SValeria Barra // Sample runs:
36*66087c08SValeria Barra //
37*66087c08SValeria Barra //     ./ex2-surface
38*66087c08SValeria Barra //     ./ex2-surface -ceed /cpu/self
39*66087c08SValeria Barra //     ./ex2-surface -ceed /gpu/occa
40*66087c08SValeria Barra //     ./ex2-surface -ceed /cpu/occa
41*66087c08SValeria Barra //     ./ex2-surface -ceed /omp/occa
42*66087c08SValeria Barra //     ./ex2-surface -ceed /ocl/occa
//     ./ex2-surface -d 2 -s 4096
//     ./ex2-surface -o 3 -q 5
//     ./ex2-surface -d 1 -o 8 -g
46*66087c08SValeria Barra //
47*66087c08SValeria Barra // Next line is grep'd from tap.sh to set its arguments
48*66087c08SValeria Barra // Test in 1D-3D
49*66087c08SValeria Barra //TESTARGS -ceed {ceed_resource} -d 2 -t
50*66087c08SValeria Barra //TESTARGS -ceed {ceed_resource} -d 1 -t -g
51*66087c08SValeria Barra //TESTARGS -ceed {ceed_resource} -d 2 -t -g
52*66087c08SValeria Barra //TESTARGS -ceed {ceed_resource} -d 3 -t -g
53*66087c08SValeria Barra 
54*66087c08SValeria Barra /// @file
55*66087c08SValeria Barra /// libCEED example using diffusion operator to compute surface area
56*66087c08SValeria Barra 
57*66087c08SValeria Barra #include <ceed.h>
58*66087c08SValeria Barra #include <stdlib.h>
59*66087c08SValeria Barra #include <math.h>
60*66087c08SValeria Barra #include <string.h>
61*66087c08SValeria Barra 
62*66087c08SValeria Barra #include "ex2-surface.h"
63*66087c08SValeria Barra 
64*66087c08SValeria Barra // Auxiliary functions.
65*66087c08SValeria Barra int GetCartesianMeshSize(int dim, int order, int prob_size, int nxyz[3]);
66*66087c08SValeria Barra int BuildCartesianRestriction(Ceed ceed, int dim, int nxyz[3], int order,
67*66087c08SValeria Barra                               int ncomp, CeedInt *size, CeedInt num_qpts,
68*66087c08SValeria Barra                               CeedElemRestriction *restr,
69*66087c08SValeria Barra                               CeedElemRestriction *restr_i);
70*66087c08SValeria Barra int SetCartesianMeshCoords(int dim, int nxyz[3], int mesh_order,
71*66087c08SValeria Barra                            CeedVector mesh_coords);
72*66087c08SValeria Barra CeedScalar TransformMeshCoords(int dim, int mesh_size, CeedVector mesh_coords);
73*66087c08SValeria Barra 
74*66087c08SValeria Barra 
75*66087c08SValeria Barra int main(int argc, const char *argv[]) {
76*66087c08SValeria Barra   const char *ceed_spec = "/cpu/self";
77*66087c08SValeria Barra   int dim        = 3;           // dimension of the mesh
78*66087c08SValeria Barra   int ncompx     = 3;           // number of x components
79*66087c08SValeria Barra   int mesh_order = 4;           // polynomial degree for the mesh
80*66087c08SValeria Barra   int sol_order  = 4;           // polynomial degree for the solution
81*66087c08SValeria Barra   int num_qpts   = sol_order+2; // number of 1D quadrature points
82*66087c08SValeria Barra   int prob_size  = -1;          // approximate problem size
83*66087c08SValeria Barra   int help = 0, test = 0, gallery = 0;
84*66087c08SValeria Barra 
85*66087c08SValeria Barra   // Process command line arguments.
86*66087c08SValeria Barra   for (int ia = 1; ia < argc; ia++) {
87*66087c08SValeria Barra     int next_arg = ((ia+1) < argc), parse_error = 0;
88*66087c08SValeria Barra     if (!strcmp(argv[ia],"-h")) {
89*66087c08SValeria Barra       help = 1;
90*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-c") || !strcmp(argv[ia],"-ceed")) {
91*66087c08SValeria Barra       parse_error = next_arg ? ceed_spec = argv[++ia], 0 : 1;
92*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-d")) {
93*66087c08SValeria Barra       parse_error = next_arg ? dim = atoi(argv[++ia]), 0 : 1;
94*66087c08SValeria Barra       ncompx = dim;
95*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-m")) {
96*66087c08SValeria Barra       parse_error = next_arg ? mesh_order = atoi(argv[++ia]), 0 : 1;
97*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-o")) {
98*66087c08SValeria Barra       parse_error = next_arg ? sol_order = atoi(argv[++ia]), 0 : 1;
99*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-q")) {
100*66087c08SValeria Barra       parse_error = next_arg ? num_qpts = atoi(argv[++ia]), 0 : 1;
101*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-s")) {
102*66087c08SValeria Barra       parse_error = next_arg ? prob_size = atoi(argv[++ia]), 0 : 1;
103*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-t")) {
104*66087c08SValeria Barra       test = 1;
105*66087c08SValeria Barra     } else if (!strcmp(argv[ia],"-g")) {
106*66087c08SValeria Barra       gallery = 1;
107*66087c08SValeria Barra     }
108*66087c08SValeria Barra     if (parse_error) {
109*66087c08SValeria Barra       printf("Error parsing command line options.\n");
110*66087c08SValeria Barra       return 1;
111*66087c08SValeria Barra     }
112*66087c08SValeria Barra   }
113*66087c08SValeria Barra   if (prob_size < 0) prob_size = test ? 16*16*dim*dim : 256*1024;
114*66087c08SValeria Barra 
115*66087c08SValeria Barra   // Set mesh_order = sol_order.
116*66087c08SValeria Barra   mesh_order = fmax(mesh_order, sol_order);
117*66087c08SValeria Barra   sol_order = mesh_order;
118*66087c08SValeria Barra 
119*66087c08SValeria Barra   // Print the values of all options:
120*66087c08SValeria Barra   if (!test || help) {
121*66087c08SValeria Barra     printf("Selected options: [command line option] : <current value>\n");
122*66087c08SValeria Barra     printf("  Ceed specification [-c] : %s\n", ceed_spec);
123*66087c08SValeria Barra     printf("  Mesh dimension     [-d] : %d\n", dim);
124*66087c08SValeria Barra     printf("  Mesh order         [-m] : %d\n", mesh_order);
125*66087c08SValeria Barra     printf("  Solution order     [-o] : %d\n", sol_order);
126*66087c08SValeria Barra     printf("  Num. 1D quadr. pts [-q] : %d\n", num_qpts);
127*66087c08SValeria Barra     printf("  Approx. # unknowns [-s] : %d\n", prob_size);
128*66087c08SValeria Barra     printf("  QFunction source   [-g] : %s\n", gallery?"gallery":"header");
129*66087c08SValeria Barra     if (help) {
130*66087c08SValeria Barra       printf("Test/quiet mode is %s\n", (test?"ON":"OFF (use -t to enable)"));
131*66087c08SValeria Barra       return 0;
132*66087c08SValeria Barra     }
133*66087c08SValeria Barra     printf("\n");
134*66087c08SValeria Barra   }
135*66087c08SValeria Barra 
136*66087c08SValeria Barra   // Select appropriate backend and logical device based on the <ceed-spec>
137*66087c08SValeria Barra   // command line argument.
138*66087c08SValeria Barra   Ceed ceed;
139*66087c08SValeria Barra   CeedInit(ceed_spec, &ceed);
140*66087c08SValeria Barra 
141*66087c08SValeria Barra   // Construct the mesh and solution bases.
142*66087c08SValeria Barra   CeedBasis mesh_basis, sol_basis;
143*66087c08SValeria Barra   CeedBasisCreateTensorH1Lagrange(ceed, dim, ncompx, mesh_order+1, num_qpts,
144*66087c08SValeria Barra                                   CEED_GAUSS, &mesh_basis);
145*66087c08SValeria Barra   CeedBasisCreateTensorH1Lagrange(ceed, dim, 1, sol_order+1, num_qpts,
146*66087c08SValeria Barra                                   CEED_GAUSS, &sol_basis);
147*66087c08SValeria Barra 
148*66087c08SValeria Barra   // Determine the mesh size based on the given approximate problem size.
149*66087c08SValeria Barra   int nxyz[3];
150*66087c08SValeria Barra   GetCartesianMeshSize(dim, sol_order, prob_size, nxyz);
151*66087c08SValeria Barra 
152*66087c08SValeria Barra   if (!test) {
153*66087c08SValeria Barra     printf("Mesh size: nx = %d", nxyz[0]);
154*66087c08SValeria Barra     if (dim > 1) { printf(", ny = %d", nxyz[1]); }
155*66087c08SValeria Barra     if (dim > 2) { printf(", nz = %d", nxyz[2]); }
156*66087c08SValeria Barra     printf("\n");
157*66087c08SValeria Barra   }
158*66087c08SValeria Barra 
159*66087c08SValeria Barra   // Build CeedElemRestriction objects describing the mesh and solution discrete
160*66087c08SValeria Barra   // representations.
161*66087c08SValeria Barra   CeedInt mesh_size, sol_size;
162*66087c08SValeria Barra   CeedElemRestriction mesh_restr, sol_restr, mesh_restr_i, sol_restr_i,
163*66087c08SValeria Barra                       qdata_restr_i;
164*66087c08SValeria Barra   BuildCartesianRestriction(ceed, dim, nxyz, mesh_order, ncompx, &mesh_size,
165*66087c08SValeria Barra                             num_qpts, &mesh_restr, &mesh_restr_i);
166*66087c08SValeria Barra   BuildCartesianRestriction(ceed, dim, nxyz, sol_order, dim*(dim+1)/2,
167*66087c08SValeria Barra                             &sol_size, num_qpts, NULL, &qdata_restr_i);
168*66087c08SValeria Barra   BuildCartesianRestriction(ceed, dim, nxyz, sol_order, 1, &sol_size,
169*66087c08SValeria Barra                             num_qpts, &sol_restr, &sol_restr_i);
170*66087c08SValeria Barra   if (!test) {
171*66087c08SValeria Barra     printf("Number of mesh nodes     : %d\n", mesh_size/dim);
172*66087c08SValeria Barra     printf("Number of solution nodes : %d\n", sol_size);
173*66087c08SValeria Barra   }
174*66087c08SValeria Barra 
175*66087c08SValeria Barra   // Create a CeedVector with the mesh coordinates.
176*66087c08SValeria Barra   CeedVector mesh_coords;
177*66087c08SValeria Barra   CeedVectorCreate(ceed, mesh_size, &mesh_coords);
178*66087c08SValeria Barra   SetCartesianMeshCoords(dim, nxyz, mesh_order, mesh_coords);
179*66087c08SValeria Barra 
180*66087c08SValeria Barra   // Apply a transformation to the mesh.
181*66087c08SValeria Barra   CeedScalar exact_sa = TransformMeshCoords(dim, mesh_size, mesh_coords);
182*66087c08SValeria Barra 
183*66087c08SValeria Barra   // Context data to be passed to the 'f_build_diff' Q-function.
184*66087c08SValeria Barra   struct BuildContext build_ctx;
185*66087c08SValeria Barra   build_ctx.dim = build_ctx.space_dim = dim;
186*66087c08SValeria Barra 
187*66087c08SValeria Barra   // Create the Q-function that builds the diffusion operator (i.e. computes its
188*66087c08SValeria Barra   // quadrature data) and set its context data.
189*66087c08SValeria Barra   CeedQFunction build_qfunc;
190*66087c08SValeria Barra   switch (gallery) {
191*66087c08SValeria Barra   case 0:
192*66087c08SValeria Barra     // This creates the QFunction directly.
193*66087c08SValeria Barra     CeedQFunctionCreateInterior(ceed, 1, f_build_diff,
194*66087c08SValeria Barra                                 f_build_diff_loc, &build_qfunc);
195*66087c08SValeria Barra     CeedQFunctionAddInput(build_qfunc, "dx", ncompx*dim, CEED_EVAL_GRAD);
196*66087c08SValeria Barra     CeedQFunctionAddInput(build_qfunc, "weights", 1, CEED_EVAL_WEIGHT);
197*66087c08SValeria Barra     CeedQFunctionAddOutput(build_qfunc, "qdata", dim*(dim+1)/2, CEED_EVAL_NONE);
198*66087c08SValeria Barra     CeedQFunctionSetContext(build_qfunc, &build_ctx, sizeof(build_ctx));
199*66087c08SValeria Barra     break;
200*66087c08SValeria Barra   case 1: {
201*66087c08SValeria Barra     // This creates the QFunction via the gallery.
202*66087c08SValeria Barra     char name[16] = "";
203*66087c08SValeria Barra     snprintf(name, sizeof name, "Poisson%dDBuild", dim);
204*66087c08SValeria Barra     CeedQFunctionCreateInteriorByName(ceed, name, &build_qfunc);
205*66087c08SValeria Barra     break;
206*66087c08SValeria Barra   }
207*66087c08SValeria Barra   }
208*66087c08SValeria Barra 
209*66087c08SValeria Barra   // Create the operator that builds the quadrature data for the diffusion
210*66087c08SValeria Barra   // operator.
211*66087c08SValeria Barra   CeedOperator build_oper;
212*66087c08SValeria Barra   CeedOperatorCreate(ceed, build_qfunc, CEED_QFUNCTION_NONE,
213*66087c08SValeria Barra                      CEED_QFUNCTION_NONE, &build_oper);
214*66087c08SValeria Barra   CeedOperatorSetField(build_oper, "dx", mesh_restr, CEED_NOTRANSPOSE,
215*66087c08SValeria Barra                        mesh_basis,CEED_VECTOR_ACTIVE);
216*66087c08SValeria Barra   CeedOperatorSetField(build_oper, "weights", mesh_restr_i, CEED_NOTRANSPOSE,
217*66087c08SValeria Barra                        mesh_basis, CEED_VECTOR_NONE);
218*66087c08SValeria Barra   CeedOperatorSetField(build_oper, "qdata", qdata_restr_i, CEED_NOTRANSPOSE,
219*66087c08SValeria Barra                        CEED_BASIS_COLLOCATED, CEED_VECTOR_ACTIVE);
220*66087c08SValeria Barra 
221*66087c08SValeria Barra   // Compute the quadrature data for the diffusion operator.
222*66087c08SValeria Barra   CeedVector qdata;
223*66087c08SValeria Barra   CeedInt elem_qpts = CeedIntPow(num_qpts, dim);
224*66087c08SValeria Barra   CeedInt num_elem = 1;
225*66087c08SValeria Barra   for (int d = 0; d < dim; d++)
226*66087c08SValeria Barra     num_elem *= nxyz[d];
227*66087c08SValeria Barra   CeedVectorCreate(ceed, num_elem*elem_qpts*dim*(dim+1)/2, &qdata);
228*66087c08SValeria Barra   if (!test) {
229*66087c08SValeria Barra     printf("Computing the quadrature data for the diffusion operator ...");
230*66087c08SValeria Barra     fflush(stdout);
231*66087c08SValeria Barra   }
232*66087c08SValeria Barra   CeedOperatorApply(build_oper, mesh_coords, qdata,
233*66087c08SValeria Barra                     CEED_REQUEST_IMMEDIATE);
234*66087c08SValeria Barra   if (!test) {
235*66087c08SValeria Barra     printf(" done.\n");
236*66087c08SValeria Barra   }
237*66087c08SValeria Barra 
238*66087c08SValeria Barra   // Create the Q-function that defines the action of the diffusion operator.
239*66087c08SValeria Barra   CeedQFunction apply_qfunc;
240*66087c08SValeria Barra   switch (gallery) {
241*66087c08SValeria Barra   case 0:
242*66087c08SValeria Barra     // This creates the QFunction directly.
243*66087c08SValeria Barra     CeedQFunctionCreateInterior(ceed, 1, f_apply_diff,
244*66087c08SValeria Barra                                 f_apply_diff_loc, &apply_qfunc);
245*66087c08SValeria Barra     CeedQFunctionAddInput(apply_qfunc, "du", dim, CEED_EVAL_GRAD);
246*66087c08SValeria Barra     CeedQFunctionAddInput(apply_qfunc, "qdata", dim*(dim+1)/2, CEED_EVAL_NONE);
247*66087c08SValeria Barra     CeedQFunctionAddOutput(apply_qfunc, "dv", dim, CEED_EVAL_GRAD);
248*66087c08SValeria Barra     CeedQFunctionSetContext(apply_qfunc, &build_ctx, sizeof(build_ctx));
249*66087c08SValeria Barra     break;
250*66087c08SValeria Barra   case 1: {
251*66087c08SValeria Barra     // This creates the QFunction via the gallery.
252*66087c08SValeria Barra     char name[16] = "";
253*66087c08SValeria Barra     snprintf(name, sizeof name, "Poisson%dDApply", dim);
254*66087c08SValeria Barra     CeedQFunctionCreateInteriorByName(ceed, name, &apply_qfunc);
255*66087c08SValeria Barra     break;
256*66087c08SValeria Barra   }
257*66087c08SValeria Barra   }
258*66087c08SValeria Barra 
259*66087c08SValeria Barra   // Create the diffusion operator.
260*66087c08SValeria Barra   CeedOperator oper;
261*66087c08SValeria Barra   CeedOperatorCreate(ceed, apply_qfunc, CEED_QFUNCTION_NONE,
262*66087c08SValeria Barra                      CEED_QFUNCTION_NONE, &oper);
263*66087c08SValeria Barra   CeedOperatorSetField(oper, "du", sol_restr, CEED_NOTRANSPOSE,
264*66087c08SValeria Barra                        sol_basis, CEED_VECTOR_ACTIVE);
265*66087c08SValeria Barra   CeedOperatorSetField(oper, "qdata", qdata_restr_i, CEED_NOTRANSPOSE,
266*66087c08SValeria Barra                        CEED_BASIS_COLLOCATED, qdata);
267*66087c08SValeria Barra   CeedOperatorSetField(oper, "dv", sol_restr, CEED_NOTRANSPOSE,
268*66087c08SValeria Barra                        sol_basis, CEED_VECTOR_ACTIVE);
269*66087c08SValeria Barra 
270*66087c08SValeria Barra   // Compute the mesh surface area using the diff operator:
271*66087c08SValeria Barra   //                                             sa = 1^T \cdot abs( K \cdot x).
272*66087c08SValeria Barra   if (!test) {
273*66087c08SValeria Barra     printf("Computing the mesh surface area using the formula: sa = 1^T.|K.x| ...");
274*66087c08SValeria Barra     fflush(stdout);
275*66087c08SValeria Barra   }
276*66087c08SValeria Barra 
277*66087c08SValeria Barra   // Create auxiliary solution-size vectors.
278*66087c08SValeria Barra   CeedVector u, v;
279*66087c08SValeria Barra   CeedVectorCreate(ceed, sol_size, &u);
280*66087c08SValeria Barra   CeedVectorCreate(ceed, sol_size, &v);
281*66087c08SValeria Barra 
282*66087c08SValeria Barra   // Initialize 'u' with sum of coordinates, x+y+z.
283*66087c08SValeria Barra   CeedScalar *u_host;
284*66087c08SValeria Barra   const CeedScalar *x_host;
285*66087c08SValeria Barra   CeedVectorGetArray(u, CEED_MEM_HOST, &u_host);
286*66087c08SValeria Barra   CeedVectorGetArrayRead(mesh_coords, CEED_MEM_HOST, &x_host);
287*66087c08SValeria Barra   for (CeedInt i = 0; i < sol_size; i++) {
288*66087c08SValeria Barra     u_host[i] = 0;
289*66087c08SValeria Barra     for (CeedInt d = 0; d < dim; d++)
290*66087c08SValeria Barra       u_host[i] += x_host[i+d*sol_size];
291*66087c08SValeria Barra   }
292*66087c08SValeria Barra   CeedVectorRestoreArray(u, &u_host);
293*66087c08SValeria Barra   CeedVectorRestoreArrayRead(mesh_coords, &x_host);
294*66087c08SValeria Barra 
295*66087c08SValeria Barra   // Apply the diffusion operator: 'u' -> 'v'.
296*66087c08SValeria Barra   CeedOperatorApply(oper, u, v, CEED_REQUEST_IMMEDIATE);
297*66087c08SValeria Barra 
298*66087c08SValeria Barra   // Compute and print the sum of the entries of 'v' giving the mesh surface area.
299*66087c08SValeria Barra   const CeedScalar *v_host;
300*66087c08SValeria Barra   CeedVectorGetArrayRead(v, CEED_MEM_HOST, &v_host);
301*66087c08SValeria Barra   CeedScalar sa = 0.;
302*66087c08SValeria Barra   for (CeedInt i = 0; i < sol_size; i++) {
303*66087c08SValeria Barra     sa += fabs(v_host[i]);
304*66087c08SValeria Barra   }
305*66087c08SValeria Barra   CeedVectorRestoreArrayRead(v, &v_host);
306*66087c08SValeria Barra   if (!test) {
307*66087c08SValeria Barra     printf(" done.\n");
308*66087c08SValeria Barra     printf("Exact mesh surface area    : % .14g\n", exact_sa);
309*66087c08SValeria Barra     printf("Computed mesh surface area : % .14g\n", sa);
310*66087c08SValeria Barra     printf("Surface area error         : % .14g\n", sa-exact_sa);
311*66087c08SValeria Barra   } else {
312*66087c08SValeria Barra     CeedScalar tol = (dim==1? 1E-12 : dim==2? 1E-1 : 1E-1);
313*66087c08SValeria Barra     if (fabs(sa-exact_sa)>tol)
314*66087c08SValeria Barra       printf("Surface area error         : % .14g\n", sa-exact_sa);
315*66087c08SValeria Barra   }
316*66087c08SValeria Barra 
317*66087c08SValeria Barra   // Free dynamically allocated memory.
318*66087c08SValeria Barra   CeedVectorDestroy(&u);
319*66087c08SValeria Barra   CeedVectorDestroy(&v);
320*66087c08SValeria Barra   CeedVectorDestroy(&qdata);
321*66087c08SValeria Barra   CeedVectorDestroy(&mesh_coords);
322*66087c08SValeria Barra   CeedOperatorDestroy(&oper);
323*66087c08SValeria Barra   CeedQFunctionDestroy(&apply_qfunc);
324*66087c08SValeria Barra   CeedOperatorDestroy(&build_oper);
325*66087c08SValeria Barra   CeedQFunctionDestroy(&build_qfunc);
326*66087c08SValeria Barra   CeedElemRestrictionDestroy(&sol_restr);
327*66087c08SValeria Barra   CeedElemRestrictionDestroy(&mesh_restr);
328*66087c08SValeria Barra   CeedElemRestrictionDestroy(&sol_restr_i);
329*66087c08SValeria Barra   CeedElemRestrictionDestroy(&mesh_restr_i);
330*66087c08SValeria Barra   CeedElemRestrictionDestroy(&qdata_restr_i);
331*66087c08SValeria Barra   CeedBasisDestroy(&sol_basis);
332*66087c08SValeria Barra   CeedBasisDestroy(&mesh_basis);
333*66087c08SValeria Barra   CeedDestroy(&ceed);
334*66087c08SValeria Barra   return 0;
335*66087c08SValeria Barra }
336*66087c08SValeria Barra 
337*66087c08SValeria Barra 
// Choose the number of elements in each direction of a Cartesian mesh.
//
// Uses the approximate formula
//    prob_size ~ num_elem * order^dim
// and rounds num_elem down to a power of two, 2^s, which is then split as
// evenly as possible between the dim directions (the first s%dim directions
// receive the extra factor of two).
//
//   dim        mesh dimension, must be 1, 2 or 3
//   order      polynomial order, must be >= 1
//   prob_size  approximate problem size; values too small for one element
//              yield a single element
//   nxyz       output: elements per direction in nxyz[0..dim-1]; the remaining
//              entries are set to 1
//
// Returns 0 on success, 1 if an argument is invalid (nxyz is then all ones
// unless it is NULL).
int GetCartesianMeshSize(int dim, int order, int prob_size, int nxyz[3]) {
  if (!nxyz) return 1;
  nxyz[0] = nxyz[1] = nxyz[2] = 1;
  // dim indexes the 3-entry array and is used as a divisor; order is a divisor.
  if (dim < 1 || dim > 3 || order < 1) return 1;

  // num_elem = prob_size / order^dim, evaluated by repeated division:
  // truncating division by 'order' dim times gives the same quotient as
  // dividing by order^dim, without ever forming a power that could overflow.
  int num_elem = prob_size;
  for (int d = 0; d < dim; d++) {
    num_elem /= order;
  }

  int s = 0;  // find s: num_elem/2 < 2^s <= num_elem
  while (num_elem > 1) {
    num_elem /= 2;
    s++;
  }

  int r = s%dim;  // directions that get one extra factor of two
  for (int d = 0; d < dim; d++) {
    int sd = s/dim;
    if (r > 0) { sd++; r--; }
    nxyz[d] = 1 << sd;
  }
  return 0;
}
355*66087c08SValeria Barra 
356*66087c08SValeria Barra int BuildCartesianRestriction(Ceed ceed, int dim, int nxyz[3], int order,
357*66087c08SValeria Barra                               int ncomp, CeedInt *size, CeedInt num_qpts,
358*66087c08SValeria Barra                               CeedElemRestriction *restr,
359*66087c08SValeria Barra                               CeedElemRestriction *restr_i) {
360*66087c08SValeria Barra   CeedInt p = order, pp1 = p+1;
361*66087c08SValeria Barra   CeedInt nnodes = CeedIntPow(pp1, dim); // number of scal. nodes per element
362*66087c08SValeria Barra   CeedInt elem_qpts = CeedIntPow(num_qpts, dim); // number of qpts per element
363*66087c08SValeria Barra   CeedInt nd[3], num_elem = 1, scalar_size = 1;
364*66087c08SValeria Barra   for (int d = 0; d < dim; d++) {
365*66087c08SValeria Barra     num_elem *= nxyz[d];
366*66087c08SValeria Barra     nd[d] = nxyz[d]*p + 1;
367*66087c08SValeria Barra     scalar_size *= nd[d];
368*66087c08SValeria Barra   }
369*66087c08SValeria Barra   *size = scalar_size*ncomp;
370*66087c08SValeria Barra   // elem:         0             1                 n-1
371*66087c08SValeria Barra   //        |---*-...-*---|---*-...-*---|- ... -|--...--|
372*66087c08SValeria Barra   // nnodes:   0   1    p-1  p  p+1       2*p             n*p
373*66087c08SValeria Barra   CeedInt *el_nodes = malloc(sizeof(CeedInt)*num_elem*nnodes);
374*66087c08SValeria Barra   for (CeedInt e = 0; e < num_elem; e++) {
375*66087c08SValeria Barra     CeedInt exyz[3], re = e;
376*66087c08SValeria Barra     for (int d = 0; d < dim; d++) { exyz[d] = re%nxyz[d]; re /= nxyz[d]; }
377*66087c08SValeria Barra     CeedInt *loc_el_nodes = el_nodes + e*nnodes;
378*66087c08SValeria Barra     for (int lnodes = 0; lnodes < nnodes; lnodes++) {
379*66087c08SValeria Barra       CeedInt gnodes = 0, gnodes_stride = 1, rnodes = lnodes;
380*66087c08SValeria Barra       for (int d = 0; d < dim; d++) {
381*66087c08SValeria Barra         gnodes += (exyz[d]*p + rnodes%pp1) * gnodes_stride;
382*66087c08SValeria Barra         gnodes_stride *= nd[d];
383*66087c08SValeria Barra         rnodes /= pp1;
384*66087c08SValeria Barra       }
385*66087c08SValeria Barra       loc_el_nodes[lnodes] = gnodes;
386*66087c08SValeria Barra     }
387*66087c08SValeria Barra   }
388*66087c08SValeria Barra   if (restr)
389*66087c08SValeria Barra     CeedElemRestrictionCreate(ceed, num_elem, nnodes, scalar_size,
390*66087c08SValeria Barra                               ncomp, CEED_MEM_HOST,
391*66087c08SValeria Barra                               CEED_COPY_VALUES, el_nodes, restr);
392*66087c08SValeria Barra   if (restr_i)
393*66087c08SValeria Barra     CeedElemRestrictionCreateIdentity(ceed, num_elem, elem_qpts,
394*66087c08SValeria Barra                                       elem_qpts*num_elem,
395*66087c08SValeria Barra                                       ncomp, restr_i);
396*66087c08SValeria Barra   free(el_nodes);
397*66087c08SValeria Barra   return 0;
398*66087c08SValeria Barra }
399*66087c08SValeria Barra 
400*66087c08SValeria Barra int SetCartesianMeshCoords(int dim, int nxyz[3], int mesh_order,
401*66087c08SValeria Barra                            CeedVector mesh_coords) {
402*66087c08SValeria Barra   CeedInt p = mesh_order;
403*66087c08SValeria Barra   CeedInt nd[3], num_elem = 1, scalar_size = 1;
404*66087c08SValeria Barra   for (int d = 0; d < dim; d++) {
405*66087c08SValeria Barra     num_elem *= nxyz[d];
406*66087c08SValeria Barra     nd[d] = nxyz[d]*p + 1;
407*66087c08SValeria Barra     scalar_size *= nd[d];
408*66087c08SValeria Barra   }
409*66087c08SValeria Barra   CeedScalar *coords;
410*66087c08SValeria Barra   CeedVectorGetArray(mesh_coords, CEED_MEM_HOST, &coords);
411*66087c08SValeria Barra   CeedScalar *nodes = malloc(sizeof(CeedScalar)*(p+1));
412*66087c08SValeria Barra   // The H1 basis uses Lobatto quadrature points as nodes.
413*66087c08SValeria Barra   CeedLobattoQuadrature(p+1, nodes, NULL); // nodes are in [-1,1]
414*66087c08SValeria Barra   for (CeedInt i = 0; i <= p; i++) { nodes[i] = 0.5+0.5*nodes[i]; }
415*66087c08SValeria Barra   for (CeedInt gsnodes = 0; gsnodes < scalar_size; gsnodes++) {
416*66087c08SValeria Barra     CeedInt rnodes = gsnodes;
417*66087c08SValeria Barra     for (int d = 0; d < dim; d++) {
418*66087c08SValeria Barra       CeedInt d1d = rnodes%nd[d];
419*66087c08SValeria Barra       coords[gsnodes+scalar_size*d] = ((d1d/p)+nodes[d1d%p]) / nxyz[d];
420*66087c08SValeria Barra       rnodes /= nd[d];
421*66087c08SValeria Barra     }
422*66087c08SValeria Barra   }
423*66087c08SValeria Barra   free(nodes);
424*66087c08SValeria Barra   CeedVectorRestoreArray(mesh_coords, &coords);
425*66087c08SValeria Barra   return 0;
426*66087c08SValeria Barra }
427*66087c08SValeria Barra 
428*66087c08SValeria Barra #ifndef M_PI
429*66087c08SValeria Barra #define M_PI    3.14159265358979323846
430*66087c08SValeria Barra #define M_PI_2  1.57079632679489661923
431*66087c08SValeria Barra #endif
432*66087c08SValeria Barra 
433*66087c08SValeria Barra CeedScalar TransformMeshCoords(int dim, int mesh_size, CeedVector mesh_coords) {
434*66087c08SValeria Barra   CeedScalar exact_sa = (dim==1? 2 : dim==2? 4 : 6);
435*66087c08SValeria Barra   CeedScalar *coords;
436*66087c08SValeria Barra 
437*66087c08SValeria Barra   CeedVectorGetArray(mesh_coords, CEED_MEM_HOST, &coords);
438*66087c08SValeria Barra   for (CeedInt i = 0; i < mesh_size; i++) {
439*66087c08SValeria Barra     // map [0,1] to [0,1] varying the mesh density
440*66087c08SValeria Barra     coords[i] = 0.5+1./sqrt(3.)*sin((2./3.)*M_PI*(coords[i]-0.5));
441*66087c08SValeria Barra   }
442*66087c08SValeria Barra   CeedVectorRestoreArray(mesh_coords, &coords);
443*66087c08SValeria Barra 
444*66087c08SValeria Barra   return exact_sa;
445*66087c08SValeria Barra }
446