xref: /petsc/src/snes/tutorials/ex19.c (revision 48a46eb9bd028bec07ec0f396b1a3abb43f14558)
1c4762a1bSJed Brown 
/* Usage text passed to PetscInitialize() in main. */
static char help[] = "Nonlinear driven cavity with multigrid in 2d.\n \
  \n\
The 2D driven cavity problem is solved in a velocity-vorticity formulation.\n\
The flow can be driven with the lid or with buoyancy or both:\n\
  -lidvelocity &ltlid&gt, where &ltlid&gt = dimensionless velocity of lid\n\
  -grashof &ltgr&gt, where &ltgr&gt = dimensionless temperature gradient\n\
  -prandtl &ltpr&gt, where &ltpr&gt = dimensionless thermal/momentum diffusivity ratio\n\
 -contours : draw contour plots of solution\n\n";
10c4762a1bSJed Brown /* in HTML, '&lt' = '<' and '&gt' = '>' */
11c4762a1bSJed Brown 
12c4762a1bSJed Brown /*
13c4762a1bSJed Brown       See src/ksp/ksp/tutorials/ex45.c
14c4762a1bSJed Brown */
15c4762a1bSJed Brown 
16c4762a1bSJed Brown /*F-----------------------------------------------------------------------
17c4762a1bSJed Brown 
18c4762a1bSJed Brown     We thank David E. Keyes for contributing the driven cavity discretization within this example code.
19c4762a1bSJed Brown 
20c4762a1bSJed Brown     This problem is modeled by the partial differential equation system
21c4762a1bSJed Brown 
22c4762a1bSJed Brown \begin{eqnarray}
23c4762a1bSJed Brown         - \triangle U - \nabla_y \Omega & = & 0  \\
24c4762a1bSJed Brown         - \triangle V + \nabla_x\Omega & = & 0  \\
25c4762a1bSJed Brown         - \triangle \Omega + \nabla \cdot ([U*\Omega,V*\Omega]) - GR* \nabla_x T & = & 0  \\
26c4762a1bSJed Brown         - \triangle T + PR* \nabla \cdot ([U*T,V*T]) & = & 0
27c4762a1bSJed Brown \end{eqnarray}
28c4762a1bSJed Brown 
29c4762a1bSJed Brown     in the unit square, which is uniformly discretized in each of x and y in this simple encoding.
30c4762a1bSJed Brown 
31c4762a1bSJed Brown     No-slip, rigid-wall Dirichlet conditions are used for $ [U,V]$.
32c4762a1bSJed Brown     Dirichlet conditions are used for Omega, based on the definition of
33c4762a1bSJed Brown     vorticity: $ \Omega = - \nabla_y U + \nabla_x V$, where along each
34c4762a1bSJed Brown     constant coordinate boundary, the tangential derivative is zero.
35c4762a1bSJed Brown     Dirichlet conditions are used for T on the left and right walls,
36c4762a1bSJed Brown     and insulation homogeneous Neumann conditions are used for T on
37c4762a1bSJed Brown     the top and bottom walls.
38c4762a1bSJed Brown 
39c4762a1bSJed Brown     A finite difference approximation with the usual 5-point stencil
40c4762a1bSJed Brown     is used to discretize the boundary value problem to obtain a
41c4762a1bSJed Brown     nonlinear system of equations.  Upwinding is used for the divergence
42c4762a1bSJed Brown     (convective) terms and central for the gradient (source) terms.
43c4762a1bSJed Brown 
44c4762a1bSJed Brown     The Jacobian can be either
45c4762a1bSJed Brown       * formed via finite differencing using coloring (the default), or
46c4762a1bSJed Brown       * applied matrix-free via the option -snes_mf
47c4762a1bSJed Brown         (for larger grid problems this variant may not converge
48c4762a1bSJed Brown         without a preconditioner due to ill-conditioning).
49c4762a1bSJed Brown 
50c4762a1bSJed Brown   ------------------------------------------------------------------------F*/
51c4762a1bSJed Brown 
52c4762a1bSJed Brown /*
53c4762a1bSJed Brown    Include "petscdmda.h" so that we can use distributed arrays (DMDAs).
54c4762a1bSJed Brown    Include "petscsnes.h" so that we can use SNES solvers.  Note that this
55c4762a1bSJed Brown    file automatically includes:
56c4762a1bSJed Brown      petscsys.h       - base PETSc routines   petscvec.h - vectors
57c4762a1bSJed Brown      petscmat.h - matrices
58c4762a1bSJed Brown      petscis.h     - index sets            petscksp.h - Krylov subspace methods
59c4762a1bSJed Brown      petscviewer.h - viewers               petscpc.h  - preconditioners
60c4762a1bSJed Brown      petscksp.h   - linear solvers
61c4762a1bSJed Brown */
62c4762a1bSJed Brown #if defined(PETSC_APPLE_FRAMEWORK)
63c4762a1bSJed Brown #import <PETSc/petscsnes.h>
64c4762a1bSJed Brown #import <PETSc/petscdmda.h>
65c4762a1bSJed Brown #else
66c4762a1bSJed Brown #include <petscsnes.h>
67c4762a1bSJed Brown #include <petscdm.h>
68c4762a1bSJed Brown #include <petscdmda.h>
69c4762a1bSJed Brown #endif
70c4762a1bSJed Brown 
71c4762a1bSJed Brown /*
72c4762a1bSJed Brown    User-defined routines and data structures
73c4762a1bSJed Brown */
74c4762a1bSJed Brown typedef struct {
75c4762a1bSJed Brown   PetscScalar u, v, omega, temp;
76c4762a1bSJed Brown } Field;
77c4762a1bSJed Brown 
78c4762a1bSJed Brown PetscErrorCode FormFunctionLocal(DMDALocalInfo *, Field **, Field **, void *);
79c4762a1bSJed Brown 
80c4762a1bSJed Brown typedef struct {
81c4762a1bSJed Brown   PetscReal lidvelocity, prandtl, grashof; /* physical parameters */
82c4762a1bSJed Brown   PetscBool draw_contours;                 /* flag - 1 indicates drawing contours */
83c4762a1bSJed Brown } AppCtx;
84c4762a1bSJed Brown 
85c4762a1bSJed Brown extern PetscErrorCode FormInitialGuess(AppCtx *, DM, Vec);
86c4762a1bSJed Brown extern PetscErrorCode NonlinearGS(SNES, Vec, Vec, void *);
87c4762a1bSJed Brown 
889371c9d4SSatish Balay int main(int argc, char **argv) {
89c4762a1bSJed Brown   AppCtx   user; /* user-defined work context */
90c4762a1bSJed Brown   PetscInt mx, my, its;
91c4762a1bSJed Brown   MPI_Comm comm;
92c4762a1bSJed Brown   SNES     snes;
93c4762a1bSJed Brown   DM       da;
94c4762a1bSJed Brown   Vec      x;
95c4762a1bSJed Brown 
96327415f7SBarry Smith   PetscFunctionBeginUser;
979566063dSJacob Faibussowitsch   PetscCall(PetscInitialize(&argc, &argv, (char *)0, help));
98c4762a1bSJed Brown   comm = PETSC_COMM_WORLD;
999566063dSJacob Faibussowitsch   PetscCall(SNESCreate(comm, &snes));
100c4762a1bSJed Brown 
101c4762a1bSJed Brown   /*
102c4762a1bSJed Brown       Create distributed array object to manage parallel grid and vectors
103c4762a1bSJed Brown       for principal unknowns (x) and governing residuals (f)
104c4762a1bSJed Brown   */
1059566063dSJacob Faibussowitsch   PetscCall(DMDACreate2d(PETSC_COMM_WORLD, DM_BOUNDARY_NONE, DM_BOUNDARY_NONE, DMDA_STENCIL_STAR, 4, 4, PETSC_DECIDE, PETSC_DECIDE, 4, 1, 0, 0, &da));
1069566063dSJacob Faibussowitsch   PetscCall(DMSetFromOptions(da));
1079566063dSJacob Faibussowitsch   PetscCall(DMSetUp(da));
1089566063dSJacob Faibussowitsch   PetscCall(SNESSetDM(snes, (DM)da));
1099566063dSJacob Faibussowitsch   PetscCall(SNESSetNGS(snes, NonlinearGS, (void *)&user));
110c4762a1bSJed Brown 
1119566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(da, 0, &mx, &my, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE, PETSC_IGNORE));
112c4762a1bSJed Brown   /*
113c4762a1bSJed Brown      Problem parameters (velocity of lid, prandtl, and grashof numbers)
114c4762a1bSJed Brown   */
115c4762a1bSJed Brown   user.lidvelocity = 1.0 / (mx * my);
116c4762a1bSJed Brown   user.prandtl     = 1.0;
117c4762a1bSJed Brown   user.grashof     = 1.0;
118c4762a1bSJed Brown 
1199566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetReal(NULL, NULL, "-lidvelocity", &user.lidvelocity, NULL));
1209566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetReal(NULL, NULL, "-prandtl", &user.prandtl, NULL));
1219566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetReal(NULL, NULL, "-grashof", &user.grashof, NULL));
1229566063dSJacob Faibussowitsch   PetscCall(PetscOptionsHasName(NULL, NULL, "-contours", &user.draw_contours));
123c4762a1bSJed Brown 
1249566063dSJacob Faibussowitsch   PetscCall(DMDASetFieldName(da, 0, "x_velocity"));
1259566063dSJacob Faibussowitsch   PetscCall(DMDASetFieldName(da, 1, "y_velocity"));
1269566063dSJacob Faibussowitsch   PetscCall(DMDASetFieldName(da, 2, "Omega"));
1279566063dSJacob Faibussowitsch   PetscCall(DMDASetFieldName(da, 3, "temperature"));
128c4762a1bSJed Brown 
129c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
130c4762a1bSJed Brown      Create user context, set problem data, create vector data structures.
131c4762a1bSJed Brown      Also, compute the initial guess.
132c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
133c4762a1bSJed Brown 
134c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
135c4762a1bSJed Brown      Create nonlinear solver context
136c4762a1bSJed Brown 
137c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1389566063dSJacob Faibussowitsch   PetscCall(DMSetApplicationContext(da, &user));
1399566063dSJacob Faibussowitsch   PetscCall(DMDASNESSetFunctionLocal(da, INSERT_VALUES, (PetscErrorCode(*)(DMDALocalInfo *, void *, void *, void *))FormFunctionLocal, &user));
1409566063dSJacob Faibussowitsch   PetscCall(SNESSetFromOptions(snes));
1419566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(comm, "lid velocity = %g, prandtl # = %g, grashof # = %g\n", (double)user.lidvelocity, (double)user.prandtl, (double)user.grashof));
142c4762a1bSJed Brown 
143c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
144c4762a1bSJed Brown      Solve the nonlinear system
145660278c0SBarry Smith      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1469566063dSJacob Faibussowitsch   PetscCall(DMCreateGlobalVector(da, &x));
1479566063dSJacob Faibussowitsch   PetscCall(FormInitialGuess(&user, da, x));
148c4762a1bSJed Brown 
1499566063dSJacob Faibussowitsch   PetscCall(SNESSolve(snes, NULL, x));
150c4762a1bSJed Brown 
1519566063dSJacob Faibussowitsch   PetscCall(SNESGetIterationNumber(snes, &its));
15263a3b9bcSJacob Faibussowitsch   PetscCall(PetscPrintf(comm, "Number of SNES iterations = %" PetscInt_FMT "\n", its));
153c4762a1bSJed Brown 
154c4762a1bSJed Brown   /*
155c4762a1bSJed Brown      Visualize solution
156c4762a1bSJed Brown   */
1571baa6e33SBarry Smith   if (user.draw_contours) PetscCall(VecView(x, PETSC_VIEWER_DRAW_WORLD));
158c4762a1bSJed Brown 
159c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
160c4762a1bSJed Brown      Free work space.  All PETSc objects should be destroyed when they
161c4762a1bSJed Brown      are no longer needed.
162c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1639566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&x));
1649566063dSJacob Faibussowitsch   PetscCall(DMDestroy(&da));
1659566063dSJacob Faibussowitsch   PetscCall(SNESDestroy(&snes));
1669566063dSJacob Faibussowitsch   PetscCall(PetscFinalize());
167b122ec5aSJacob Faibussowitsch   return 0;
168c4762a1bSJed Brown }
169c4762a1bSJed Brown 
170c4762a1bSJed Brown /* ------------------------------------------------------------------- */
171c4762a1bSJed Brown 
172c4762a1bSJed Brown /*
173c4762a1bSJed Brown    FormInitialGuess - Forms initial approximation.
174c4762a1bSJed Brown 
175c4762a1bSJed Brown    Input Parameters:
176c4762a1bSJed Brown    user - user-defined application context
177c4762a1bSJed Brown    X - vector
178c4762a1bSJed Brown 
179c4762a1bSJed Brown    Output Parameter:
180c4762a1bSJed Brown    X - vector
181c4762a1bSJed Brown */
1829371c9d4SSatish Balay PetscErrorCode FormInitialGuess(AppCtx *user, DM da, Vec X) {
183c4762a1bSJed Brown   PetscInt  i, j, mx, xs, ys, xm, ym;
184c4762a1bSJed Brown   PetscReal grashof, dx;
185c4762a1bSJed Brown   Field   **x;
186c4762a1bSJed Brown 
187c4762a1bSJed Brown   PetscFunctionBeginUser;
188c4762a1bSJed Brown   grashof = user->grashof;
189c4762a1bSJed Brown 
1909566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(da, 0, &mx, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0));
191c4762a1bSJed Brown   dx = 1.0 / (mx - 1);
192c4762a1bSJed Brown 
193c4762a1bSJed Brown   /*
194c4762a1bSJed Brown      Get local grid boundaries (for 2-dimensional DMDA):
195c4762a1bSJed Brown        xs, ys   - starting grid indices (no ghost points)
196c4762a1bSJed Brown        xm, ym   - widths of local grid (no ghost points)
197c4762a1bSJed Brown   */
1989566063dSJacob Faibussowitsch   PetscCall(DMDAGetCorners(da, &xs, &ys, NULL, &xm, &ym, NULL));
199c4762a1bSJed Brown 
200c4762a1bSJed Brown   /*
201c4762a1bSJed Brown      Get a pointer to vector data.
202c4762a1bSJed Brown        - For default PETSc vectors, VecGetArray() returns a pointer to
203c4762a1bSJed Brown          the data array.  Otherwise, the routine is implementation dependent.
204c4762a1bSJed Brown        - You MUST call VecRestoreArray() when you no longer need access to
205c4762a1bSJed Brown          the array.
206c4762a1bSJed Brown   */
2079566063dSJacob Faibussowitsch   PetscCall(DMDAVecGetArrayWrite(da, X, &x));
208c4762a1bSJed Brown 
209c4762a1bSJed Brown   /*
210c4762a1bSJed Brown      Compute initial guess over the locally owned part of the grid
211c4762a1bSJed Brown      Initial condition is motionless fluid and equilibrium temperature
212c4762a1bSJed Brown   */
213c4762a1bSJed Brown   for (j = ys; j < ys + ym; j++) {
214c4762a1bSJed Brown     for (i = xs; i < xs + xm; i++) {
215c4762a1bSJed Brown       x[j][i].u     = 0.0;
216c4762a1bSJed Brown       x[j][i].v     = 0.0;
217c4762a1bSJed Brown       x[j][i].omega = 0.0;
218c4762a1bSJed Brown       x[j][i].temp  = (grashof > 0) * i * dx;
219c4762a1bSJed Brown     }
220c4762a1bSJed Brown   }
221c4762a1bSJed Brown 
222c4762a1bSJed Brown   /*
223c4762a1bSJed Brown      Restore vector
224c4762a1bSJed Brown   */
2259566063dSJacob Faibussowitsch   PetscCall(DMDAVecRestoreArrayWrite(da, X, &x));
226c4762a1bSJed Brown   PetscFunctionReturn(0);
227c4762a1bSJed Brown }
228c4762a1bSJed Brown 
2299371c9d4SSatish Balay PetscErrorCode FormFunctionLocal(DMDALocalInfo *info, Field **x, Field **f, void *ptr) {
230c4762a1bSJed Brown   AppCtx     *user = (AppCtx *)ptr;
231c4762a1bSJed Brown   PetscInt    xints, xinte, yints, yinte, i, j;
232c4762a1bSJed Brown   PetscReal   hx, hy, dhx, dhy, hxdhy, hydhx;
233c4762a1bSJed Brown   PetscReal   grashof, prandtl, lid;
234c4762a1bSJed Brown   PetscScalar u, uxx, uyy, vx, vy, avx, avy, vxp, vxm, vyp, vym;
235c4762a1bSJed Brown 
236c4762a1bSJed Brown   PetscFunctionBeginUser;
237c4762a1bSJed Brown   grashof = user->grashof;
238c4762a1bSJed Brown   prandtl = user->prandtl;
239c4762a1bSJed Brown   lid     = user->lidvelocity;
240c4762a1bSJed Brown 
241c4762a1bSJed Brown   /*
242c4762a1bSJed Brown      Define mesh intervals ratios for uniform grid.
243c4762a1bSJed Brown 
244c4762a1bSJed Brown      Note: FD formulae below are normalized by multiplying through by
245c4762a1bSJed Brown      local volume element (i.e. hx*hy) to obtain coefficients O(1) in two dimensions.
246c4762a1bSJed Brown 
247c4762a1bSJed Brown   */
2489371c9d4SSatish Balay   dhx   = (PetscReal)(info->mx - 1);
2499371c9d4SSatish Balay   dhy   = (PetscReal)(info->my - 1);
2509371c9d4SSatish Balay   hx    = 1.0 / dhx;
2519371c9d4SSatish Balay   hy    = 1.0 / dhy;
2529371c9d4SSatish Balay   hxdhy = hx * dhy;
2539371c9d4SSatish Balay   hydhx = hy * dhx;
254c4762a1bSJed Brown 
2559371c9d4SSatish Balay   xints = info->xs;
2569371c9d4SSatish Balay   xinte = info->xs + info->xm;
2579371c9d4SSatish Balay   yints = info->ys;
2589371c9d4SSatish Balay   yinte = info->ys + info->ym;
259c4762a1bSJed Brown 
260c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
261c4762a1bSJed Brown   if (yints == 0) {
262c4762a1bSJed Brown     j     = 0;
263c4762a1bSJed Brown     yints = yints + 1;
264c4762a1bSJed Brown     /* bottom edge */
265c4762a1bSJed Brown     for (i = info->xs; i < info->xs + info->xm; i++) {
266c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
267c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
268c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j + 1][i].u - x[j][i].u) * dhy;
269c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp - x[j + 1][i].temp;
270c4762a1bSJed Brown     }
271c4762a1bSJed Brown   }
272c4762a1bSJed Brown 
273c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
274c4762a1bSJed Brown   if (yinte == info->my) {
275c4762a1bSJed Brown     j     = info->my - 1;
276c4762a1bSJed Brown     yinte = yinte - 1;
277c4762a1bSJed Brown     /* top edge */
278c4762a1bSJed Brown     for (i = info->xs; i < info->xs + info->xm; i++) {
279c4762a1bSJed Brown       f[j][i].u     = x[j][i].u - lid;
280c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
281c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j][i].u - x[j - 1][i].u) * dhy;
282c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp - x[j - 1][i].temp;
283c4762a1bSJed Brown     }
284c4762a1bSJed Brown   }
285c4762a1bSJed Brown 
286c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
287c4762a1bSJed Brown   if (xints == 0) {
288c4762a1bSJed Brown     i     = 0;
289c4762a1bSJed Brown     xints = xints + 1;
290c4762a1bSJed Brown     /* left edge */
291c4762a1bSJed Brown     for (j = info->ys; j < info->ys + info->ym; j++) {
292c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
293c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
294c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i + 1].v - x[j][i].v) * dhx;
295c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp;
296c4762a1bSJed Brown     }
297c4762a1bSJed Brown   }
298c4762a1bSJed Brown 
299c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
300c4762a1bSJed Brown   if (xinte == info->mx) {
301c4762a1bSJed Brown     i     = info->mx - 1;
302c4762a1bSJed Brown     xinte = xinte - 1;
303c4762a1bSJed Brown     /* right edge */
304c4762a1bSJed Brown     for (j = info->ys; j < info->ys + info->ym; j++) {
305c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
306c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
307c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i].v - x[j][i - 1].v) * dhx;
308c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp - (PetscReal)(grashof > 0);
309c4762a1bSJed Brown     }
310c4762a1bSJed Brown   }
311c4762a1bSJed Brown 
312c4762a1bSJed Brown   /* Compute over the interior points */
313c4762a1bSJed Brown   for (j = yints; j < yinte; j++) {
314c4762a1bSJed Brown     for (i = xints; i < xinte; i++) {
315c4762a1bSJed Brown       /*
316c4762a1bSJed Brown        convective coefficients for upwinding
317c4762a1bSJed Brown       */
3189371c9d4SSatish Balay       vx  = x[j][i].u;
3199371c9d4SSatish Balay       avx = PetscAbsScalar(vx);
3209371c9d4SSatish Balay       vxp = .5 * (vx + avx);
3219371c9d4SSatish Balay       vxm = .5 * (vx - avx);
3229371c9d4SSatish Balay       vy  = x[j][i].v;
3239371c9d4SSatish Balay       avy = PetscAbsScalar(vy);
3249371c9d4SSatish Balay       vyp = .5 * (vy + avy);
3259371c9d4SSatish Balay       vym = .5 * (vy - avy);
326c4762a1bSJed Brown 
327c4762a1bSJed Brown       /* U velocity */
328c4762a1bSJed Brown       u         = x[j][i].u;
329c4762a1bSJed Brown       uxx       = (2.0 * u - x[j][i - 1].u - x[j][i + 1].u) * hydhx;
330c4762a1bSJed Brown       uyy       = (2.0 * u - x[j - 1][i].u - x[j + 1][i].u) * hxdhy;
331c4762a1bSJed Brown       f[j][i].u = uxx + uyy - .5 * (x[j + 1][i].omega - x[j - 1][i].omega) * hx;
332c4762a1bSJed Brown 
333c4762a1bSJed Brown       /* V velocity */
334c4762a1bSJed Brown       u         = x[j][i].v;
335c4762a1bSJed Brown       uxx       = (2.0 * u - x[j][i - 1].v - x[j][i + 1].v) * hydhx;
336c4762a1bSJed Brown       uyy       = (2.0 * u - x[j - 1][i].v - x[j + 1][i].v) * hxdhy;
337c4762a1bSJed Brown       f[j][i].v = uxx + uyy + .5 * (x[j][i + 1].omega - x[j][i - 1].omega) * hy;
338c4762a1bSJed Brown 
339c4762a1bSJed Brown       /* Omega */
340c4762a1bSJed Brown       u             = x[j][i].omega;
341c4762a1bSJed Brown       uxx           = (2.0 * u - x[j][i - 1].omega - x[j][i + 1].omega) * hydhx;
342c4762a1bSJed Brown       uyy           = (2.0 * u - x[j - 1][i].omega - x[j + 1][i].omega) * hxdhy;
3439371c9d4SSatish Balay       f[j][i].omega = uxx + uyy + (vxp * (u - x[j][i - 1].omega) + vxm * (x[j][i + 1].omega - u)) * hy + (vyp * (u - x[j - 1][i].omega) + vym * (x[j + 1][i].omega - u)) * hx - .5 * grashof * (x[j][i + 1].temp - x[j][i - 1].temp) * hy;
344c4762a1bSJed Brown 
345c4762a1bSJed Brown       /* Temperature */
346c4762a1bSJed Brown       u            = x[j][i].temp;
347c4762a1bSJed Brown       uxx          = (2.0 * u - x[j][i - 1].temp - x[j][i + 1].temp) * hydhx;
348c4762a1bSJed Brown       uyy          = (2.0 * u - x[j - 1][i].temp - x[j + 1][i].temp) * hxdhy;
3499371c9d4SSatish Balay       f[j][i].temp = uxx + uyy + prandtl * ((vxp * (u - x[j][i - 1].temp) + vxm * (x[j][i + 1].temp - u)) * hy + (vyp * (u - x[j - 1][i].temp) + vym * (x[j + 1][i].temp - u)) * hx);
350c4762a1bSJed Brown     }
351c4762a1bSJed Brown   }
352c4762a1bSJed Brown 
353c4762a1bSJed Brown   /*
354c4762a1bSJed Brown      Flop count (multiply-adds are counted as 2 operations)
355c4762a1bSJed Brown   */
3569566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(84.0 * info->ym * info->xm));
357c4762a1bSJed Brown   PetscFunctionReturn(0);
358c4762a1bSJed Brown }
359c4762a1bSJed Brown 
360c4762a1bSJed Brown /*
361c4762a1bSJed Brown     Performs sweeps of point block nonlinear Gauss-Seidel on all the local grid points
362c4762a1bSJed Brown */
3639371c9d4SSatish Balay PetscErrorCode NonlinearGS(SNES snes, Vec X, Vec B, void *ctx) {
364c4762a1bSJed Brown   DMDALocalInfo info;
365c4762a1bSJed Brown   Field       **x, **b;
366c4762a1bSJed Brown   Vec           localX, localB;
367c4762a1bSJed Brown   DM            da;
368c4762a1bSJed Brown   PetscInt      xints, xinte, yints, yinte, i, j, k, l;
369c4762a1bSJed Brown   PetscInt      max_its, tot_its;
370c4762a1bSJed Brown   PetscInt      sweeps;
371c4762a1bSJed Brown   PetscReal     rtol, atol, stol;
372c4762a1bSJed Brown   PetscReal     hx, hy, dhx, dhy, hxdhy, hydhx;
373c4762a1bSJed Brown   PetscReal     grashof, prandtl, lid;
374c4762a1bSJed Brown   PetscScalar   u, uxx, uyy, vx, vy, avx, avy, vxp, vxm, vyp, vym;
375c4762a1bSJed Brown   PetscScalar   fu, fv, fomega, ftemp;
376c4762a1bSJed Brown   PetscScalar   dfudu;
377c4762a1bSJed Brown   PetscScalar   dfvdv;
378c4762a1bSJed Brown   PetscScalar   dfodu, dfodv, dfodo;
379c4762a1bSJed Brown   PetscScalar   dftdu, dftdv, dftdt;
380c4762a1bSJed Brown   PetscScalar   yu = 0, yv = 0, yo = 0, yt = 0;
381c4762a1bSJed Brown   PetscScalar   bjiu, bjiv, bjiomega, bjitemp;
382c4762a1bSJed Brown   PetscBool     ptconverged;
383c4762a1bSJed Brown   PetscReal     pfnorm, pfnorm0, pynorm, pxnorm;
384c4762a1bSJed Brown   AppCtx       *user = (AppCtx *)ctx;
385c4762a1bSJed Brown 
386c4762a1bSJed Brown   PetscFunctionBeginUser;
387c4762a1bSJed Brown   grashof = user->grashof;
388c4762a1bSJed Brown   prandtl = user->prandtl;
389c4762a1bSJed Brown   lid     = user->lidvelocity;
390c4762a1bSJed Brown   tot_its = 0;
3919566063dSJacob Faibussowitsch   PetscCall(SNESNGSGetTolerances(snes, &rtol, &atol, &stol, &max_its));
3929566063dSJacob Faibussowitsch   PetscCall(SNESNGSGetSweeps(snes, &sweeps));
3939566063dSJacob Faibussowitsch   PetscCall(SNESGetDM(snes, (DM *)&da));
3949566063dSJacob Faibussowitsch   PetscCall(DMGetLocalVector(da, &localX));
395*48a46eb9SPierre Jolivet   if (B) PetscCall(DMGetLocalVector(da, &localB));
396c4762a1bSJed Brown   /*
397c4762a1bSJed Brown      Scatter ghost points to local vector, using the 2-step process
398c4762a1bSJed Brown         DMGlobalToLocalBegin(), DMGlobalToLocalEnd().
399c4762a1bSJed Brown   */
4009566063dSJacob Faibussowitsch   PetscCall(DMGlobalToLocalBegin(da, X, INSERT_VALUES, localX));
4019566063dSJacob Faibussowitsch   PetscCall(DMGlobalToLocalEnd(da, X, INSERT_VALUES, localX));
402c4762a1bSJed Brown   if (B) {
4039566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalBegin(da, B, INSERT_VALUES, localB));
4049566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalEnd(da, B, INSERT_VALUES, localB));
405c4762a1bSJed Brown   }
4069566063dSJacob Faibussowitsch   PetscCall(DMDAGetLocalInfo(da, &info));
4079566063dSJacob Faibussowitsch   PetscCall(DMDAVecGetArrayWrite(da, localX, &x));
408*48a46eb9SPierre Jolivet   if (B) PetscCall(DMDAVecGetArrayRead(da, localB, &b));
409c4762a1bSJed Brown   /* looks like a combination of the formfunction / formjacobian routines */
4109371c9d4SSatish Balay   dhx   = (PetscReal)(info.mx - 1);
4119371c9d4SSatish Balay   dhy   = (PetscReal)(info.my - 1);
4129371c9d4SSatish Balay   hx    = 1.0 / dhx;
4139371c9d4SSatish Balay   hy    = 1.0 / dhy;
4149371c9d4SSatish Balay   hxdhy = hx * dhy;
4159371c9d4SSatish Balay   hydhx = hy * dhx;
416c4762a1bSJed Brown 
4179371c9d4SSatish Balay   xints = info.xs;
4189371c9d4SSatish Balay   xinte = info.xs + info.xm;
4199371c9d4SSatish Balay   yints = info.ys;
4209371c9d4SSatish Balay   yinte = info.ys + info.ym;
421c4762a1bSJed Brown 
422c4762a1bSJed Brown   /* Set the boundary conditions on the momentum equations */
423c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
424c4762a1bSJed Brown   if (yints == 0) {
425c4762a1bSJed Brown     j = 0;
426c4762a1bSJed Brown     /* bottom edge */
427c4762a1bSJed Brown     for (i = info.xs; i < info.xs + info.xm; i++) {
428c4762a1bSJed Brown       if (B) {
429c4762a1bSJed Brown         bjiu = b[j][i].u;
430c4762a1bSJed Brown         bjiv = b[j][i].v;
431c4762a1bSJed Brown       } else {
432c4762a1bSJed Brown         bjiu = 0.0;
433c4762a1bSJed Brown         bjiv = 0.0;
434c4762a1bSJed Brown       }
435c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
436c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
437c4762a1bSJed Brown     }
438c4762a1bSJed Brown   }
439c4762a1bSJed Brown 
440c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
441c4762a1bSJed Brown   if (yinte == info.my) {
442c4762a1bSJed Brown     j = info.my - 1;
443c4762a1bSJed Brown     /* top edge */
444c4762a1bSJed Brown     for (i = info.xs; i < info.xs + info.xm; i++) {
445c4762a1bSJed Brown       if (B) {
446c4762a1bSJed Brown         bjiu = b[j][i].u;
447c4762a1bSJed Brown         bjiv = b[j][i].v;
448c4762a1bSJed Brown       } else {
449c4762a1bSJed Brown         bjiu = 0.0;
450c4762a1bSJed Brown         bjiv = 0.0;
451c4762a1bSJed Brown       }
452c4762a1bSJed Brown       x[j][i].u = lid + bjiu;
453c4762a1bSJed Brown       x[j][i].v = bjiv;
454c4762a1bSJed Brown     }
455c4762a1bSJed Brown   }
456c4762a1bSJed Brown 
457c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
458c4762a1bSJed Brown   if (xints == 0) {
459c4762a1bSJed Brown     i = 0;
460c4762a1bSJed Brown     /* left edge */
461c4762a1bSJed Brown     for (j = info.ys; j < info.ys + info.ym; j++) {
462c4762a1bSJed Brown       if (B) {
463c4762a1bSJed Brown         bjiu = b[j][i].u;
464c4762a1bSJed Brown         bjiv = b[j][i].v;
465c4762a1bSJed Brown       } else {
466c4762a1bSJed Brown         bjiu = 0.0;
467c4762a1bSJed Brown         bjiv = 0.0;
468c4762a1bSJed Brown       }
469c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
470c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
471c4762a1bSJed Brown     }
472c4762a1bSJed Brown   }
473c4762a1bSJed Brown 
474c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
475c4762a1bSJed Brown   if (xinte == info.mx) {
476c4762a1bSJed Brown     i = info.mx - 1;
477c4762a1bSJed Brown     /* right edge */
478c4762a1bSJed Brown     for (j = info.ys; j < info.ys + info.ym; j++) {
479c4762a1bSJed Brown       if (B) {
480c4762a1bSJed Brown         bjiu = b[j][i].u;
481c4762a1bSJed Brown         bjiv = b[j][i].v;
482c4762a1bSJed Brown       } else {
483c4762a1bSJed Brown         bjiu = 0.0;
484c4762a1bSJed Brown         bjiv = 0.0;
485c4762a1bSJed Brown       }
486c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
487c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
488c4762a1bSJed Brown     }
489c4762a1bSJed Brown   }
490c4762a1bSJed Brown 
491c4762a1bSJed Brown   for (k = 0; k < sweeps; k++) {
492c4762a1bSJed Brown     for (j = info.ys; j < info.ys + info.ym; j++) {
493c4762a1bSJed Brown       for (i = info.xs; i < info.xs + info.xm; i++) {
494c4762a1bSJed Brown         ptconverged = PETSC_FALSE;
495c4762a1bSJed Brown         pfnorm0     = 0.0;
496c4762a1bSJed Brown         fu          = 0.0;
497c4762a1bSJed Brown         fv          = 0.0;
498c4762a1bSJed Brown         fomega      = 0.0;
499c4762a1bSJed Brown         ftemp       = 0.0;
500c4762a1bSJed Brown         /*  Run Newton's method on a single grid point */
501c4762a1bSJed Brown         for (l = 0; l < max_its && !ptconverged; l++) {
502c4762a1bSJed Brown           if (B) {
503c4762a1bSJed Brown             bjiu     = b[j][i].u;
504c4762a1bSJed Brown             bjiv     = b[j][i].v;
505c4762a1bSJed Brown             bjiomega = b[j][i].omega;
506c4762a1bSJed Brown             bjitemp  = b[j][i].temp;
507c4762a1bSJed Brown           } else {
508c4762a1bSJed Brown             bjiu     = 0.0;
509c4762a1bSJed Brown             bjiv     = 0.0;
510c4762a1bSJed Brown             bjiomega = 0.0;
511c4762a1bSJed Brown             bjitemp  = 0.0;
512c4762a1bSJed Brown           }
513c4762a1bSJed Brown 
514c4762a1bSJed Brown           if (i != 0 && i != info.mx - 1 && j != 0 && j != info.my - 1) {
515c4762a1bSJed Brown             /* U velocity */
516c4762a1bSJed Brown             u      = x[j][i].u;
517c4762a1bSJed Brown             uxx    = (2.0 * u - x[j][i - 1].u - x[j][i + 1].u) * hydhx;
518c4762a1bSJed Brown             uyy    = (2.0 * u - x[j - 1][i].u - x[j + 1][i].u) * hxdhy;
519c4762a1bSJed Brown             fu     = uxx + uyy - .5 * (x[j + 1][i].omega - x[j - 1][i].omega) * hx - bjiu;
520c4762a1bSJed Brown             dfudu  = 2.0 * (hydhx + hxdhy);
521c4762a1bSJed Brown             /* V velocity */
522c4762a1bSJed Brown             u      = x[j][i].v;
523c4762a1bSJed Brown             uxx    = (2.0 * u - x[j][i - 1].v - x[j][i + 1].v) * hydhx;
524c4762a1bSJed Brown             uyy    = (2.0 * u - x[j - 1][i].v - x[j + 1][i].v) * hxdhy;
525c4762a1bSJed Brown             fv     = uxx + uyy + .5 * (x[j][i + 1].omega - x[j][i - 1].omega) * hy - bjiv;
526c4762a1bSJed Brown             dfvdv  = 2.0 * (hydhx + hxdhy);
527c4762a1bSJed Brown             /*
528c4762a1bSJed Brown              convective coefficients for upwinding
529c4762a1bSJed Brown              */
5309371c9d4SSatish Balay             vx     = x[j][i].u;
5319371c9d4SSatish Balay             avx    = PetscAbsScalar(vx);
5329371c9d4SSatish Balay             vxp    = .5 * (vx + avx);
5339371c9d4SSatish Balay             vxm    = .5 * (vx - avx);
5349371c9d4SSatish Balay             vy     = x[j][i].v;
5359371c9d4SSatish Balay             avy    = PetscAbsScalar(vy);
5369371c9d4SSatish Balay             vyp    = .5 * (vy + avy);
5379371c9d4SSatish Balay             vym    = .5 * (vy - avy);
538c4762a1bSJed Brown             /* Omega */
539c4762a1bSJed Brown             u      = x[j][i].omega;
540c4762a1bSJed Brown             uxx    = (2.0 * u - x[j][i - 1].omega - x[j][i + 1].omega) * hydhx;
541c4762a1bSJed Brown             uyy    = (2.0 * u - x[j - 1][i].omega - x[j + 1][i].omega) * hxdhy;
5429371c9d4SSatish Balay             fomega = uxx + uyy + (vxp * (u - x[j][i - 1].omega) + vxm * (x[j][i + 1].omega - u)) * hy + (vyp * (u - x[j - 1][i].omega) + vym * (x[j + 1][i].omega - u)) * hx - .5 * grashof * (x[j][i + 1].temp - x[j][i - 1].temp) * hy - bjiomega;
543c4762a1bSJed Brown             /* convective coefficient derivatives */
544c4762a1bSJed Brown             dfodo  = 2.0 * (hydhx + hxdhy) + ((vxp - vxm) * hy + (vyp - vym) * hx);
545c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dfodu = (u - x[j][i - 1].omega) * hy;
546c4762a1bSJed Brown             else dfodu = (x[j][i + 1].omega - u) * hy;
547c4762a1bSJed Brown 
548c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dfodv = (u - x[j - 1][i].omega) * hx;
549c4762a1bSJed Brown             else dfodv = (x[j + 1][i].omega - u) * hx;
550c4762a1bSJed Brown 
551c4762a1bSJed Brown             /* Temperature */
552c4762a1bSJed Brown             u     = x[j][i].temp;
553c4762a1bSJed Brown             uxx   = (2.0 * u - x[j][i - 1].temp - x[j][i + 1].temp) * hydhx;
554c4762a1bSJed Brown             uyy   = (2.0 * u - x[j - 1][i].temp - x[j + 1][i].temp) * hxdhy;
555c4762a1bSJed Brown             ftemp = uxx + uyy + prandtl * ((vxp * (u - x[j][i - 1].temp) + vxm * (x[j][i + 1].temp - u)) * hy + (vyp * (u - x[j - 1][i].temp) + vym * (x[j + 1][i].temp - u)) * hx) - bjitemp;
556c4762a1bSJed Brown             dftdt = 2.0 * (hydhx + hxdhy) + prandtl * ((vxp - vxm) * hy + (vyp - vym) * hx);
557c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dftdu = prandtl * (u - x[j][i - 1].temp) * hy;
558c4762a1bSJed Brown             else dftdu = prandtl * (x[j][i + 1].temp - u) * hy;
559c4762a1bSJed Brown 
560c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dftdv = prandtl * (u - x[j - 1][i].temp) * hx;
561c4762a1bSJed Brown             else dftdv = prandtl * (x[j + 1][i].temp - u) * hx;
562c4762a1bSJed Brown 
563c4762a1bSJed Brown             /* invert the system:
564c4762a1bSJed Brown              [ dfu / du     0        0        0    ][yu] = [fu]
565c4762a1bSJed Brown              [     0    dfv / dv     0        0    ][yv]   [fv]
566c4762a1bSJed Brown              [ dfo / du dfo / dv dfo / do     0    ][yo]   [fo]
567c4762a1bSJed Brown              [ dft / du dft / dv     0    dft / dt ][yt]   [ft]
568c4762a1bSJed Brown              by simple forward substitution (the matrix is lower triangular)
569c4762a1bSJed Brown            */
570c4762a1bSJed Brown             yu = fu / dfudu;
571c4762a1bSJed Brown             yv = fv / dfvdv;
572c4762a1bSJed Brown             yo = (fomega - (dfodu * yu + dfodv * yv)) / dfodo;
573c4762a1bSJed Brown             yt = (ftemp - (dftdu * yu + dftdv * yv)) / dftdt;
574c4762a1bSJed Brown 
575c4762a1bSJed Brown             x[j][i].u     = x[j][i].u - yu;
576c4762a1bSJed Brown             x[j][i].v     = x[j][i].v - yv;
577c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - yt;
578c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - yo;
579c4762a1bSJed Brown           }
580c4762a1bSJed Brown           if (i == 0) {
581c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i + 1].v - x[j][i].v) * dhx - bjiomega;
582c4762a1bSJed Brown             ftemp         = x[j][i].temp - bjitemp;
583c4762a1bSJed Brown             yo            = fomega;
584c4762a1bSJed Brown             yt            = ftemp;
585c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
586c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
587c4762a1bSJed Brown           }
588c4762a1bSJed Brown           if (i == info.mx - 1) {
589c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i].v - x[j][i - 1].v) * dhx - bjiomega;
590c4762a1bSJed Brown             ftemp         = x[j][i].temp - (PetscReal)(grashof > 0) - bjitemp;
591c4762a1bSJed Brown             yo            = fomega;
592c4762a1bSJed Brown             yt            = ftemp;
593c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
594c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
595c4762a1bSJed Brown           }
596c4762a1bSJed Brown           if (j == 0) {
597c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j + 1][i].u - x[j][i].u) * dhy - bjiomega;
598c4762a1bSJed Brown             ftemp         = x[j][i].temp - x[j + 1][i].temp - bjitemp;
599c4762a1bSJed Brown             yo            = fomega;
600c4762a1bSJed Brown             yt            = ftemp;
601c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
602c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
603c4762a1bSJed Brown           }
604c4762a1bSJed Brown           if (j == info.my - 1) {
605c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j][i].u - x[j - 1][i].u) * dhy - bjiomega;
606c4762a1bSJed Brown             ftemp         = x[j][i].temp - x[j - 1][i].temp - bjitemp;
607c4762a1bSJed Brown             yo            = fomega;
608c4762a1bSJed Brown             yt            = ftemp;
609c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
610c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
611c4762a1bSJed Brown           }
612c4762a1bSJed Brown           tot_its++;
613c4762a1bSJed Brown           pfnorm = PetscRealPart(fu * fu + fv * fv + fomega * fomega + ftemp * ftemp);
614c4762a1bSJed Brown           pfnorm = PetscSqrtReal(pfnorm);
615c4762a1bSJed Brown           pynorm = PetscRealPart(yu * yu + yv * yv + yo * yo + yt * yt);
616c4762a1bSJed Brown           pynorm = PetscSqrtReal(pynorm);
617c4762a1bSJed Brown           pxnorm = PetscRealPart(x[j][i].u * x[j][i].u + x[j][i].v * x[j][i].v + x[j][i].omega * x[j][i].omega + x[j][i].temp * x[j][i].temp);
618c4762a1bSJed Brown           pxnorm = PetscSqrtReal(pxnorm);
619c4762a1bSJed Brown           if (l == 0) pfnorm0 = pfnorm;
620c4762a1bSJed Brown           if (rtol * pfnorm0 > pfnorm || atol > pfnorm || pxnorm * stol > pynorm) ptconverged = PETSC_TRUE;
621c4762a1bSJed Brown         }
622c4762a1bSJed Brown       }
623c4762a1bSJed Brown     }
624c4762a1bSJed Brown   }
6259566063dSJacob Faibussowitsch   PetscCall(DMDAVecRestoreArrayWrite(da, localX, &x));
626*48a46eb9SPierre Jolivet   if (B) PetscCall(DMDAVecRestoreArrayRead(da, localB, &b));
6279566063dSJacob Faibussowitsch   PetscCall(DMLocalToGlobalBegin(da, localX, INSERT_VALUES, X));
6289566063dSJacob Faibussowitsch   PetscCall(DMLocalToGlobalEnd(da, localX, INSERT_VALUES, X));
6299566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(tot_its * (84.0 + 41.0 + 26.0)));
6309566063dSJacob Faibussowitsch   PetscCall(DMRestoreLocalVector(da, &localX));
631*48a46eb9SPierre Jolivet   if (B) PetscCall(DMRestoreLocalVector(da, &localB));
632c4762a1bSJed Brown   PetscFunctionReturn(0);
633c4762a1bSJed Brown }
634c4762a1bSJed Brown 
635c4762a1bSJed Brown /*TEST
636c4762a1bSJed Brown 
637c4762a1bSJed Brown    test:
638c4762a1bSJed Brown       nsize: 2
639c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full
640c4762a1bSJed Brown       requires: !single
641c4762a1bSJed Brown 
642c4762a1bSJed Brown    test:
643c4762a1bSJed Brown       suffix: 10
644c4762a1bSJed Brown       nsize: 3
645c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type symmetric_multiplicative -snes_view -da_refine 1 -ksp_type fgmres
646c4762a1bSJed Brown       requires: !single
647c4762a1bSJed Brown 
648c4762a1bSJed Brown    test:
649c4762a1bSJed Brown       suffix: 11
650c4762a1bSJed Brown       nsize: 4
651c4762a1bSJed Brown       requires: pastix
652c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 2 -da_refine 4 -ksp_type fgmres
653c4762a1bSJed Brown 
654c4762a1bSJed Brown    test:
655c4762a1bSJed Brown       suffix: 12
656c4762a1bSJed Brown       nsize: 12
657c4762a1bSJed Brown       requires: pastix
658c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 5 -da_refine 4 -ksp_type fgmres
659c4762a1bSJed Brown 
660c4762a1bSJed Brown    test:
661c4762a1bSJed Brown       suffix: 13
662c4762a1bSJed Brown       nsize: 3
663c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres -snes_mf_operator
664c4762a1bSJed Brown       requires: !single
665c4762a1bSJed Brown 
666c4762a1bSJed Brown    test:
667c4762a1bSJed Brown       suffix: 14
668c4762a1bSJed Brown       nsize: 4
669c4762a1bSJed Brown       args: -snes_monitor_short -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres
670c4762a1bSJed Brown       requires: !single
671c4762a1bSJed Brown 
672c4762a1bSJed Brown    test:
673c4762a1bSJed Brown       suffix: 14_ds
674c4762a1bSJed Brown       nsize: 4
675c4762a1bSJed Brown       args: -snes_converged_reason -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres -mat_fd_type ds
676c4762a1bSJed Brown       output_file: output/ex19_2.out
677c4762a1bSJed Brown       requires: !single
678c4762a1bSJed Brown 
679c4762a1bSJed Brown    test:
680c4762a1bSJed Brown       suffix: 17
681c4762a1bSJed Brown       args: -snes_monitor_short -ksp_pc_side right
682c4762a1bSJed Brown       requires: !single
683c4762a1bSJed Brown 
684c4762a1bSJed Brown    test:
685c4762a1bSJed Brown       suffix: 18
686798534f6SMatthew G. Knepley       args: -snes_monitor_ksp draw::draw_lg -ksp_pc_side right
687c4762a1bSJed Brown       requires: x !single
688c4762a1bSJed Brown 
689c4762a1bSJed Brown    test:
69041ba4c6cSHeeho Park       suffix: 19
69141ba4c6cSHeeho Park       nsize: 2
69241ba4c6cSHeeho Park       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -snes_type newtontrdc
69341ba4c6cSHeeho Park       requires: !single
69441ba4c6cSHeeho Park 
69541ba4c6cSHeeho Park    test:
69641ba4c6cSHeeho Park       suffix: 20
69741ba4c6cSHeeho Park       nsize: 2
69841ba4c6cSHeeho Park       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -snes_type newtontrdc -snes_trdc_use_cauchy false
69941ba4c6cSHeeho Park       requires: !single
70041ba4c6cSHeeho Park 
70141ba4c6cSHeeho Park    test:
702c4762a1bSJed Brown       suffix: 2
703c4762a1bSJed Brown       nsize: 4
704c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
705c4762a1bSJed Brown       requires: !single
706c4762a1bSJed Brown 
707c4762a1bSJed Brown    test:
708c4762a1bSJed Brown       suffix: 2_bcols1
709c4762a1bSJed Brown       nsize: 4
710c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols
711c4762a1bSJed Brown       output_file: output/ex19_2.out
712c4762a1bSJed Brown       requires: !single
713c4762a1bSJed Brown 
714c4762a1bSJed Brown    test:
715c4762a1bSJed Brown       suffix: 3
716c4762a1bSJed Brown       nsize: 4
717c4762a1bSJed Brown       requires: mumps
718c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 2
719c4762a1bSJed Brown 
720c4762a1bSJed Brown    test:
721c4762a1bSJed Brown       suffix: 4
722c4762a1bSJed Brown       nsize: 12
723c4762a1bSJed Brown       requires: mumps
724c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 5
725c4762a1bSJed Brown       output_file: output/ex19_3.out
726c4762a1bSJed Brown 
727c4762a1bSJed Brown    test:
728c4762a1bSJed Brown       suffix: 6
729c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -ksp_type fgmres -da_refine 1
730c4762a1bSJed Brown       requires: !single
731c4762a1bSJed Brown 
732c4762a1bSJed Brown    test:
733c4762a1bSJed Brown       suffix: 7
734c4762a1bSJed Brown       nsize: 3
735c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -da_refine 1 -ksp_type fgmres
736c4762a1bSJed Brown 
737c4762a1bSJed Brown       requires: !single
738c4762a1bSJed Brown    test:
739c4762a1bSJed Brown       suffix: 8
740c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_block_size 2 -pc_fieldsplit_0_fields 0,1 -pc_fieldsplit_1_fields 0,1 -pc_fieldsplit_type multiplicative -snes_view -fieldsplit_pc_type lu -da_refine 1 -ksp_type fgmres
741c4762a1bSJed Brown       requires: !single
742c4762a1bSJed Brown 
743c4762a1bSJed Brown    test:
744c4762a1bSJed Brown       suffix: 9
745c4762a1bSJed Brown       nsize: 3
746c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres
747c4762a1bSJed Brown       requires: !single
748c4762a1bSJed Brown 
749c4762a1bSJed Brown    test:
750c4762a1bSJed Brown       suffix: aspin
751c4762a1bSJed Brown       nsize: 4
752c4762a1bSJed Brown       args: -da_refine 3 -da_overlap 2 -snes_monitor_short -snes_type aspin -grashof 4e4 -lidvelocity 100 -ksp_monitor_short
753c4762a1bSJed Brown       requires: !single
754c4762a1bSJed Brown 
755c4762a1bSJed Brown    test:
756c4762a1bSJed Brown       suffix: bcgsl
757c4762a1bSJed Brown       nsize: 2
758c4762a1bSJed Brown       args: -ksp_type bcgsl -ksp_monitor_short -da_refine 2 -ksp_bcgsl_ell 3 -snes_view
759c4762a1bSJed Brown       requires: !single
760c4762a1bSJed Brown 
761c4762a1bSJed Brown    test:
762c4762a1bSJed Brown       suffix: bcols1
763c4762a1bSJed Brown       nsize: 2
764c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -mat_fd_coloring_bcols 1
765c4762a1bSJed Brown       output_file: output/ex19_1.out
766c4762a1bSJed Brown       requires: !single
767c4762a1bSJed Brown 
768c4762a1bSJed Brown    test:
769c4762a1bSJed Brown       suffix: bjacobi
770c4762a1bSJed Brown       nsize: 4
771c4762a1bSJed Brown       args: -da_refine 4 -ksp_type fgmres -pc_type bjacobi -pc_bjacobi_blocks 2 -sub_ksp_type gmres -sub_ksp_max_it 2 -sub_pc_type bjacobi -sub_sub_ksp_type preonly -sub_sub_pc_type ilu -snes_monitor_short
772c4762a1bSJed Brown       requires: !single
773c4762a1bSJed Brown 
774c4762a1bSJed Brown    test:
775c4762a1bSJed Brown       suffix: cgne
776c4762a1bSJed Brown       args: -da_refine 2 -pc_type lu -ksp_type cgne -ksp_monitor_short -ksp_converged_reason -ksp_view -ksp_norm_type unpreconditioned
777c4762a1bSJed Brown       filter: grep -v HERMITIAN
778c4762a1bSJed Brown       requires: !single
779c4762a1bSJed Brown 
780c4762a1bSJed Brown    test:
781c4762a1bSJed Brown       suffix: cgs
782c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type cgs
783c4762a1bSJed Brown       requires: !single
784c4762a1bSJed Brown 
785c4762a1bSJed Brown    test:
786c4762a1bSJed Brown       suffix: composite_fieldsplit
787c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,none -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
788c4762a1bSJed Brown       requires: !single
789c4762a1bSJed Brown 
790c4762a1bSJed Brown    test:
791c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi
792c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
793c4762a1bSJed Brown       requires: !single
794c4762a1bSJed Brown 
795c4762a1bSJed Brown    test:
796c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi_2
797c4762a1bSJed Brown       nsize: 4
798c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
799c4762a1bSJed Brown       requires: !single
800c4762a1bSJed Brown 
801c4762a1bSJed Brown    test:
802c4762a1bSJed Brown       suffix: composite_gs_newton
803c4762a1bSJed Brown       nsize: 2
804c4762a1bSJed Brown       args: -da_refine 3 -grashof 4e4 -lidvelocity 100 -snes_monitor_short -snes_type composite -snes_composite_type additiveoptimal -snes_composite_sneses ngs,newtonls -sub_0_snes_max_it 20 -sub_1_pc_type mg
805c4762a1bSJed Brown       requires: !single
806c4762a1bSJed Brown 
807c4762a1bSJed Brown    test:
808c4762a1bSJed Brown       suffix: cuda
809c4762a1bSJed Brown       requires: cuda !single
810c4762a1bSJed Brown       args: -dm_vec_type cuda -dm_mat_type aijcusparse -pc_type none -ksp_type fgmres -snes_monitor_short -snes_rtol 1.e-5
811c4762a1bSJed Brown 
812c4762a1bSJed Brown    test:
813c4762a1bSJed Brown       suffix: draw
814c4762a1bSJed Brown       args: -pc_type fieldsplit -snes_view draw -fieldsplit_x_velocity_pc_type mg -fieldsplit_x_velocity_pc_mg_galerkin pmat -fieldsplit_x_velocity_pc_mg_levels 2 -da_refine 1 -fieldsplit_x_velocity_mg_coarse_pc_type svd
815c4762a1bSJed Brown       requires: x !single
816c4762a1bSJed Brown 
817c4762a1bSJed Brown    test:
818c4762a1bSJed Brown       suffix: drawports
819c4762a1bSJed Brown       args: -snes_monitor_solution draw::draw_ports -da_refine 1
820c4762a1bSJed Brown       output_file: output/ex19_draw.out
821c4762a1bSJed Brown       requires: x !single
822c4762a1bSJed Brown 
823c4762a1bSJed Brown    test:
824c4762a1bSJed Brown       suffix: fas
825c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
826c4762a1bSJed Brown       requires: !single
827c4762a1bSJed Brown 
828c4762a1bSJed Brown    test:
829c4762a1bSJed Brown       suffix: fas_full
830c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -snes_fas_type full -snes_fas_full_downsweep -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
831c4762a1bSJed Brown       requires: !single
832c4762a1bSJed Brown 
833c4762a1bSJed Brown    test:
834c4762a1bSJed Brown       suffix: fdcoloring_ds
835c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
836c4762a1bSJed Brown       output_file: output/ex19_2.out
837c4762a1bSJed Brown       requires: !single
838c4762a1bSJed Brown 
839c4762a1bSJed Brown    test:
840c4762a1bSJed Brown       suffix: fdcoloring_ds_baij
841c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -dm_mat_type baij
842c4762a1bSJed Brown       output_file: output/ex19_2.out
843c4762a1bSJed Brown       requires: !single
844c4762a1bSJed Brown 
845c4762a1bSJed Brown    test:
846c4762a1bSJed Brown       suffix: fdcoloring_ds_bcols1
847c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols 1
848c4762a1bSJed Brown       output_file: output/ex19_2.out
849c4762a1bSJed Brown       requires: !single
850c4762a1bSJed Brown 
851c4762a1bSJed Brown    test:
852c4762a1bSJed Brown       suffix: fdcoloring_wp
853c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg
854c4762a1bSJed Brown       requires: !single
855c4762a1bSJed Brown 
856c4762a1bSJed Brown    test:
857c4762a1bSJed Brown       suffix: fdcoloring_wp_baij
858c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -dm_mat_type baij
859c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
860c4762a1bSJed Brown       requires: !single
861c4762a1bSJed Brown 
862c4762a1bSJed Brown    test:
863c4762a1bSJed Brown       suffix: fdcoloring_wp_bcols1
864c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -mat_fd_coloring_bcols 1
865c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
866c4762a1bSJed Brown       requires: !single
867c4762a1bSJed Brown 
868c4762a1bSJed Brown    test:
869c4762a1bSJed Brown       suffix: fieldsplit_2
870c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
871c4762a1bSJed Brown       requires: !single
872c4762a1bSJed Brown 
873c4762a1bSJed Brown    test:
874c4762a1bSJed Brown       suffix: fieldsplit_3
875c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
876c4762a1bSJed Brown       requires: !single
877c4762a1bSJed Brown 
878c4762a1bSJed Brown    test:
879c4762a1bSJed Brown       suffix: fieldsplit_4
880c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
881c4762a1bSJed Brown       requires: !single
882c4762a1bSJed Brown 
883c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
884c4762a1bSJed Brown    test:
885c4762a1bSJed Brown       suffix: fieldsplit_hypre
886c4762a1bSJed Brown       nsize: 2
887263f2b91SStefano Zampini       requires: hypre mumps !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
888c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_type hypre -fieldsplit_1_pc_hypre_type boomeramg -snes_monitor_short -ksp_monitor_short
889c4762a1bSJed Brown 
890c4762a1bSJed Brown    test:
891c4762a1bSJed Brown       suffix: fieldsplit_mumps
892c4762a1bSJed Brown       nsize: 2
893c4762a1bSJed Brown       requires: mumps
894c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_factor_mat_solver_type mumps
895c4762a1bSJed Brown       output_file: output/ex19_fieldsplit_5.out
896c4762a1bSJed Brown 
897c4762a1bSJed Brown    test:
898c4762a1bSJed Brown       suffix: greedy_coloring
899c4762a1bSJed Brown       nsize: 2
900c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_fd_color -snes_fd_color_use_mat -mat_coloring_type greedy -mat_coloring_weight_type lf -mat_coloring_view> ex19_greedy_coloring.tmp 2>&1
901c4762a1bSJed Brown       requires: !single
902c4762a1bSJed Brown 
903c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
904c4762a1bSJed Brown    test:
905c4762a1bSJed Brown       suffix: hypre
906c4762a1bSJed Brown       nsize: 2
907263f2b91SStefano Zampini       requires: hypre !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
908263f2b91SStefano Zampini       args: -da_refine 3 -snes_monitor_short -pc_type hypre -ksp_norm_type unpreconditioned
909c4762a1bSJed Brown 
910263f2b91SStefano Zampini    # ibcgs is broken when using device vectors
911c4762a1bSJed Brown    test:
912c4762a1bSJed Brown       suffix: ibcgs
913c4762a1bSJed Brown       nsize: 2
914c4762a1bSJed Brown       args: -ksp_type ibcgs -ksp_monitor_short -da_refine 2 -snes_view
915c4762a1bSJed Brown       requires: !complex !single
916c4762a1bSJed Brown 
917c4762a1bSJed Brown    test:
918c4762a1bSJed Brown       suffix: kaczmarz
919c4762a1bSJed Brown       nsize: 2
920c4762a1bSJed Brown       args: -pc_type kaczmarz -ksp_monitor_short -snes_monitor_short -snes_view
921c4762a1bSJed Brown       requires: !single
922c4762a1bSJed Brown 
923c4762a1bSJed Brown    test:
924c4762a1bSJed Brown       suffix: klu
925c4762a1bSJed Brown       requires: suitesparse
926c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu
927c4762a1bSJed Brown       output_file: output/ex19_superlu.out
928c4762a1bSJed Brown 
929c4762a1bSJed Brown    test:
930c4762a1bSJed Brown       suffix: klu_2
931c4762a1bSJed Brown       requires: suitesparse
9324ac6704cSBarry Smith       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -pc_factor_mat_ordering_type nd
933c4762a1bSJed Brown       output_file: output/ex19_superlu.out
934c4762a1bSJed Brown 
935c4762a1bSJed Brown    test:
936c4762a1bSJed Brown       suffix: klu_3
937c4762a1bSJed Brown       requires: suitesparse
938c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -mat_klu_use_btf 0
939c4762a1bSJed Brown       output_file: output/ex19_superlu.out
940c4762a1bSJed Brown 
941c4762a1bSJed Brown    test:
942c4762a1bSJed Brown       suffix: ml
943c4762a1bSJed Brown       nsize: 2
944c4762a1bSJed Brown       requires: ml
945c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type ml
946c4762a1bSJed Brown 
947c4762a1bSJed Brown    test:
948c4762a1bSJed Brown       suffix: ngmres_fas
949c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type ngmres -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_ngs_sweeps 3 -npc_fas_levels_snes_ngs_atol 0.0 -npc_fas_levels_snes_ngs_stol 0.0 -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_snes_max_it 1 -npc_snes_fas_smoothup 6 -npc_snes_fas_smoothdown 6 -lidvelocity 100 -grashof 4e4
950c4762a1bSJed Brown       requires: !single
951c4762a1bSJed Brown 
952c4762a1bSJed Brown    test:
953c4762a1bSJed Brown       suffix: ngmres_fas_gssecant
954c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_type ngmres -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_max_it 6 -npc_fas_levels_snes_ngs_secant -npc_fas_levels_snes_ngs_max_it 1 -npc_fas_coarse_snes_max_it 1 -lidvelocity 100 -grashof 4e4
955c4762a1bSJed Brown       requires: !single
956c4762a1bSJed Brown 
957c4762a1bSJed Brown    test:
958c4762a1bSJed Brown       suffix: ngmres_fas_ms
959c4762a1bSJed Brown       nsize: 2
960c4762a1bSJed Brown       args: -snes_grid_sequence 2 -lidvelocity 200 -grashof 1e4 -snes_monitor_short -snes_view -snes_converged_reason -snes_type ngmres -npc_snes_type fas -npc_fas_coarse_snes_type newtonls -npc_fas_coarse_ksp_type preonly -npc_snes_max_it 1
961c4762a1bSJed Brown       requires: !single
962c4762a1bSJed Brown 
963c4762a1bSJed Brown    test:
964c4762a1bSJed Brown       suffix: ngmres_nasm
965c4762a1bSJed Brown       nsize: 4
966c4762a1bSJed Brown       args: -da_refine 4 -da_overlap 2 -snes_monitor_short -snes_type ngmres -snes_max_it 10 -npc_snes_type nasm -npc_snes_nasm_type basic -grashof 4e4 -lidvelocity 100
967c4762a1bSJed Brown       requires: !single
968c4762a1bSJed Brown 
969c4762a1bSJed Brown    test:
970c4762a1bSJed Brown       suffix: ngs
971c4762a1bSJed Brown       args: -snes_type ngs -snes_view -snes_monitor -snes_rtol 1e-4
972c4762a1bSJed Brown       requires: !single
973c4762a1bSJed Brown 
974c4762a1bSJed Brown    test:
975c4762a1bSJed Brown       suffix: ngs_fd
976c4762a1bSJed Brown       args: -snes_type ngs -snes_ngs_secant -snes_view -snes_monitor -snes_rtol 1e-4
977c4762a1bSJed Brown       requires: !single
978c4762a1bSJed Brown 
979c4762a1bSJed Brown    test:
980c4762a1bSJed Brown       suffix: parms
981c4762a1bSJed Brown       nsize: 2
982c4762a1bSJed Brown       requires: parms
983c4762a1bSJed Brown       args: -pc_type parms -ksp_monitor_short -snes_view
984c4762a1bSJed Brown 
985c4762a1bSJed Brown    test:
986c4762a1bSJed Brown       suffix: superlu
987c4762a1bSJed Brown       requires: superlu
988c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu
989c4762a1bSJed Brown 
990c4762a1bSJed Brown    test:
991c4762a1bSJed Brown       suffix: superlu_sell
992c4762a1bSJed Brown       requires: superlu
993c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu -dm_mat_type sell -pc_factor_mat_ordering_type natural
994c4762a1bSJed Brown       output_file: output/ex19_superlu.out
995c4762a1bSJed Brown 
996c4762a1bSJed Brown    test:
997c4762a1bSJed Brown       suffix: superlu_dist
998c4762a1bSJed Brown       requires: superlu_dist
999c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1000c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1001c4762a1bSJed Brown 
1002c4762a1bSJed Brown    test:
1003c4762a1bSJed Brown       suffix: superlu_dist_2
1004c4762a1bSJed Brown       nsize: 2
1005c4762a1bSJed Brown       requires: superlu_dist
1006c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1007c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1008c4762a1bSJed Brown 
1009c4762a1bSJed Brown    test:
10103e558968SBarry Smith       suffix: superlu_dist_3d
10113e558968SBarry Smith       nsize: 4
10123e558968SBarry Smith       requires: superlu_dist !defined(PETSCTEST_VALGRIND)
10133e558968SBarry Smith       filter: grep -v iam | grep -v openMP
10143e558968SBarry Smith       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist -mat_superlu_dist_3d -mat_superlu_dist_d 2 -snes_view -snes_monitor -ksp_monitor
10153e558968SBarry Smith 
10163e558968SBarry Smith    test:
1017c4762a1bSJed Brown       suffix: superlu_equil
1018c4762a1bSJed Brown       requires: superlu
1019c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil
1020c4762a1bSJed Brown 
1021c4762a1bSJed Brown    test:
1022c4762a1bSJed Brown       suffix: superlu_equil_sell
1023c4762a1bSJed Brown       requires: superlu
1024c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil -dm_mat_type sell -pc_factor_mat_ordering_type natural
1025c4762a1bSJed Brown       output_file: output/ex19_superlu_equil.out
1026c4762a1bSJed Brown 
1027c4762a1bSJed Brown    test:
1028c4762a1bSJed Brown       suffix: tcqmr
1029c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tcqmr
1030c4762a1bSJed Brown       requires: !single
1031c4762a1bSJed Brown 
1032c4762a1bSJed Brown    test:
1033c4762a1bSJed Brown       suffix: tfqmr
1034c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tfqmr
1035c4762a1bSJed Brown       requires: !single
1036c4762a1bSJed Brown 
1037c4762a1bSJed Brown    test:
1038c4762a1bSJed Brown       suffix: umfpack
1039c4762a1bSJed Brown       requires: suitesparse
10402c7c0729SBarry Smith       args: -da_refine 2 -pc_type lu -pc_factor_mat_solver_type umfpack -snes_view -snes_monitor_short -ksp_monitor_short -pc_factor_mat_ordering_type external
1041c4762a1bSJed Brown 
1042c4762a1bSJed Brown    test:
1043c4762a1bSJed Brown       suffix: tut_1
1044c4762a1bSJed Brown       nsize: 4
1045c4762a1bSJed Brown       requires: !single
1046c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view
1047c4762a1bSJed Brown 
1048c4762a1bSJed Brown    test:
1049c4762a1bSJed Brown       suffix: tut_2
1050c4762a1bSJed Brown       nsize: 4
1051c4762a1bSJed Brown       requires: !single
1052c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type mg
1053c4762a1bSJed Brown 
1054c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
1055c4762a1bSJed Brown    test:
1056c4762a1bSJed Brown       suffix: tut_3
1057c4762a1bSJed Brown       nsize: 4
1058263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
1059c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type hypre
1060c4762a1bSJed Brown 
1061c4762a1bSJed Brown    test:
1062c4762a1bSJed Brown       suffix: tut_8
1063c4762a1bSJed Brown       nsize: 4
1064c4762a1bSJed Brown       requires: ml !single
1065c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type ml
1066c4762a1bSJed Brown 
1067c4762a1bSJed Brown    test:
1068c4762a1bSJed Brown       suffix: tut_4
1069c4762a1bSJed Brown       nsize: 1
1070c4762a1bSJed Brown       requires: !single
1071c4762a1bSJed Brown       args: -da_refine 5 -log_view
1072c4762a1bSJed Brown       filter: head -n 2
1073c4762a1bSJed Brown       filter_output: head -n 2
1074c4762a1bSJed Brown 
1075c4762a1bSJed Brown    test:
1076c4762a1bSJed Brown       suffix: tut_5
1077c4762a1bSJed Brown       nsize: 1
1078c4762a1bSJed Brown       requires: !single
1079c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1080c4762a1bSJed Brown       filter: head -n 2
1081c4762a1bSJed Brown       filter_output: head -n 2
1082c4762a1bSJed Brown 
1083c4762a1bSJed Brown    test:
1084c4762a1bSJed Brown       suffix: tut_6
1085c4762a1bSJed Brown       nsize: 4
1086c4762a1bSJed Brown       requires: !single
1087c4762a1bSJed Brown       args: -da_refine 5 -log_view
1088c4762a1bSJed Brown       filter: head -n 2
1089c4762a1bSJed Brown       filter_output: head -n 2
1090c4762a1bSJed Brown 
1091c4762a1bSJed Brown    test:
1092c4762a1bSJed Brown       suffix: tut_7
1093c4762a1bSJed Brown       nsize: 4
1094c4762a1bSJed Brown       requires: !single
1095c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1096c4762a1bSJed Brown       filter: head -n 2
1097c4762a1bSJed Brown       filter_output: head -n 2
1098c4762a1bSJed Brown 
1099c4762a1bSJed Brown    test:
1100c4762a1bSJed Brown       suffix: cuda_1
1101c4762a1bSJed Brown       nsize: 1
1102c4762a1bSJed Brown       requires: cuda
110373f7197eSJed Brown       args: -snes_monitor -dm_mat_type seqaijcusparse -dm_vec_type seqcuda -pc_type gamg -pc_gamg_esteig_ksp_max_it 10 -ksp_monitor -mg_levels_ksp_max_it 3
1104c4762a1bSJed Brown 
1105c4762a1bSJed Brown    test:
1106c4762a1bSJed Brown       suffix: cuda_2
1107c4762a1bSJed Brown       nsize: 3
1108c4762a1bSJed Brown       requires: cuda !single
110973f7197eSJed Brown       args: -snes_monitor -dm_mat_type mpiaijcusparse -dm_vec_type mpicuda -pc_type gamg -pc_gamg_esteig_ksp_max_it 10 -ksp_monitor  -mg_levels_ksp_max_it 3
1110c4762a1bSJed Brown 
1111c4762a1bSJed Brown    test:
1112d38ac8baSRichard Tran Mills       suffix: cuda_dm_bind_below
1113d38ac8baSRichard Tran Mills       nsize: 2
1114d38ac8baSRichard Tran Mills       requires: cuda
1115d38ac8baSRichard Tran Mills       args: -dm_mat_type aijcusparse -dm_vec_type cuda -da_refine 3 -pc_type mg -mg_levels_ksp_type chebyshev -mg_levels_pc_type jacobi -log_view -pc_mg_log -dm_bind_below 10000
111617fc1e00SRichard Tran Mills       filter: awk "/Level/ {print \$NF}"
1117d38ac8baSRichard Tran Mills 
1118d38ac8baSRichard Tran Mills    test:
1119d38ac8baSRichard Tran Mills       suffix: viennacl_dm_bind_below
1120d38ac8baSRichard Tran Mills       nsize: 2
1121d38ac8baSRichard Tran Mills       requires: viennacl
1122d38ac8baSRichard Tran Mills       args: -dm_mat_type aijviennacl -dm_vec_type viennacl -da_refine 3 -pc_type mg -mg_levels_ksp_type chebyshev -mg_levels_pc_type jacobi -log_view -pc_mg_log -dm_bind_below 10000
112317fc1e00SRichard Tran Mills       filter: awk "/Level/ {print \$NF}"
1124d38ac8baSRichard Tran Mills 
1125d38ac8baSRichard Tran Mills    test:
1126c4762a1bSJed Brown       suffix: seqbaijmkl
1127c4762a1bSJed Brown       nsize: 1
1128dfd57a17SPierre Jolivet       requires: defined(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1129c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1130c4762a1bSJed Brown 
1131c4762a1bSJed Brown    test:
1132c4762a1bSJed Brown       suffix: mpibaijmkl
1133c4762a1bSJed Brown       nsize: 2
1134dfd57a17SPierre Jolivet       requires:  defined(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1135c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1136c4762a1bSJed Brown 
1137c4762a1bSJed Brown    test:
1138c4762a1bSJed Brown      suffix: cpardiso
1139c4762a1bSJed Brown      nsize: 4
1140c4762a1bSJed Brown      requires: mkl_cpardiso
1141c4762a1bSJed Brown      args: -pc_type lu -pc_factor_mat_solver_type mkl_cpardiso -ksp_monitor
1142c4762a1bSJed Brown 
1143c4762a1bSJed Brown    test:
1144c4762a1bSJed Brown      suffix: logviewmemory
1145dfd57a17SPierre Jolivet      requires: defined(PETSC_USE_LOG) !defined(PETSCTEST_VALGRIND)
1146c4762a1bSJed Brown      args: -log_view -log_view_memory -da_refine 4
1147c4762a1bSJed Brown      filter: grep MatFDColorSetUp | wc -w | xargs  -I % sh -c "expr % \> 21"
1148c4762a1bSJed Brown 
1149534f0846SBarry Smith    test:
1150534f0846SBarry Smith      suffix: fs
1151534f0846SBarry Smith      args: -pc_type fieldsplit -da_refine 3  -all_ksp_monitor -fieldsplit_y_velocity_pc_type lu  -fieldsplit_temperature_pc_type lu -fieldsplit_x_velocity_pc_type lu  -snes_view
1152534f0846SBarry Smith 
115371f558e3SSatish Balay    test:
1154a8e42557SLawrence Mitchell      suffix: asm_matconvert
1155a8e42557SLawrence Mitchell      args: -mat_type aij -pc_type asm -pc_asm_sub_mat_type dense -snes_view
1156a8e42557SLawrence Mitchell 
11578bf83915SBarry Smith    test:
11588bf83915SBarry Smith       suffix: euclid
11598bf83915SBarry Smith       nsize: 2
1160263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11618bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid
11628bf83915SBarry Smith 
11638bf83915SBarry Smith    test:
11648bf83915SBarry Smith       suffix: euclid_bj
11658bf83915SBarry Smith       nsize: 2
1166263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11678bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid -pc_hypre_euclid_bj
11688bf83915SBarry Smith 
11698bf83915SBarry Smith    test:
11708bf83915SBarry Smith       suffix: euclid_droptolerance
11718bf83915SBarry Smith       nsize: 1
1172263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11738bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid -pc_hypre_euclid_droptolerance .1
11748bf83915SBarry Smith 
1175660278c0SBarry Smith    test:
1176660278c0SBarry Smith       suffix: failure_size
1177660278c0SBarry Smith       nsize: 1
1178660278c0SBarry Smith       requires: !defined(PETSC_USE_64BIT_INDICES) !defined(PETSCTEST_VALGRIND)
1179660278c0SBarry Smith       args: -da_refine 100 -petsc_ci_portable_error_output -error_output_stdout
1180f4bc716fSBarry Smith       filter: egrep -v "(options_left|memory block|leaked context|is not freed before MPI_Finalize|Could be the program crashed)"
1181660278c0SBarry Smith 
1182c4762a1bSJed Brown TEST*/
1183