xref: /petsc/src/snes/tutorials/ex19.c (revision b122ec5aa1bd4469eb4e0673542fb7de3f411254)
1c4762a1bSJed Brown 
/*
   Usage text handed to PetscInitialize() in main().  Option arguments are
   written with '&lt' and '&gt' in place of '<' and '>'.
*/
static char help[] = "Nonlinear driven cavity with multigrid in 2d.\n \
  \n\
The 2D driven cavity problem is solved in a velocity-vorticity formulation.\n\
The flow can be driven with the lid or with buoyancy or both:\n\
  -lidvelocity &ltlid&gt, where &ltlid&gt = dimensionless velocity of lid\n\
  -grashof &ltgr&gt, where &ltgr&gt = dimensionless temperature gradient\n\
  -prandtl &ltpr&gt, where &ltpr&gt = dimensionless thermal/momentum diffusivity ratio\n\
 -contours : draw contour plots of solution\n\n";
10c4762a1bSJed Brown /* in HTML, '&lt' = '<' and '&gt' = '>' */
11c4762a1bSJed Brown 
12c4762a1bSJed Brown /*
13c4762a1bSJed Brown       See src/ksp/ksp/tutorials/ex45.c
14c4762a1bSJed Brown */
15c4762a1bSJed Brown 
16c4762a1bSJed Brown /*T
17c4762a1bSJed Brown    Concepts: SNES^solving a system of nonlinear equations (parallel multicomponent example);
18c4762a1bSJed Brown    Concepts: DMDA^using distributed arrays;
19c4762a1bSJed Brown    Concepts: multicomponent
20c4762a1bSJed Brown    Processors: n
21c4762a1bSJed Brown T*/
22c4762a1bSJed Brown 
23c4762a1bSJed Brown /*F-----------------------------------------------------------------------
24c4762a1bSJed Brown 
25c4762a1bSJed Brown     We thank David E. Keyes for contributing the driven cavity discretization within this example code.
26c4762a1bSJed Brown 
27c4762a1bSJed Brown     This problem is modeled by the partial differential equation system
28c4762a1bSJed Brown 
29c4762a1bSJed Brown \begin{eqnarray}
30c4762a1bSJed Brown         - \triangle U - \nabla_y \Omega & = & 0  \\
31c4762a1bSJed Brown         - \triangle V + \nabla_x\Omega & = & 0  \\
32c4762a1bSJed Brown         - \triangle \Omega + \nabla \cdot ([U*\Omega,V*\Omega]) - GR* \nabla_x T & = & 0  \\
33c4762a1bSJed Brown         - \triangle T + PR* \nabla \cdot ([U*T,V*T]) & = & 0
34c4762a1bSJed Brown \end{eqnarray}
35c4762a1bSJed Brown 
36c4762a1bSJed Brown     in the unit square, which is uniformly discretized in each of x and y in this simple encoding.
37c4762a1bSJed Brown 
38c4762a1bSJed Brown     No-slip, rigid-wall Dirichlet conditions are used for $ [U,V]$.
39c4762a1bSJed Brown     Dirichlet conditions are used for Omega, based on the definition of
40c4762a1bSJed Brown     vorticity: $ \Omega = - \nabla_y U + \nabla_x V$, where along each
41c4762a1bSJed Brown     constant coordinate boundary, the tangential derivative is zero.
42c4762a1bSJed Brown     Dirichlet conditions are used for T on the left and right walls,
43c4762a1bSJed Brown     and insulation homogeneous Neumann conditions are used for T on
44c4762a1bSJed Brown     the top and bottom walls.
45c4762a1bSJed Brown 
46c4762a1bSJed Brown     A finite difference approximation with the usual 5-point stencil
47c4762a1bSJed Brown     is used to discretize the boundary value problem to obtain a
48c4762a1bSJed Brown     nonlinear system of equations.  Upwinding is used for the divergence
49c4762a1bSJed Brown     (convective) terms and central for the gradient (source) terms.
50c4762a1bSJed Brown 
51c4762a1bSJed Brown     The Jacobian can be either
52c4762a1bSJed Brown       * formed via finite differencing using coloring (the default), or
53c4762a1bSJed Brown       * applied matrix-free via the option -snes_mf
54c4762a1bSJed Brown         (for larger grid problems this variant may not converge
55c4762a1bSJed Brown         without a preconditioner due to ill-conditioning).
56c4762a1bSJed Brown 
57c4762a1bSJed Brown   ------------------------------------------------------------------------F*/
58c4762a1bSJed Brown 
/*
   Include "petscdmda.h" so that we can use distributed arrays (DMDAs).
   Include "petscsnes.h" so that we can use SNES solvers.  Note that this
   file automatically includes:
     petscsys.h    - base PETSc routines   petscvec.h - vectors
     petscmat.h    - matrices              petscis.h  - index sets
     petscviewer.h - viewers               petscpc.h  - preconditioners
     petscksp.h    - Krylov subspace methods (linear solvers)
*/
69c4762a1bSJed Brown #if defined(PETSC_APPLE_FRAMEWORK)
70c4762a1bSJed Brown #import <PETSc/petscsnes.h>
71c4762a1bSJed Brown #import <PETSc/petscdmda.h>
72c4762a1bSJed Brown #else
73c4762a1bSJed Brown #include <petscsnes.h>
74c4762a1bSJed Brown #include <petscdm.h>
75c4762a1bSJed Brown #include <petscdmda.h>
76c4762a1bSJed Brown #endif
77c4762a1bSJed Brown 
78c4762a1bSJed Brown /*
79c4762a1bSJed Brown    User-defined routines and data structures
80c4762a1bSJed Brown */
81c4762a1bSJed Brown typedef struct {
82c4762a1bSJed Brown   PetscScalar u,v,omega,temp;
83c4762a1bSJed Brown } Field;
84c4762a1bSJed Brown 
85c4762a1bSJed Brown PetscErrorCode FormFunctionLocal(DMDALocalInfo*,Field**,Field**,void*);
86c4762a1bSJed Brown 
87c4762a1bSJed Brown typedef struct {
88c4762a1bSJed Brown   PetscReal   lidvelocity,prandtl,grashof;  /* physical parameters */
89c4762a1bSJed Brown   PetscBool   draw_contours;                /* flag - 1 indicates drawing contours */
90c4762a1bSJed Brown } AppCtx;
91c4762a1bSJed Brown 
92c4762a1bSJed Brown extern PetscErrorCode FormInitialGuess(AppCtx*,DM,Vec);
93c4762a1bSJed Brown extern PetscErrorCode NonlinearGS(SNES,Vec,Vec,void*);
94c4762a1bSJed Brown 
95c4762a1bSJed Brown int main(int argc,char **argv)
96c4762a1bSJed Brown {
97c4762a1bSJed Brown   AppCtx         user;                /* user-defined work context */
98c4762a1bSJed Brown   PetscInt       mx,my,its;
99c4762a1bSJed Brown   MPI_Comm       comm;
100c4762a1bSJed Brown   SNES           snes;
101c4762a1bSJed Brown   DM             da;
102c4762a1bSJed Brown   Vec            x;
103c4762a1bSJed Brown 
104*b122ec5aSJacob Faibussowitsch   CHKERRQ(PetscInitialize(&argc,&argv,(char*)0,help));
105c4762a1bSJed Brown 
106c4762a1bSJed Brown   PetscFunctionBeginUser;
107c4762a1bSJed Brown   comm = PETSC_COMM_WORLD;
1085f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESCreate(comm,&snes));
109c4762a1bSJed Brown 
110c4762a1bSJed Brown   /*
111c4762a1bSJed Brown       Create distributed array object to manage parallel grid and vectors
112c4762a1bSJed Brown       for principal unknowns (x) and governing residuals (f)
113c4762a1bSJed Brown   */
1145f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDACreate2d(PETSC_COMM_WORLD,DM_BOUNDARY_NONE,DM_BOUNDARY_NONE,DMDA_STENCIL_STAR,4,4,PETSC_DECIDE,PETSC_DECIDE,4,1,0,0,&da));
1155f80ce2aSJacob Faibussowitsch   CHKERRQ(DMSetFromOptions(da));
1165f80ce2aSJacob Faibussowitsch   CHKERRQ(DMSetUp(da));
1175f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESSetDM(snes,(DM)da));
1185f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESSetNGS(snes, NonlinearGS, (void*)&user));
119c4762a1bSJed Brown 
1205f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAGetInfo(da,0,&mx,&my,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE));
121c4762a1bSJed Brown   /*
122c4762a1bSJed Brown      Problem parameters (velocity of lid, prandtl, and grashof numbers)
123c4762a1bSJed Brown   */
124c4762a1bSJed Brown   user.lidvelocity = 1.0/(mx*my);
125c4762a1bSJed Brown   user.prandtl     = 1.0;
126c4762a1bSJed Brown   user.grashof     = 1.0;
127c4762a1bSJed Brown 
1285f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsGetReal(NULL,NULL,"-lidvelocity",&user.lidvelocity,NULL));
1295f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsGetReal(NULL,NULL,"-prandtl",&user.prandtl,NULL));
1305f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsGetReal(NULL,NULL,"-grashof",&user.grashof,NULL));
1315f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsHasName(NULL,NULL,"-contours",&user.draw_contours));
132c4762a1bSJed Brown 
1335f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDASetFieldName(da,0,"x_velocity"));
1345f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDASetFieldName(da,1,"y_velocity"));
1355f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDASetFieldName(da,2,"Omega"));
1365f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDASetFieldName(da,3,"temperature"));
137c4762a1bSJed Brown 
138c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
139c4762a1bSJed Brown      Create user context, set problem data, create vector data structures.
140c4762a1bSJed Brown      Also, compute the initial guess.
141c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
142c4762a1bSJed Brown 
143c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
144c4762a1bSJed Brown      Create nonlinear solver context
145c4762a1bSJed Brown 
146c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1475f80ce2aSJacob Faibussowitsch   CHKERRQ(DMSetApplicationContext(da,&user));
1485f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDASNESSetFunctionLocal(da,INSERT_VALUES,(PetscErrorCode (*)(DMDALocalInfo*,void*,void*,void*))FormFunctionLocal,&user));
1495f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESSetFromOptions(snes));
1505f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(comm,"lid velocity = %g, prandtl # = %g, grashof # = %g\n",(double)user.lidvelocity,(double)user.prandtl,(double)user.grashof));
151c4762a1bSJed Brown 
152c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
153c4762a1bSJed Brown      Solve the nonlinear system
154c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1555f80ce2aSJacob Faibussowitsch   CHKERRQ(DMCreateGlobalVector(da,&x));
1565f80ce2aSJacob Faibussowitsch   CHKERRQ(FormInitialGuess(&user,da,x));
157c4762a1bSJed Brown 
1585f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESSolve(snes,NULL,x));
159c4762a1bSJed Brown 
1605f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESGetIterationNumber(snes,&its));
1615f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(comm,"Number of SNES iterations = %D\n", its));
162c4762a1bSJed Brown 
163c4762a1bSJed Brown   /*
164c4762a1bSJed Brown      Visualize solution
165c4762a1bSJed Brown   */
166c4762a1bSJed Brown   if (user.draw_contours) {
1675f80ce2aSJacob Faibussowitsch     CHKERRQ(VecView(x,PETSC_VIEWER_DRAW_WORLD));
168c4762a1bSJed Brown   }
169c4762a1bSJed Brown 
170c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
171c4762a1bSJed Brown      Free work space.  All PETSc objects should be destroyed when they
172c4762a1bSJed Brown      are no longer needed.
173c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
1745f80ce2aSJacob Faibussowitsch   CHKERRQ(VecDestroy(&x));
1755f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDestroy(&da));
1765f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESDestroy(&snes));
177*b122ec5aSJacob Faibussowitsch   CHKERRQ(PetscFinalize());
178*b122ec5aSJacob Faibussowitsch   return 0;
179c4762a1bSJed Brown }
180c4762a1bSJed Brown 
181c4762a1bSJed Brown /* ------------------------------------------------------------------- */
182c4762a1bSJed Brown 
183c4762a1bSJed Brown /*
184c4762a1bSJed Brown    FormInitialGuess - Forms initial approximation.
185c4762a1bSJed Brown 
186c4762a1bSJed Brown    Input Parameters:
187c4762a1bSJed Brown    user - user-defined application context
188c4762a1bSJed Brown    X - vector
189c4762a1bSJed Brown 
190c4762a1bSJed Brown    Output Parameter:
191c4762a1bSJed Brown    X - vector
192c4762a1bSJed Brown */
193c4762a1bSJed Brown PetscErrorCode FormInitialGuess(AppCtx *user,DM da,Vec X)
194c4762a1bSJed Brown {
195c4762a1bSJed Brown   PetscInt       i,j,mx,xs,ys,xm,ym;
196c4762a1bSJed Brown   PetscReal      grashof,dx;
197c4762a1bSJed Brown   Field          **x;
198c4762a1bSJed Brown 
199c4762a1bSJed Brown   PetscFunctionBeginUser;
200c4762a1bSJed Brown   grashof = user->grashof;
201c4762a1bSJed Brown 
2025f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAGetInfo(da,0,&mx,0,0,0,0,0,0,0,0,0,0,0));
203c4762a1bSJed Brown   dx   = 1.0/(mx-1);
204c4762a1bSJed Brown 
205c4762a1bSJed Brown   /*
206c4762a1bSJed Brown      Get local grid boundaries (for 2-dimensional DMDA):
207c4762a1bSJed Brown        xs, ys   - starting grid indices (no ghost points)
208c4762a1bSJed Brown        xm, ym   - widths of local grid (no ghost points)
209c4762a1bSJed Brown   */
2105f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAGetCorners(da,&xs,&ys,NULL,&xm,&ym,NULL));
211c4762a1bSJed Brown 
212c4762a1bSJed Brown   /*
213c4762a1bSJed Brown      Get a pointer to vector data.
214c4762a1bSJed Brown        - For default PETSc vectors, VecGetArray() returns a pointer to
215c4762a1bSJed Brown          the data array.  Otherwise, the routine is implementation dependent.
216c4762a1bSJed Brown        - You MUST call VecRestoreArray() when you no longer need access to
217c4762a1bSJed Brown          the array.
218c4762a1bSJed Brown   */
2195f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAVecGetArrayWrite(da,X,&x));
220c4762a1bSJed Brown 
221c4762a1bSJed Brown   /*
222c4762a1bSJed Brown      Compute initial guess over the locally owned part of the grid
223c4762a1bSJed Brown      Initial condition is motionless fluid and equilibrium temperature
224c4762a1bSJed Brown   */
225c4762a1bSJed Brown   for (j=ys; j<ys+ym; j++) {
226c4762a1bSJed Brown     for (i=xs; i<xs+xm; i++) {
227c4762a1bSJed Brown       x[j][i].u     = 0.0;
228c4762a1bSJed Brown       x[j][i].v     = 0.0;
229c4762a1bSJed Brown       x[j][i].omega = 0.0;
230c4762a1bSJed Brown       x[j][i].temp  = (grashof>0)*i*dx;
231c4762a1bSJed Brown     }
232c4762a1bSJed Brown   }
233c4762a1bSJed Brown 
234c4762a1bSJed Brown   /*
235c4762a1bSJed Brown      Restore vector
236c4762a1bSJed Brown   */
2375f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAVecRestoreArrayWrite(da,X,&x));
238c4762a1bSJed Brown   PetscFunctionReturn(0);
239c4762a1bSJed Brown }
240c4762a1bSJed Brown 
241c4762a1bSJed Brown PetscErrorCode FormFunctionLocal(DMDALocalInfo *info,Field **x,Field **f,void *ptr)
242c4762a1bSJed Brown {
243c4762a1bSJed Brown   AppCtx         *user = (AppCtx*)ptr;
244c4762a1bSJed Brown   PetscInt       xints,xinte,yints,yinte,i,j;
245c4762a1bSJed Brown   PetscReal      hx,hy,dhx,dhy,hxdhy,hydhx;
246c4762a1bSJed Brown   PetscReal      grashof,prandtl,lid;
247c4762a1bSJed Brown   PetscScalar    u,uxx,uyy,vx,vy,avx,avy,vxp,vxm,vyp,vym;
248c4762a1bSJed Brown 
249c4762a1bSJed Brown   PetscFunctionBeginUser;
250c4762a1bSJed Brown   grashof = user->grashof;
251c4762a1bSJed Brown   prandtl = user->prandtl;
252c4762a1bSJed Brown   lid     = user->lidvelocity;
253c4762a1bSJed Brown 
254c4762a1bSJed Brown   /*
255c4762a1bSJed Brown      Define mesh intervals ratios for uniform grid.
256c4762a1bSJed Brown 
257c4762a1bSJed Brown      Note: FD formulae below are normalized by multiplying through by
258c4762a1bSJed Brown      local volume element (i.e. hx*hy) to obtain coefficients O(1) in two dimensions.
259c4762a1bSJed Brown 
260c4762a1bSJed Brown   */
261c4762a1bSJed Brown   dhx   = (PetscReal)(info->mx-1);  dhy = (PetscReal)(info->my-1);
262c4762a1bSJed Brown   hx    = 1.0/dhx;                   hy = 1.0/dhy;
263c4762a1bSJed Brown   hxdhy = hx*dhy;                 hydhx = hy*dhx;
264c4762a1bSJed Brown 
265c4762a1bSJed Brown   xints = info->xs; xinte = info->xs+info->xm; yints = info->ys; yinte = info->ys+info->ym;
266c4762a1bSJed Brown 
267c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
268c4762a1bSJed Brown   if (yints == 0) {
269c4762a1bSJed Brown     j     = 0;
270c4762a1bSJed Brown     yints = yints + 1;
271c4762a1bSJed Brown     /* bottom edge */
272c4762a1bSJed Brown     for (i=info->xs; i<info->xs+info->xm; i++) {
273c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
274c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
275c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j+1][i].u - x[j][i].u)*dhy;
276c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp-x[j+1][i].temp;
277c4762a1bSJed Brown     }
278c4762a1bSJed Brown   }
279c4762a1bSJed Brown 
280c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
281c4762a1bSJed Brown   if (yinte == info->my) {
282c4762a1bSJed Brown     j     = info->my - 1;
283c4762a1bSJed Brown     yinte = yinte - 1;
284c4762a1bSJed Brown     /* top edge */
285c4762a1bSJed Brown     for (i=info->xs; i<info->xs+info->xm; i++) {
286c4762a1bSJed Brown       f[j][i].u     = x[j][i].u - lid;
287c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
288c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j][i].u - x[j-1][i].u)*dhy;
289c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp-x[j-1][i].temp;
290c4762a1bSJed Brown     }
291c4762a1bSJed Brown   }
292c4762a1bSJed Brown 
293c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
294c4762a1bSJed Brown   if (xints == 0) {
295c4762a1bSJed Brown     i     = 0;
296c4762a1bSJed Brown     xints = xints + 1;
297c4762a1bSJed Brown     /* left edge */
298c4762a1bSJed Brown     for (j=info->ys; j<info->ys+info->ym; j++) {
299c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
300c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
301c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i+1].v - x[j][i].v)*dhx;
302c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp;
303c4762a1bSJed Brown     }
304c4762a1bSJed Brown   }
305c4762a1bSJed Brown 
306c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
307c4762a1bSJed Brown   if (xinte == info->mx) {
308c4762a1bSJed Brown     i     = info->mx - 1;
309c4762a1bSJed Brown     xinte = xinte - 1;
310c4762a1bSJed Brown     /* right edge */
311c4762a1bSJed Brown     for (j=info->ys; j<info->ys+info->ym; j++) {
312c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
313c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
314c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i].v - x[j][i-1].v)*dhx;
315c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp - (PetscReal)(grashof>0);
316c4762a1bSJed Brown     }
317c4762a1bSJed Brown   }
318c4762a1bSJed Brown 
319c4762a1bSJed Brown   /* Compute over the interior points */
320c4762a1bSJed Brown   for (j=yints; j<yinte; j++) {
321c4762a1bSJed Brown     for (i=xints; i<xinte; i++) {
322c4762a1bSJed Brown 
323c4762a1bSJed Brown       /*
324c4762a1bSJed Brown        convective coefficients for upwinding
325c4762a1bSJed Brown       */
326c4762a1bSJed Brown       vx  = x[j][i].u; avx = PetscAbsScalar(vx);
327c4762a1bSJed Brown       vxp = .5*(vx+avx); vxm = .5*(vx-avx);
328c4762a1bSJed Brown       vy  = x[j][i].v; avy = PetscAbsScalar(vy);
329c4762a1bSJed Brown       vyp = .5*(vy+avy); vym = .5*(vy-avy);
330c4762a1bSJed Brown 
331c4762a1bSJed Brown       /* U velocity */
332c4762a1bSJed Brown       u         = x[j][i].u;
333c4762a1bSJed Brown       uxx       = (2.0*u - x[j][i-1].u - x[j][i+1].u)*hydhx;
334c4762a1bSJed Brown       uyy       = (2.0*u - x[j-1][i].u - x[j+1][i].u)*hxdhy;
335c4762a1bSJed Brown       f[j][i].u = uxx + uyy - .5*(x[j+1][i].omega-x[j-1][i].omega)*hx;
336c4762a1bSJed Brown 
337c4762a1bSJed Brown       /* V velocity */
338c4762a1bSJed Brown       u         = x[j][i].v;
339c4762a1bSJed Brown       uxx       = (2.0*u - x[j][i-1].v - x[j][i+1].v)*hydhx;
340c4762a1bSJed Brown       uyy       = (2.0*u - x[j-1][i].v - x[j+1][i].v)*hxdhy;
341c4762a1bSJed Brown       f[j][i].v = uxx + uyy + .5*(x[j][i+1].omega-x[j][i-1].omega)*hy;
342c4762a1bSJed Brown 
343c4762a1bSJed Brown       /* Omega */
344c4762a1bSJed Brown       u             = x[j][i].omega;
345c4762a1bSJed Brown       uxx           = (2.0*u - x[j][i-1].omega - x[j][i+1].omega)*hydhx;
346c4762a1bSJed Brown       uyy           = (2.0*u - x[j-1][i].omega - x[j+1][i].omega)*hxdhy;
347c4762a1bSJed Brown       f[j][i].omega = uxx + uyy + (vxp*(u - x[j][i-1].omega) + vxm*(x[j][i+1].omega - u))*hy +
348c4762a1bSJed Brown                       (vyp*(u - x[j-1][i].omega) + vym*(x[j+1][i].omega - u))*hx -
349c4762a1bSJed Brown                       .5*grashof*(x[j][i+1].temp - x[j][i-1].temp)*hy;
350c4762a1bSJed Brown 
351c4762a1bSJed Brown       /* Temperature */
352c4762a1bSJed Brown       u            = x[j][i].temp;
353c4762a1bSJed Brown       uxx          = (2.0*u - x[j][i-1].temp - x[j][i+1].temp)*hydhx;
354c4762a1bSJed Brown       uyy          = (2.0*u - x[j-1][i].temp - x[j+1][i].temp)*hxdhy;
355c4762a1bSJed Brown       f[j][i].temp =  uxx + uyy  + prandtl*((vxp*(u - x[j][i-1].temp) + vxm*(x[j][i+1].temp - u))*hy +
356c4762a1bSJed Brown                                             (vyp*(u - x[j-1][i].temp) + vym*(x[j+1][i].temp - u))*hx);
357c4762a1bSJed Brown     }
358c4762a1bSJed Brown   }
359c4762a1bSJed Brown 
360c4762a1bSJed Brown   /*
361c4762a1bSJed Brown      Flop count (multiply-adds are counted as 2 operations)
362c4762a1bSJed Brown   */
3635f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLogFlops(84.0*info->ym*info->xm));
364c4762a1bSJed Brown   PetscFunctionReturn(0);
365c4762a1bSJed Brown }
366c4762a1bSJed Brown 
367c4762a1bSJed Brown /*
368c4762a1bSJed Brown     Performs sweeps of point block nonlinear Gauss-Seidel on all the local grid points
369c4762a1bSJed Brown */
370c4762a1bSJed Brown PetscErrorCode NonlinearGS(SNES snes, Vec X, Vec B, void *ctx)
371c4762a1bSJed Brown {
372c4762a1bSJed Brown   DMDALocalInfo  info;
373c4762a1bSJed Brown   Field          **x,**b;
374c4762a1bSJed Brown   Vec            localX, localB;
375c4762a1bSJed Brown   DM             da;
376c4762a1bSJed Brown   PetscInt       xints,xinte,yints,yinte,i,j,k,l;
377c4762a1bSJed Brown   PetscInt       max_its,tot_its;
378c4762a1bSJed Brown   PetscInt       sweeps;
379c4762a1bSJed Brown   PetscReal      rtol,atol,stol;
380c4762a1bSJed Brown   PetscReal      hx,hy,dhx,dhy,hxdhy,hydhx;
381c4762a1bSJed Brown   PetscReal      grashof,prandtl,lid;
382c4762a1bSJed Brown   PetscScalar    u,uxx,uyy,vx,vy,avx,avy,vxp,vxm,vyp,vym;
383c4762a1bSJed Brown   PetscScalar    fu, fv, fomega, ftemp;
384c4762a1bSJed Brown   PetscScalar    dfudu;
385c4762a1bSJed Brown   PetscScalar    dfvdv;
386c4762a1bSJed Brown   PetscScalar    dfodu, dfodv, dfodo;
387c4762a1bSJed Brown   PetscScalar    dftdu, dftdv, dftdt;
388c4762a1bSJed Brown   PetscScalar    yu=0, yv=0, yo=0, yt=0;
389c4762a1bSJed Brown   PetscScalar    bjiu, bjiv, bjiomega, bjitemp;
390c4762a1bSJed Brown   PetscBool      ptconverged;
391c4762a1bSJed Brown   PetscReal      pfnorm,pfnorm0,pynorm,pxnorm;
392c4762a1bSJed Brown   AppCtx         *user = (AppCtx*)ctx;
393c4762a1bSJed Brown 
394c4762a1bSJed Brown   PetscFunctionBeginUser;
395c4762a1bSJed Brown   grashof = user->grashof;
396c4762a1bSJed Brown   prandtl = user->prandtl;
397c4762a1bSJed Brown   lid     = user->lidvelocity;
398c4762a1bSJed Brown   tot_its = 0;
3995f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESNGSGetTolerances(snes,&rtol,&atol,&stol,&max_its));
4005f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESNGSGetSweeps(snes,&sweeps));
4015f80ce2aSJacob Faibussowitsch   CHKERRQ(SNESGetDM(snes,(DM*)&da));
4025f80ce2aSJacob Faibussowitsch   CHKERRQ(DMGetLocalVector(da,&localX));
403c4762a1bSJed Brown   if (B) {
4045f80ce2aSJacob Faibussowitsch     CHKERRQ(DMGetLocalVector(da,&localB));
405c4762a1bSJed Brown   }
406c4762a1bSJed Brown   /*
407c4762a1bSJed Brown      Scatter ghost points to local vector, using the 2-step process
408c4762a1bSJed Brown         DMGlobalToLocalBegin(), DMGlobalToLocalEnd().
409c4762a1bSJed Brown   */
4105f80ce2aSJacob Faibussowitsch   CHKERRQ(DMGlobalToLocalBegin(da,X,INSERT_VALUES,localX));
4115f80ce2aSJacob Faibussowitsch   CHKERRQ(DMGlobalToLocalEnd(da,X,INSERT_VALUES,localX));
412c4762a1bSJed Brown   if (B) {
4135f80ce2aSJacob Faibussowitsch     CHKERRQ(DMGlobalToLocalBegin(da,B,INSERT_VALUES,localB));
4145f80ce2aSJacob Faibussowitsch     CHKERRQ(DMGlobalToLocalEnd(da,B,INSERT_VALUES,localB));
415c4762a1bSJed Brown   }
4165f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAGetLocalInfo(da,&info));
4175f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAVecGetArrayWrite(da,localX,&x));
418c4762a1bSJed Brown   if (B) {
4195f80ce2aSJacob Faibussowitsch     CHKERRQ(DMDAVecGetArrayRead(da,localB,&b));
420c4762a1bSJed Brown   }
421c4762a1bSJed Brown   /* looks like a combination of the formfunction / formjacobian routines */
422c4762a1bSJed Brown   dhx   = (PetscReal)(info.mx-1);dhy   = (PetscReal)(info.my-1);
423c4762a1bSJed Brown   hx    = 1.0/dhx;               hy    = 1.0/dhy;
424c4762a1bSJed Brown   hxdhy = hx*dhy;                hydhx = hy*dhx;
425c4762a1bSJed Brown 
426c4762a1bSJed Brown   xints = info.xs; xinte = info.xs+info.xm; yints = info.ys; yinte = info.ys+info.ym;
427c4762a1bSJed Brown 
428c4762a1bSJed Brown   /* Set the boundary conditions on the momentum equations */
429c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
430c4762a1bSJed Brown   if (yints == 0) {
431c4762a1bSJed Brown     j     = 0;
432c4762a1bSJed Brown     /* bottom edge */
433c4762a1bSJed Brown     for (i=info.xs; i<info.xs+info.xm; i++) {
434c4762a1bSJed Brown 
435c4762a1bSJed Brown       if (B) {
436c4762a1bSJed Brown         bjiu = b[j][i].u;
437c4762a1bSJed Brown         bjiv = b[j][i].v;
438c4762a1bSJed Brown       } else {
439c4762a1bSJed Brown         bjiu = 0.0;
440c4762a1bSJed Brown         bjiv = 0.0;
441c4762a1bSJed Brown       }
442c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
443c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
444c4762a1bSJed Brown     }
445c4762a1bSJed Brown   }
446c4762a1bSJed Brown 
447c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
448c4762a1bSJed Brown   if (yinte == info.my) {
449c4762a1bSJed Brown     j     = info.my - 1;
450c4762a1bSJed Brown     /* top edge */
451c4762a1bSJed Brown     for (i=info.xs; i<info.xs+info.xm; i++) {
452c4762a1bSJed Brown       if (B) {
453c4762a1bSJed Brown         bjiu = b[j][i].u;
454c4762a1bSJed Brown         bjiv = b[j][i].v;
455c4762a1bSJed Brown       } else {
456c4762a1bSJed Brown         bjiu = 0.0;
457c4762a1bSJed Brown         bjiv = 0.0;
458c4762a1bSJed Brown       }
459c4762a1bSJed Brown       x[j][i].u = lid + bjiu;
460c4762a1bSJed Brown       x[j][i].v = bjiv;
461c4762a1bSJed Brown     }
462c4762a1bSJed Brown   }
463c4762a1bSJed Brown 
464c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
465c4762a1bSJed Brown   if (xints == 0) {
466c4762a1bSJed Brown     i     = 0;
467c4762a1bSJed Brown     /* left edge */
468c4762a1bSJed Brown     for (j=info.ys; j<info.ys+info.ym; j++) {
469c4762a1bSJed Brown       if (B) {
470c4762a1bSJed Brown         bjiu = b[j][i].u;
471c4762a1bSJed Brown         bjiv = b[j][i].v;
472c4762a1bSJed Brown       } else {
473c4762a1bSJed Brown         bjiu = 0.0;
474c4762a1bSJed Brown         bjiv = 0.0;
475c4762a1bSJed Brown       }
476c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
477c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
478c4762a1bSJed Brown     }
479c4762a1bSJed Brown   }
480c4762a1bSJed Brown 
481c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
482c4762a1bSJed Brown   if (xinte == info.mx) {
483c4762a1bSJed Brown     i     = info.mx - 1;
484c4762a1bSJed Brown     /* right edge */
485c4762a1bSJed Brown     for (j=info.ys; j<info.ys+info.ym; j++) {
486c4762a1bSJed Brown       if (B) {
487c4762a1bSJed Brown         bjiu = b[j][i].u;
488c4762a1bSJed Brown         bjiv = b[j][i].v;
489c4762a1bSJed Brown       } else {
490c4762a1bSJed Brown         bjiu = 0.0;
491c4762a1bSJed Brown         bjiv = 0.0;
492c4762a1bSJed Brown       }
493c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
494c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
495c4762a1bSJed Brown     }
496c4762a1bSJed Brown   }
497c4762a1bSJed Brown 
498c4762a1bSJed Brown   for (k=0; k < sweeps; k++) {
499c4762a1bSJed Brown     for (j=info.ys; j<info.ys + info.ym; j++) {
500c4762a1bSJed Brown       for (i=info.xs; i<info.xs + info.xm; i++) {
501c4762a1bSJed Brown         ptconverged = PETSC_FALSE;
502c4762a1bSJed Brown         pfnorm0     = 0.0;
503c4762a1bSJed Brown         fu          = 0.0;
504c4762a1bSJed Brown         fv          = 0.0;
505c4762a1bSJed Brown         fomega      = 0.0;
506c4762a1bSJed Brown         ftemp       = 0.0;
507c4762a1bSJed Brown         /*  Run Newton's method on a single grid point */
508c4762a1bSJed Brown         for (l = 0; l < max_its && !ptconverged; l++) {
509c4762a1bSJed Brown           if (B) {
510c4762a1bSJed Brown             bjiu     = b[j][i].u;
511c4762a1bSJed Brown             bjiv     = b[j][i].v;
512c4762a1bSJed Brown             bjiomega = b[j][i].omega;
513c4762a1bSJed Brown             bjitemp  = b[j][i].temp;
514c4762a1bSJed Brown           } else {
515c4762a1bSJed Brown             bjiu     = 0.0;
516c4762a1bSJed Brown             bjiv     = 0.0;
517c4762a1bSJed Brown             bjiomega = 0.0;
518c4762a1bSJed Brown             bjitemp  = 0.0;
519c4762a1bSJed Brown           }
520c4762a1bSJed Brown 
521c4762a1bSJed Brown           if (i != 0 && i != info.mx - 1 && j != 0 && j != info.my-1) {
522c4762a1bSJed Brown             /* U velocity */
523c4762a1bSJed Brown             u     = x[j][i].u;
524c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].u - x[j][i+1].u)*hydhx;
525c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].u - x[j+1][i].u)*hxdhy;
526c4762a1bSJed Brown             fu    = uxx + uyy - .5*(x[j+1][i].omega-x[j-1][i].omega)*hx - bjiu;
527c4762a1bSJed Brown             dfudu = 2.0*(hydhx + hxdhy);
528c4762a1bSJed Brown             /* V velocity */
529c4762a1bSJed Brown             u     = x[j][i].v;
530c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].v - x[j][i+1].v)*hydhx;
531c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].v - x[j+1][i].v)*hxdhy;
532c4762a1bSJed Brown             fv    = uxx + uyy + .5*(x[j][i+1].omega-x[j][i-1].omega)*hy - bjiv;
533c4762a1bSJed Brown             dfvdv = 2.0*(hydhx + hxdhy);
534c4762a1bSJed Brown             /*
535c4762a1bSJed Brown              convective coefficients for upwinding
536c4762a1bSJed Brown              */
537c4762a1bSJed Brown             vx  = x[j][i].u; avx = PetscAbsScalar(vx);
538c4762a1bSJed Brown             vxp = .5*(vx+avx); vxm = .5*(vx-avx);
539c4762a1bSJed Brown             vy  = x[j][i].v; avy = PetscAbsScalar(vy);
540c4762a1bSJed Brown             vyp = .5*(vy+avy); vym = .5*(vy-avy);
541c4762a1bSJed Brown             /* Omega */
542c4762a1bSJed Brown             u      = x[j][i].omega;
543c4762a1bSJed Brown             uxx    = (2.0*u - x[j][i-1].omega - x[j][i+1].omega)*hydhx;
544c4762a1bSJed Brown             uyy    = (2.0*u - x[j-1][i].omega - x[j+1][i].omega)*hxdhy;
545c4762a1bSJed Brown             fomega = uxx + uyy +  (vxp*(u - x[j][i-1].omega) + vxm*(x[j][i+1].omega - u))*hy +
546c4762a1bSJed Brown                      (vyp*(u - x[j-1][i].omega) + vym*(x[j+1][i].omega - u))*hx -
547c4762a1bSJed Brown                      .5*grashof*(x[j][i+1].temp - x[j][i-1].temp)*hy - bjiomega;
548c4762a1bSJed Brown             /* convective coefficient derivatives */
549c4762a1bSJed Brown             dfodo = 2.0*(hydhx + hxdhy) + ((vxp - vxm)*hy + (vyp - vym)*hx);
550c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dfodu = (u - x[j][i-1].omega)*hy;
551c4762a1bSJed Brown             else dfodu = (x[j][i+1].omega - u)*hy;
552c4762a1bSJed Brown 
553c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dfodv = (u - x[j-1][i].omega)*hx;
554c4762a1bSJed Brown             else dfodv = (x[j+1][i].omega - u)*hx;
555c4762a1bSJed Brown 
556c4762a1bSJed Brown             /* Temperature */
557c4762a1bSJed Brown             u     = x[j][i].temp;
558c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].temp - x[j][i+1].temp)*hydhx;
559c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].temp - x[j+1][i].temp)*hxdhy;
560c4762a1bSJed Brown             ftemp =  uxx + uyy  + prandtl*((vxp*(u - x[j][i-1].temp) + vxm*(x[j][i+1].temp - u))*hy + (vyp*(u - x[j-1][i].temp) + vym*(x[j+1][i].temp - u))*hx) - bjitemp;
561c4762a1bSJed Brown             dftdt = 2.0*(hydhx + hxdhy) + prandtl*((vxp - vxm)*hy + (vyp - vym)*hx);
562c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dftdu = prandtl*(u - x[j][i-1].temp)*hy;
563c4762a1bSJed Brown             else dftdu = prandtl*(x[j][i+1].temp - u)*hy;
564c4762a1bSJed Brown 
565c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dftdv = prandtl*(u - x[j-1][i].temp)*hx;
566c4762a1bSJed Brown             else dftdv = prandtl*(x[j+1][i].temp - u)*hx;
567c4762a1bSJed Brown 
568c4762a1bSJed Brown             /* invert the system:
569c4762a1bSJed Brown              [ dfu / du     0        0        0    ][yu] = [fu]
570c4762a1bSJed Brown              [     0    dfv / dv     0        0    ][yv]   [fv]
571c4762a1bSJed Brown              [ dfo / du dfo / dv dfo / do     0    ][yo]   [fo]
572c4762a1bSJed Brown              [ dft / du dft / dv     0    dft / dt ][yt]   [ft]
573c4762a1bSJed Brown              by simple back-substitution
574c4762a1bSJed Brown            */
575c4762a1bSJed Brown             yu = fu / dfudu;
576c4762a1bSJed Brown             yv = fv / dfvdv;
577c4762a1bSJed Brown             yo = (fomega - (dfodu*yu + dfodv*yv)) / dfodo;
578c4762a1bSJed Brown             yt = (ftemp - (dftdu*yu + dftdv*yv)) / dftdt;
579c4762a1bSJed Brown 
580c4762a1bSJed Brown             x[j][i].u     = x[j][i].u - yu;
581c4762a1bSJed Brown             x[j][i].v     = x[j][i].v - yv;
582c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - yt;
583c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - yo;
584c4762a1bSJed Brown           }
585c4762a1bSJed Brown           if (i == 0) {
586c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i+1].v - x[j][i].v)*dhx - bjiomega;
587c4762a1bSJed Brown             ftemp         = x[j][i].temp - bjitemp;
588c4762a1bSJed Brown             yo            = fomega;
589c4762a1bSJed Brown             yt            = ftemp;
590c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
591c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
592c4762a1bSJed Brown           }
593c4762a1bSJed Brown           if (i == info.mx - 1) {
594c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i].v - x[j][i-1].v)*dhx - bjiomega;
595c4762a1bSJed Brown             ftemp         = x[j][i].temp - (PetscReal)(grashof>0) - bjitemp;
596c4762a1bSJed Brown             yo            = fomega;
597c4762a1bSJed Brown             yt            = ftemp;
598c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
599c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
600c4762a1bSJed Brown           }
601c4762a1bSJed Brown           if (j == 0) {
602c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j+1][i].u - x[j][i].u)*dhy - bjiomega;
603c4762a1bSJed Brown             ftemp         = x[j][i].temp-x[j+1][i].temp - bjitemp;
604c4762a1bSJed Brown             yo            = fomega;
605c4762a1bSJed Brown             yt            = ftemp;
606c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
607c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
608c4762a1bSJed Brown           }
609c4762a1bSJed Brown           if (j == info.my - 1) {
610c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j][i].u - x[j-1][i].u)*dhy - bjiomega;
611c4762a1bSJed Brown             ftemp         = x[j][i].temp-x[j-1][i].temp - bjitemp;
612c4762a1bSJed Brown             yo            = fomega;
613c4762a1bSJed Brown             yt            = ftemp;
614c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
615c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
616c4762a1bSJed Brown           }
617c4762a1bSJed Brown           tot_its++;
618c4762a1bSJed Brown           pfnorm = PetscRealPart(fu*fu + fv*fv + fomega*fomega + ftemp*ftemp);
619c4762a1bSJed Brown           pfnorm = PetscSqrtReal(pfnorm);
620c4762a1bSJed Brown           pynorm = PetscRealPart(yu*yu + yv*yv + yo*yo + yt*yt);
621c4762a1bSJed Brown           pynorm = PetscSqrtReal(pynorm);
622c4762a1bSJed Brown           pxnorm = PetscRealPart(x[j][i].u*x[j][i].u + x[j][i].v*x[j][i].v + x[j][i].omega*x[j][i].omega + x[j][i].temp*x[j][i].temp);
623c4762a1bSJed Brown           pxnorm = PetscSqrtReal(pxnorm);
624c4762a1bSJed Brown           if (l == 0) pfnorm0 = pfnorm;
625c4762a1bSJed Brown           if (rtol*pfnorm0 >pfnorm || atol > pfnorm || pxnorm*stol > pynorm) ptconverged = PETSC_TRUE;
626c4762a1bSJed Brown         }
627c4762a1bSJed Brown       }
628c4762a1bSJed Brown     }
629c4762a1bSJed Brown   }
6305f80ce2aSJacob Faibussowitsch   CHKERRQ(DMDAVecRestoreArrayWrite(da,localX,&x));
631c4762a1bSJed Brown   if (B) {
6325f80ce2aSJacob Faibussowitsch     CHKERRQ(DMDAVecRestoreArrayRead(da,localB,&b));
633c4762a1bSJed Brown   }
6345f80ce2aSJacob Faibussowitsch   CHKERRQ(DMLocalToGlobalBegin(da,localX,INSERT_VALUES,X));
6355f80ce2aSJacob Faibussowitsch   CHKERRQ(DMLocalToGlobalEnd(da,localX,INSERT_VALUES,X));
6365f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLogFlops(tot_its*(84.0 + 41.0 + 26.0)));
6375f80ce2aSJacob Faibussowitsch   CHKERRQ(DMRestoreLocalVector(da,&localX));
638c4762a1bSJed Brown   if (B) {
6395f80ce2aSJacob Faibussowitsch     CHKERRQ(DMRestoreLocalVector(da,&localB));
640c4762a1bSJed Brown   }
641c4762a1bSJed Brown   PetscFunctionReturn(0);
642c4762a1bSJed Brown }
643c4762a1bSJed Brown 
644c4762a1bSJed Brown /*TEST
645c4762a1bSJed Brown 
646c4762a1bSJed Brown    test:
647c4762a1bSJed Brown       nsize: 2
648c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full
649c4762a1bSJed Brown       requires: !single
650c4762a1bSJed Brown 
651c4762a1bSJed Brown    test:
652c4762a1bSJed Brown       suffix: 10
653c4762a1bSJed Brown       nsize: 3
654c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type symmetric_multiplicative -snes_view -da_refine 1 -ksp_type fgmres
655c4762a1bSJed Brown       requires: !single
656c4762a1bSJed Brown 
657c4762a1bSJed Brown    test:
658c4762a1bSJed Brown       suffix: 11
659c4762a1bSJed Brown       nsize: 4
660c4762a1bSJed Brown       requires: pastix
661c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 2 -da_refine 4 -ksp_type fgmres
662c4762a1bSJed Brown 
663c4762a1bSJed Brown    test:
664c4762a1bSJed Brown       suffix: 12
665c4762a1bSJed Brown       nsize: 12
666c4762a1bSJed Brown       requires: pastix
667c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 5 -da_refine 4 -ksp_type fgmres
668c4762a1bSJed Brown 
669c4762a1bSJed Brown    test:
670c4762a1bSJed Brown       suffix: 13
671c4762a1bSJed Brown       nsize: 3
672c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres -snes_mf_operator
673c4762a1bSJed Brown       requires: !single
674c4762a1bSJed Brown 
675c4762a1bSJed Brown    test:
676c4762a1bSJed Brown       suffix: 14
677c4762a1bSJed Brown       nsize: 4
678c4762a1bSJed Brown       args: -snes_monitor_short -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres
679c4762a1bSJed Brown       requires: !single
680c4762a1bSJed Brown 
681c4762a1bSJed Brown    test:
682c4762a1bSJed Brown       suffix: 14_ds
683c4762a1bSJed Brown       nsize: 4
684c4762a1bSJed Brown       args: -snes_converged_reason -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres -mat_fd_type ds
685c4762a1bSJed Brown       output_file: output/ex19_2.out
686c4762a1bSJed Brown       requires: !single
687c4762a1bSJed Brown 
688c4762a1bSJed Brown    test:
689c4762a1bSJed Brown       suffix: 17
690c4762a1bSJed Brown       args: -snes_monitor_short -ksp_pc_side right
691c4762a1bSJed Brown       requires: !single
692c4762a1bSJed Brown 
693c4762a1bSJed Brown    test:
694c4762a1bSJed Brown       suffix: 18
695798534f6SMatthew G. Knepley       args: -snes_monitor_ksp draw::draw_lg -ksp_pc_side right
696c4762a1bSJed Brown       requires: x !single
697c4762a1bSJed Brown 
698c4762a1bSJed Brown    test:
69941ba4c6cSHeeho Park       suffix: 19
70041ba4c6cSHeeho Park       nsize: 2
70141ba4c6cSHeeho Park       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -snes_type newtontrdc
70241ba4c6cSHeeho Park       requires: !single
70341ba4c6cSHeeho Park 
70441ba4c6cSHeeho Park    test:
70541ba4c6cSHeeho Park       suffix: 20
70641ba4c6cSHeeho Park       nsize: 2
70741ba4c6cSHeeho Park       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -snes_type newtontrdc -snes_trdc_use_cauchy false
70841ba4c6cSHeeho Park       requires: !single
70941ba4c6cSHeeho Park 
71041ba4c6cSHeeho Park    test:
711c4762a1bSJed Brown       suffix: 2
712c4762a1bSJed Brown       nsize: 4
713c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
714c4762a1bSJed Brown       requires: !single
715c4762a1bSJed Brown 
716c4762a1bSJed Brown    test:
717c4762a1bSJed Brown       suffix: 2_bcols1
718c4762a1bSJed Brown       nsize: 4
719c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols 1
720c4762a1bSJed Brown       output_file: output/ex19_2.out
721c4762a1bSJed Brown       requires: !single
722c4762a1bSJed Brown 
723c4762a1bSJed Brown    test:
724c4762a1bSJed Brown       suffix: 3
725c4762a1bSJed Brown       nsize: 4
726c4762a1bSJed Brown       requires: mumps
727c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 2
728c4762a1bSJed Brown 
729c4762a1bSJed Brown    test:
730c4762a1bSJed Brown       suffix: 4
731c4762a1bSJed Brown       nsize: 12
732c4762a1bSJed Brown       requires: mumps
733c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 5
734c4762a1bSJed Brown       output_file: output/ex19_3.out
735c4762a1bSJed Brown 
736c4762a1bSJed Brown    test:
737c4762a1bSJed Brown       suffix: 6
738c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -ksp_type fgmres -da_refine 1
739c4762a1bSJed Brown       requires: !single
740c4762a1bSJed Brown 
741c4762a1bSJed Brown    test:
742c4762a1bSJed Brown       suffix: 7
743c4762a1bSJed Brown       nsize: 3
744c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -da_refine 1 -ksp_type fgmres
745c4762a1bSJed Brown       requires: !single
746c4762a1bSJed Brown 
747c4762a1bSJed Brown    test:
748c4762a1bSJed Brown       suffix: 8
749c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_block_size 2 -pc_fieldsplit_0_fields 0,1 -pc_fieldsplit_1_fields 0,1 -pc_fieldsplit_type multiplicative -snes_view -fieldsplit_pc_type lu -da_refine 1 -ksp_type fgmres
750c4762a1bSJed Brown       requires: !single
751c4762a1bSJed Brown 
752c4762a1bSJed Brown    test:
753c4762a1bSJed Brown       suffix: 9
754c4762a1bSJed Brown       nsize: 3
755c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres
756c4762a1bSJed Brown       requires: !single
757c4762a1bSJed Brown 
758c4762a1bSJed Brown    test:
759c4762a1bSJed Brown       suffix: aspin
760c4762a1bSJed Brown       nsize: 4
761c4762a1bSJed Brown       args: -da_refine 3 -da_overlap 2 -snes_monitor_short -snes_type aspin -grashof 4e4 -lidvelocity 100 -ksp_monitor_short
762c4762a1bSJed Brown       requires: !single
763c4762a1bSJed Brown 
764c4762a1bSJed Brown    test:
765c4762a1bSJed Brown       suffix: bcgsl
766c4762a1bSJed Brown       nsize: 2
767c4762a1bSJed Brown       args: -ksp_type bcgsl -ksp_monitor_short -da_refine 2 -ksp_bcgsl_ell 3 -snes_view
768c4762a1bSJed Brown       requires: !single
769c4762a1bSJed Brown 
770c4762a1bSJed Brown    test:
771c4762a1bSJed Brown       suffix: bcols1
772c4762a1bSJed Brown       nsize: 2
773c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -mat_fd_coloring_bcols 1
774c4762a1bSJed Brown       output_file: output/ex19_1.out
775c4762a1bSJed Brown       requires: !single
776c4762a1bSJed Brown 
777c4762a1bSJed Brown    test:
778c4762a1bSJed Brown       suffix: bjacobi
779c4762a1bSJed Brown       nsize: 4
780c4762a1bSJed Brown       args: -da_refine 4 -ksp_type fgmres -pc_type bjacobi -pc_bjacobi_blocks 2 -sub_ksp_type gmres -sub_ksp_max_it 2 -sub_pc_type bjacobi -sub_sub_ksp_type preonly -sub_sub_pc_type ilu -snes_monitor_short
781c4762a1bSJed Brown       requires: !single
782c4762a1bSJed Brown 
783c4762a1bSJed Brown    test:
784c4762a1bSJed Brown       suffix: cgne
785c4762a1bSJed Brown       args: -da_refine 2 -pc_type lu -ksp_type cgne -ksp_monitor_short -ksp_converged_reason -ksp_view -ksp_norm_type unpreconditioned
786c4762a1bSJed Brown       filter: grep -v HERMITIAN
787c4762a1bSJed Brown       requires: !single
788c4762a1bSJed Brown 
789c4762a1bSJed Brown    test:
790c4762a1bSJed Brown       suffix: cgs
791c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type cgs
792c4762a1bSJed Brown       requires: !single
793c4762a1bSJed Brown 
794c4762a1bSJed Brown    test:
795c4762a1bSJed Brown       suffix: composite_fieldsplit
796c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,none -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
797c4762a1bSJed Brown       requires: !single
798c4762a1bSJed Brown 
799c4762a1bSJed Brown    test:
800c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi
801c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
802c4762a1bSJed Brown       requires: !single
803c4762a1bSJed Brown 
804c4762a1bSJed Brown    test:
805c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi_2
806c4762a1bSJed Brown       nsize: 4
807c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
808c4762a1bSJed Brown       requires: !single
809c4762a1bSJed Brown 
810c4762a1bSJed Brown    test:
811c4762a1bSJed Brown       suffix: composite_gs_newton
812c4762a1bSJed Brown       nsize: 2
813c4762a1bSJed Brown       args: -da_refine 3 -grashof 4e4 -lidvelocity 100 -snes_monitor_short -snes_type composite -snes_composite_type additiveoptimal -snes_composite_sneses ngs,newtonls -sub_0_snes_max_it 20 -sub_1_pc_type mg
814c4762a1bSJed Brown       requires: !single
815c4762a1bSJed Brown 
816c4762a1bSJed Brown    test:
817c4762a1bSJed Brown       suffix: cuda
818c4762a1bSJed Brown       requires: cuda !single
819c4762a1bSJed Brown       args: -dm_vec_type cuda -dm_mat_type aijcusparse -pc_type none -ksp_type fgmres -snes_monitor_short -snes_rtol 1.e-5
820c4762a1bSJed Brown 
821c4762a1bSJed Brown    test:
822c4762a1bSJed Brown       suffix: draw
823c4762a1bSJed Brown       args: -pc_type fieldsplit -snes_view draw -fieldsplit_x_velocity_pc_type mg -fieldsplit_x_velocity_pc_mg_galerkin pmat -fieldsplit_x_velocity_pc_mg_levels 2 -da_refine 1 -fieldsplit_x_velocity_mg_coarse_pc_type svd
824c4762a1bSJed Brown       requires: x !single
825c4762a1bSJed Brown 
826c4762a1bSJed Brown    test:
827c4762a1bSJed Brown       suffix: drawports
828c4762a1bSJed Brown       args: -snes_monitor_solution draw::draw_ports -da_refine 1
829c4762a1bSJed Brown       output_file: output/ex19_draw.out
830c4762a1bSJed Brown       requires: x !single
831c4762a1bSJed Brown 
832c4762a1bSJed Brown    test:
833c4762a1bSJed Brown       suffix: fas
834c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
835c4762a1bSJed Brown       requires: !single
836c4762a1bSJed Brown 
837c4762a1bSJed Brown    test:
838c4762a1bSJed Brown       suffix: fas_full
839c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -snes_fas_type full -snes_fas_full_downsweep -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
840c4762a1bSJed Brown       requires: !single
841c4762a1bSJed Brown 
842c4762a1bSJed Brown    test:
843c4762a1bSJed Brown       suffix: fdcoloring_ds
844c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
845c4762a1bSJed Brown       output_file: output/ex19_2.out
846c4762a1bSJed Brown       requires: !single
847c4762a1bSJed Brown 
848c4762a1bSJed Brown    test:
849c4762a1bSJed Brown       suffix: fdcoloring_ds_baij
850c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -dm_mat_type baij
851c4762a1bSJed Brown       output_file: output/ex19_2.out
852c4762a1bSJed Brown       requires: !single
853c4762a1bSJed Brown 
854c4762a1bSJed Brown    test:
855c4762a1bSJed Brown       suffix: fdcoloring_ds_bcols1
856c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols 1
857c4762a1bSJed Brown       output_file: output/ex19_2.out
858c4762a1bSJed Brown       requires: !single
859c4762a1bSJed Brown 
860c4762a1bSJed Brown    test:
861c4762a1bSJed Brown       suffix: fdcoloring_wp
862c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg
863c4762a1bSJed Brown       requires: !single
864c4762a1bSJed Brown 
865c4762a1bSJed Brown    test:
866c4762a1bSJed Brown       suffix: fdcoloring_wp_baij
867c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -dm_mat_type baij
868c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
869c4762a1bSJed Brown       requires: !single
870c4762a1bSJed Brown 
871c4762a1bSJed Brown    test:
872c4762a1bSJed Brown       suffix: fdcoloring_wp_bcols1
873c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -mat_fd_coloring_bcols 1
874c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
875c4762a1bSJed Brown       requires: !single
876c4762a1bSJed Brown 
877c4762a1bSJed Brown    test:
878c4762a1bSJed Brown       suffix: fieldsplit_2
879c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
880c4762a1bSJed Brown       requires: !single
881c4762a1bSJed Brown 
882c4762a1bSJed Brown    test:
883c4762a1bSJed Brown       suffix: fieldsplit_3
884c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
885c4762a1bSJed Brown       requires: !single
886c4762a1bSJed Brown 
887c4762a1bSJed Brown    test:
888c4762a1bSJed Brown       suffix: fieldsplit_4
889c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
890c4762a1bSJed Brown       requires: !single
891c4762a1bSJed Brown 
892c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
893c4762a1bSJed Brown    test:
894c4762a1bSJed Brown       suffix: fieldsplit_hypre
895c4762a1bSJed Brown       nsize: 2
896263f2b91SStefano Zampini       requires: hypre mumps !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
897c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_type hypre -fieldsplit_1_pc_hypre_type boomeramg -snes_monitor_short -ksp_monitor_short
898c4762a1bSJed Brown 
899c4762a1bSJed Brown    test:
900c4762a1bSJed Brown       suffix: fieldsplit_mumps
901c4762a1bSJed Brown       nsize: 2
902c4762a1bSJed Brown       requires: mumps
903c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_factor_mat_solver_type mumps
904c4762a1bSJed Brown       output_file: output/ex19_fieldsplit_5.out
905c4762a1bSJed Brown 
906c4762a1bSJed Brown    test:
907c4762a1bSJed Brown       suffix: greedy_coloring
908c4762a1bSJed Brown       nsize: 2
909c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_fd_color -snes_fd_color_use_mat -mat_coloring_type greedy -mat_coloring_weight_type lf -mat_coloring_view> ex19_greedy_coloring.tmp 2>&1
910c4762a1bSJed Brown       requires: !single
911c4762a1bSJed Brown 
912c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
913c4762a1bSJed Brown    test:
914c4762a1bSJed Brown       suffix: hypre
915c4762a1bSJed Brown       nsize: 2
916263f2b91SStefano Zampini       requires: hypre !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
917263f2b91SStefano Zampini       args: -da_refine 3 -snes_monitor_short -pc_type hypre -ksp_norm_type unpreconditioned
918c4762a1bSJed Brown 
919263f2b91SStefano Zampini    # ibcgs is broken when using device vectors
920c4762a1bSJed Brown    test:
921c4762a1bSJed Brown       suffix: ibcgs
922c4762a1bSJed Brown       nsize: 2
923c4762a1bSJed Brown       args: -ksp_type ibcgs -ksp_monitor_short -da_refine 2 -snes_view
924c4762a1bSJed Brown       requires: !complex !single
925c4762a1bSJed Brown 
926c4762a1bSJed Brown    test:
927c4762a1bSJed Brown       suffix: kaczmarz
928c4762a1bSJed Brown       nsize: 2
929c4762a1bSJed Brown       args: -pc_type kaczmarz -ksp_monitor_short -snes_monitor_short -snes_view
930c4762a1bSJed Brown       requires: !single
931c4762a1bSJed Brown 
932c4762a1bSJed Brown    test:
933c4762a1bSJed Brown       suffix: klu
934c4762a1bSJed Brown       requires: suitesparse
935c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu
936c4762a1bSJed Brown       output_file: output/ex19_superlu.out
937c4762a1bSJed Brown 
938c4762a1bSJed Brown    test:
939c4762a1bSJed Brown       suffix: klu_2
940c4762a1bSJed Brown       requires: suitesparse
9414ac6704cSBarry Smith       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -pc_factor_mat_ordering_type nd
942c4762a1bSJed Brown       output_file: output/ex19_superlu.out
943c4762a1bSJed Brown 
944c4762a1bSJed Brown    test:
945c4762a1bSJed Brown       suffix: klu_3
946c4762a1bSJed Brown       requires: suitesparse
947c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -mat_klu_use_btf 0
948c4762a1bSJed Brown       output_file: output/ex19_superlu.out
949c4762a1bSJed Brown 
950c4762a1bSJed Brown    test:
951c4762a1bSJed Brown       suffix: ml
952c4762a1bSJed Brown       nsize: 2
953c4762a1bSJed Brown       requires: ml
954c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type ml
955c4762a1bSJed Brown 
956c4762a1bSJed Brown    test:
957c4762a1bSJed Brown       suffix: ngmres_fas
958c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type ngmres -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_ngs_sweeps 3 -npc_fas_levels_snes_ngs_atol 0.0 -npc_fas_levels_snes_ngs_stol 0.0 -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_snes_max_it 1 -npc_snes_fas_smoothup 6 -npc_snes_fas_smoothdown 6 -lidvelocity 100 -grashof 4e4
959c4762a1bSJed Brown       requires: !single
960c4762a1bSJed Brown 
961c4762a1bSJed Brown    test:
962c4762a1bSJed Brown       suffix: ngmres_fas_gssecant
963c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_type ngmres -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_max_it 6 -npc_fas_levels_snes_ngs_secant -npc_fas_levels_snes_ngs_max_it 1 -npc_fas_coarse_snes_max_it 1 -lidvelocity 100 -grashof 4e4
964c4762a1bSJed Brown       requires: !single
965c4762a1bSJed Brown 
966c4762a1bSJed Brown    test:
967c4762a1bSJed Brown       suffix: ngmres_fas_ms
968c4762a1bSJed Brown       nsize: 2
969c4762a1bSJed Brown       args: -snes_grid_sequence 2 -lidvelocity 200 -grashof 1e4 -snes_monitor_short -snes_view -snes_converged_reason -snes_type ngmres -npc_snes_type fas -npc_fas_coarse_snes_type newtonls -npc_fas_coarse_ksp_type preonly -npc_snes_max_it 1
970c4762a1bSJed Brown       requires: !single
971c4762a1bSJed Brown 
972c4762a1bSJed Brown    test:
973c4762a1bSJed Brown       suffix: ngmres_nasm
974c4762a1bSJed Brown       nsize: 4
975c4762a1bSJed Brown       args: -da_refine 4 -da_overlap 2 -snes_monitor_short -snes_type ngmres -snes_max_it 10 -npc_snes_type nasm -npc_snes_nasm_type basic -grashof 4e4 -lidvelocity 100
976c4762a1bSJed Brown       requires: !single
977c4762a1bSJed Brown 
978c4762a1bSJed Brown    test:
979c4762a1bSJed Brown       suffix: ngs
980c4762a1bSJed Brown       args: -snes_type ngs -snes_view -snes_monitor -snes_rtol 1e-4
981c4762a1bSJed Brown       requires: !single
982c4762a1bSJed Brown 
983c4762a1bSJed Brown    test:
984c4762a1bSJed Brown       suffix: ngs_fd
985c4762a1bSJed Brown       args: -snes_type ngs -snes_ngs_secant -snes_view -snes_monitor -snes_rtol 1e-4
986c4762a1bSJed Brown       requires: !single
987c4762a1bSJed Brown 
988c4762a1bSJed Brown    test:
989c4762a1bSJed Brown       suffix: parms
990c4762a1bSJed Brown       nsize: 2
991c4762a1bSJed Brown       requires: parms
992c4762a1bSJed Brown       args: -pc_type parms -ksp_monitor_short -snes_view
993c4762a1bSJed Brown 
994c4762a1bSJed Brown    test:
995c4762a1bSJed Brown       suffix: superlu
996c4762a1bSJed Brown       requires: superlu
997c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu
998c4762a1bSJed Brown 
999c4762a1bSJed Brown    test:
1000c4762a1bSJed Brown       suffix: superlu_sell
1001c4762a1bSJed Brown       requires: superlu
1002c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu -dm_mat_type sell -pc_factor_mat_ordering_type natural
1003c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1004c4762a1bSJed Brown 
1005c4762a1bSJed Brown    test:
1006c4762a1bSJed Brown       suffix: superlu_dist
1007c4762a1bSJed Brown       requires: superlu_dist
1008c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1009c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1010c4762a1bSJed Brown 
1011c4762a1bSJed Brown    test:
1012c4762a1bSJed Brown       suffix: superlu_dist_2
1013c4762a1bSJed Brown       nsize: 2
1014c4762a1bSJed Brown       requires: superlu_dist
1015c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1016c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1017c4762a1bSJed Brown 
1018c4762a1bSJed Brown    test:
10193e558968SBarry Smith       suffix: superlu_dist_3d
10203e558968SBarry Smith       nsize: 4
10213e558968SBarry Smith       requires: superlu_dist !defined(PETSCTEST_VALGRIND)
10223e558968SBarry Smith       filter: grep -v iam | grep -v openMP
10233e558968SBarry Smith       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist -mat_superlu_dist_3d -mat_superlu_dist_d 2 -snes_view -snes_monitor -ksp_monitor
10243e558968SBarry Smith 
10253e558968SBarry Smith    test:
1026c4762a1bSJed Brown       suffix: superlu_equil
1027c4762a1bSJed Brown       requires: superlu
1028c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil
1029c4762a1bSJed Brown 
1030c4762a1bSJed Brown    test:
1031c4762a1bSJed Brown       suffix: superlu_equil_sell
1032c4762a1bSJed Brown       requires: superlu
1033c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil -dm_mat_type sell -pc_factor_mat_ordering_type natural
1034c4762a1bSJed Brown       output_file: output/ex19_superlu_equil.out
1035c4762a1bSJed Brown 
1036c4762a1bSJed Brown    test:
1037c4762a1bSJed Brown       suffix: tcqmr
1038c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tcqmr
1039c4762a1bSJed Brown       requires: !single
1040c4762a1bSJed Brown 
1041c4762a1bSJed Brown    test:
1042c4762a1bSJed Brown       suffix: tfqmr
1043c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tfqmr
1044c4762a1bSJed Brown       requires: !single
1045c4762a1bSJed Brown 
1046c4762a1bSJed Brown    test:
1047c4762a1bSJed Brown       suffix: umfpack
1048c4762a1bSJed Brown       requires: suitesparse
10492c7c0729SBarry Smith       args: -da_refine 2 -pc_type lu -pc_factor_mat_solver_type umfpack -snes_view -snes_monitor_short -ksp_monitor_short -pc_factor_mat_ordering_type external
1050c4762a1bSJed Brown 
1051c4762a1bSJed Brown    test:
1052c4762a1bSJed Brown       suffix: tut_1
1053c4762a1bSJed Brown       nsize: 4
1054c4762a1bSJed Brown       requires: !single
1055c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view
1056c4762a1bSJed Brown 
1057c4762a1bSJed Brown    test:
1058c4762a1bSJed Brown       suffix: tut_2
1059c4762a1bSJed Brown       nsize: 4
1060c4762a1bSJed Brown       requires: !single
1061c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type mg
1062c4762a1bSJed Brown 
1063c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
1064c4762a1bSJed Brown    test:
1065c4762a1bSJed Brown       suffix: tut_3
1066c4762a1bSJed Brown       nsize: 4
1067263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_DEVICE)
1068c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type hypre
1069c4762a1bSJed Brown 
1070c4762a1bSJed Brown    test:
1071c4762a1bSJed Brown       suffix: tut_8
1072c4762a1bSJed Brown       nsize: 4
1073c4762a1bSJed Brown       requires: ml !single
1074c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type ml
1075c4762a1bSJed Brown 
1076c4762a1bSJed Brown    test:
1077c4762a1bSJed Brown       suffix: tut_4
1078c4762a1bSJed Brown       nsize: 1
1079c4762a1bSJed Brown       requires: !single
1080c4762a1bSJed Brown       args: -da_refine 5 -log_view
1081c4762a1bSJed Brown       filter: head -n 2
1082c4762a1bSJed Brown       filter_output: head -n 2
1083c4762a1bSJed Brown 
1084c4762a1bSJed Brown    test:
1085c4762a1bSJed Brown       suffix: tut_5
1086c4762a1bSJed Brown       nsize: 1
1087c4762a1bSJed Brown       requires: !single
1088c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1089c4762a1bSJed Brown       filter: head -n 2
1090c4762a1bSJed Brown       filter_output: head -n 2
1091c4762a1bSJed Brown 
1092c4762a1bSJed Brown    test:
1093c4762a1bSJed Brown       suffix: tut_6
1094c4762a1bSJed Brown       nsize: 4
1095c4762a1bSJed Brown       requires: !single
1096c4762a1bSJed Brown       args: -da_refine 5 -log_view
1097c4762a1bSJed Brown       filter: head -n 2
1098c4762a1bSJed Brown       filter_output: head -n 2
1099c4762a1bSJed Brown 
1100c4762a1bSJed Brown    test:
1101c4762a1bSJed Brown       suffix: tut_7
1102c4762a1bSJed Brown       nsize: 4
1103c4762a1bSJed Brown       requires: !single
1104c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1105c4762a1bSJed Brown       filter: head -n 2
1106c4762a1bSJed Brown       filter_output: head -n 2
1107c4762a1bSJed Brown 
1108c4762a1bSJed Brown    test:
1109c4762a1bSJed Brown       suffix: cuda_1
1110c4762a1bSJed Brown       nsize: 1
1111c4762a1bSJed Brown       requires: cuda
111273f7197eSJed Brown       args: -snes_monitor -dm_mat_type seqaijcusparse -dm_vec_type seqcuda -pc_type gamg -pc_gamg_esteig_ksp_max_it 10 -ksp_monitor -mg_levels_ksp_max_it 3
1113c4762a1bSJed Brown 
1114c4762a1bSJed Brown    test:
1115c4762a1bSJed Brown       suffix: cuda_2
1116c4762a1bSJed Brown       nsize: 3
1117c4762a1bSJed Brown       requires: cuda !single
111873f7197eSJed Brown       args: -snes_monitor -dm_mat_type mpiaijcusparse -dm_vec_type mpicuda -pc_type gamg -pc_gamg_esteig_ksp_max_it 10 -ksp_monitor  -mg_levels_ksp_max_it 3
1119c4762a1bSJed Brown 
1120c4762a1bSJed Brown    test:
1121d38ac8baSRichard Tran Mills       suffix: cuda_dm_bind_below
1122d38ac8baSRichard Tran Mills       nsize: 2
1123d38ac8baSRichard Tran Mills       requires: cuda
1124d38ac8baSRichard Tran Mills       args: -dm_mat_type aijcusparse -dm_vec_type cuda -da_refine 3 -pc_type mg -mg_levels_ksp_type chebyshev -mg_levels_pc_type jacobi -log_view -pc_mg_log -dm_bind_below 10000
1125d38ac8baSRichard Tran Mills       filter: awk "/Level/ {print \$24}"
1126d38ac8baSRichard Tran Mills 
1127d38ac8baSRichard Tran Mills    test:
1128d38ac8baSRichard Tran Mills       suffix: viennacl_dm_bind_below
1129d38ac8baSRichard Tran Mills       nsize: 2
1130d38ac8baSRichard Tran Mills       requires: viennacl
1131d38ac8baSRichard Tran Mills       args: -dm_mat_type aijviennacl -dm_vec_type viennacl -da_refine 3 -pc_type mg -mg_levels_ksp_type chebyshev -mg_levels_pc_type jacobi -log_view -pc_mg_log -dm_bind_below 10000
1132d38ac8baSRichard Tran Mills       filter: awk "/Level/ {print \$24}"
1133d38ac8baSRichard Tran Mills 
1134d38ac8baSRichard Tran Mills    test:
1135c4762a1bSJed Brown       suffix: seqbaijmkl
1136c4762a1bSJed Brown       nsize: 1
1137dfd57a17SPierre Jolivet       requires: defined(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1138c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1139c4762a1bSJed Brown 
1140c4762a1bSJed Brown    test:
1141c4762a1bSJed Brown       suffix: mpibaijmkl
1142c4762a1bSJed Brown       nsize: 2
1143dfd57a17SPierre Jolivet       requires:  defined(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1144c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1145c4762a1bSJed Brown 
1146c4762a1bSJed Brown    test:
1147c4762a1bSJed Brown      suffix: cpardiso
1148c4762a1bSJed Brown      nsize: 4
1149c4762a1bSJed Brown      requires: mkl_cpardiso
1150c4762a1bSJed Brown      args: -pc_type lu -pc_factor_mat_solver_type mkl_cpardiso -ksp_monitor
1151c4762a1bSJed Brown 
1152c4762a1bSJed Brown    test:
1153c4762a1bSJed Brown      suffix: logviewmemory
1154dfd57a17SPierre Jolivet      requires: defined(PETSC_USE_LOG) !defined(PETSCTEST_VALGRIND)
1155c4762a1bSJed Brown      args: -log_view -log_view_memory -da_refine 4
1156c4762a1bSJed Brown      filter: grep MatFDColorSetUp | wc -w | xargs  -I % sh -c "expr % \> 21"
1157c4762a1bSJed Brown 
1158534f0846SBarry Smith    test:
1159534f0846SBarry Smith      suffix: fs
1160534f0846SBarry Smith      args: -pc_type fieldsplit -da_refine 3  -all_ksp_monitor -fieldsplit_y_velocity_pc_type lu  -fieldsplit_temperature_pc_type lu -fieldsplit_x_velocity_pc_type lu  -snes_view
1161534f0846SBarry Smith 
116271f558e3SSatish Balay    test:
1163a8e42557SLawrence Mitchell      suffix: asm_matconvert
1164a8e42557SLawrence Mitchell      args: -mat_type aij -pc_type asm -pc_asm_sub_mat_type dense -snes_view
1165a8e42557SLawrence Mitchell 
11668bf83915SBarry Smith    test:
11678bf83915SBarry Smith       suffix: euclid
11688bf83915SBarry Smith       nsize: 2
1169263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11708bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid
11718bf83915SBarry Smith 
11728bf83915SBarry Smith    test:
11738bf83915SBarry Smith       suffix: euclid_bj
11748bf83915SBarry Smith       nsize: 2
1175263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11768bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid -pc_hypre_euclid_bj
11778bf83915SBarry Smith 
11788bf83915SBarry Smith    test:
11798bf83915SBarry Smith       suffix: euclid_droptolerance
11808bf83915SBarry Smith       nsize: 1
1181263f2b91SStefano Zampini       requires: hypre !single !complex !defined(PETSC_HAVE_HYPRE_MIXEDINT) !defined(PETSC_HAVE_HYPRE_DEVICE)
11828bf83915SBarry Smith       args: -da_refine 2 -ksp_monitor -snes_monitor -snes_view -pc_type hypre -pc_hypre_type euclid -pc_hypre_euclid_droptolerance .1
11838bf83915SBarry Smith 
1184c4762a1bSJed Brown TEST*/
1185