xref: /petsc/src/snes/tutorials/ex19.c (revision 2c7c0729d89b910088ee906aed2239ea927d033e)
1c4762a1bSJed Brown 
/*
   Help text handed to PetscInitialize() in main().  The '&lt' and '&gt'
   sequences are intentional HTML escapes for '<' and '>'.
*/
static char help[] =
  "Nonlinear driven cavity with multigrid in 2d.\n"
  "   \n"
  "The 2D driven cavity problem is solved in a velocity-vorticity formulation.\n"
  "The flow can be driven with the lid or with buoyancy or both:\n"
  "  -lidvelocity &ltlid&gt, where &ltlid&gt = dimensionless velocity of lid\n"
  "  -grashof &ltgr&gt, where &ltgr&gt = dimensionless temperature gradient\n"
  "  -prandtl &ltpr&gt, where &ltpr&gt = dimensionless thermal/momentum diffusivity ratio\n"
  " -contours : draw contour plots of solution\n\n";
10c4762a1bSJed Brown /* in HTML, '&lt' = '<' and '&gt' = '>' */
11c4762a1bSJed Brown 
12c4762a1bSJed Brown /*
13c4762a1bSJed Brown       See src/ksp/ksp/tutorials/ex45.c
14c4762a1bSJed Brown */
15c4762a1bSJed Brown 
16c4762a1bSJed Brown /*T
17c4762a1bSJed Brown    Concepts: SNES^solving a system of nonlinear equations (parallel multicomponent example);
18c4762a1bSJed Brown    Concepts: DMDA^using distributed arrays;
19c4762a1bSJed Brown    Concepts: multicomponent
20c4762a1bSJed Brown    Processors: n
21c4762a1bSJed Brown T*/
22c4762a1bSJed Brown 
23c4762a1bSJed Brown 
24c4762a1bSJed Brown /*F-----------------------------------------------------------------------
25c4762a1bSJed Brown 
26c4762a1bSJed Brown     We thank David E. Keyes for contributing the driven cavity discretization within this example code.
27c4762a1bSJed Brown 
28c4762a1bSJed Brown     This problem is modeled by the partial differential equation system
29c4762a1bSJed Brown 
30c4762a1bSJed Brown \begin{eqnarray}
31c4762a1bSJed Brown         - \triangle U - \nabla_y \Omega & = & 0  \\
32c4762a1bSJed Brown         - \triangle V + \nabla_x\Omega & = & 0  \\
33c4762a1bSJed Brown         - \triangle \Omega + \nabla \cdot ([U*\Omega,V*\Omega]) - GR* \nabla_x T & = & 0  \\
34c4762a1bSJed Brown         - \triangle T + PR* \nabla \cdot ([U*T,V*T]) & = & 0
35c4762a1bSJed Brown \end{eqnarray}
36c4762a1bSJed Brown 
37c4762a1bSJed Brown     in the unit square, which is uniformly discretized in each of x and y in this simple encoding.
38c4762a1bSJed Brown 
39c4762a1bSJed Brown     No-slip, rigid-wall Dirichlet conditions are used for $ [U,V]$.
40c4762a1bSJed Brown     Dirichlet conditions are used for Omega, based on the definition of
41c4762a1bSJed Brown     vorticity: $ \Omega = - \nabla_y U + \nabla_x V$, where along each
42c4762a1bSJed Brown     constant coordinate boundary, the tangential derivative is zero.
43c4762a1bSJed Brown     Dirichlet conditions are used for T on the left and right walls,
44c4762a1bSJed Brown     and insulation homogeneous Neumann conditions are used for T on
45c4762a1bSJed Brown     the top and bottom walls.
46c4762a1bSJed Brown 
47c4762a1bSJed Brown     A finite difference approximation with the usual 5-point stencil
48c4762a1bSJed Brown     is used to discretize the boundary value problem to obtain a
49c4762a1bSJed Brown     nonlinear system of equations.  Upwinding is used for the divergence
50c4762a1bSJed Brown     (convective) terms and central for the gradient (source) terms.
51c4762a1bSJed Brown 
52c4762a1bSJed Brown     The Jacobian can be either
53c4762a1bSJed Brown       * formed via finite differencing using coloring (the default), or
54c4762a1bSJed Brown       * applied matrix-free via the option -snes_mf
55c4762a1bSJed Brown         (for larger grid problems this variant may not converge
56c4762a1bSJed Brown         without a preconditioner due to ill-conditioning).
57c4762a1bSJed Brown 
58c4762a1bSJed Brown   ------------------------------------------------------------------------F*/
59c4762a1bSJed Brown 
/*
   Include "petscdmda.h" so that we can use distributed arrays (DMDAs).
   Include "petscsnes.h" so that we can use SNES solvers.  Note that this
   file automatically includes:
     petscsys.h    - base PETSc routines   petscvec.h - vectors
     petscmat.h    - matrices              petscis.h  - index sets
     petscviewer.h - viewers               petscpc.h  - preconditioners
     petscksp.h    - Krylov subspace methods (linear solvers)
*/
70c4762a1bSJed Brown #if defined(PETSC_APPLE_FRAMEWORK)
71c4762a1bSJed Brown #import <PETSc/petscsnes.h>
72c4762a1bSJed Brown #import <PETSc/petscdmda.h>
73c4762a1bSJed Brown #else
74c4762a1bSJed Brown #include <petscsnes.h>
75c4762a1bSJed Brown #include <petscdm.h>
76c4762a1bSJed Brown #include <petscdmda.h>
77c4762a1bSJed Brown #endif
78c4762a1bSJed Brown 
79c4762a1bSJed Brown /*
80c4762a1bSJed Brown    User-defined routines and data structures
81c4762a1bSJed Brown */
82c4762a1bSJed Brown typedef struct {
83c4762a1bSJed Brown   PetscScalar u,v,omega,temp;
84c4762a1bSJed Brown } Field;
85c4762a1bSJed Brown 
86c4762a1bSJed Brown PetscErrorCode FormFunctionLocal(DMDALocalInfo*,Field**,Field**,void*);
87c4762a1bSJed Brown 
88c4762a1bSJed Brown typedef struct {
89c4762a1bSJed Brown   PetscReal   lidvelocity,prandtl,grashof;  /* physical parameters */
90c4762a1bSJed Brown   PetscBool   draw_contours;                /* flag - 1 indicates drawing contours */
91c4762a1bSJed Brown } AppCtx;
92c4762a1bSJed Brown 
93c4762a1bSJed Brown extern PetscErrorCode FormInitialGuess(AppCtx*,DM,Vec);
94c4762a1bSJed Brown extern PetscErrorCode NonlinearGS(SNES,Vec,Vec,void*);
95c4762a1bSJed Brown 
96c4762a1bSJed Brown int main(int argc,char **argv)
97c4762a1bSJed Brown {
98c4762a1bSJed Brown   AppCtx         user;                /* user-defined work context */
99c4762a1bSJed Brown   PetscInt       mx,my,its;
100c4762a1bSJed Brown   PetscErrorCode ierr;
101c4762a1bSJed Brown   MPI_Comm       comm;
102c4762a1bSJed Brown   SNES           snes;
103c4762a1bSJed Brown   DM             da;
104c4762a1bSJed Brown   Vec            x;
105c4762a1bSJed Brown 
106c4762a1bSJed Brown   ierr = PetscInitialize(&argc,&argv,(char*)0,help);if (ierr) return ierr;
107c4762a1bSJed Brown 
108c4762a1bSJed Brown   PetscFunctionBeginUser;
109c4762a1bSJed Brown   comm = PETSC_COMM_WORLD;
110c4762a1bSJed Brown   ierr = SNESCreate(comm,&snes);CHKERRQ(ierr);
111c4762a1bSJed Brown 
112c4762a1bSJed Brown   /*
113c4762a1bSJed Brown       Create distributed array object to manage parallel grid and vectors
114c4762a1bSJed Brown       for principal unknowns (x) and governing residuals (f)
115c4762a1bSJed Brown   */
116c4762a1bSJed Brown   ierr = DMDACreate2d(PETSC_COMM_WORLD,DM_BOUNDARY_NONE,DM_BOUNDARY_NONE,DMDA_STENCIL_STAR,4,4,PETSC_DECIDE,PETSC_DECIDE,4,1,0,0,&da);CHKERRQ(ierr);
117c4762a1bSJed Brown   ierr = DMSetFromOptions(da);CHKERRQ(ierr);
118c4762a1bSJed Brown   ierr = DMSetUp(da);CHKERRQ(ierr);
119c4762a1bSJed Brown   ierr = SNESSetDM(snes,(DM)da);CHKERRQ(ierr);
120c4762a1bSJed Brown   ierr = SNESSetNGS(snes, NonlinearGS, (void*)&user);CHKERRQ(ierr);
121c4762a1bSJed Brown 
122c4762a1bSJed Brown   ierr = DMDAGetInfo(da,0,&mx,&my,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE);CHKERRQ(ierr);
123c4762a1bSJed Brown   /*
124c4762a1bSJed Brown      Problem parameters (velocity of lid, prandtl, and grashof numbers)
125c4762a1bSJed Brown   */
126c4762a1bSJed Brown   user.lidvelocity = 1.0/(mx*my);
127c4762a1bSJed Brown   user.prandtl     = 1.0;
128c4762a1bSJed Brown   user.grashof     = 1.0;
129c4762a1bSJed Brown 
130c4762a1bSJed Brown   ierr = PetscOptionsGetReal(NULL,NULL,"-lidvelocity",&user.lidvelocity,NULL);CHKERRQ(ierr);
131c4762a1bSJed Brown   ierr = PetscOptionsGetReal(NULL,NULL,"-prandtl",&user.prandtl,NULL);CHKERRQ(ierr);
132c4762a1bSJed Brown   ierr = PetscOptionsGetReal(NULL,NULL,"-grashof",&user.grashof,NULL);CHKERRQ(ierr);
133c4762a1bSJed Brown   ierr = PetscOptionsHasName(NULL,NULL,"-contours",&user.draw_contours);CHKERRQ(ierr);
134c4762a1bSJed Brown 
135c4762a1bSJed Brown   ierr = DMDASetFieldName(da,0,"x_velocity");CHKERRQ(ierr);
136c4762a1bSJed Brown   ierr = DMDASetFieldName(da,1,"y_velocity");CHKERRQ(ierr);
137c4762a1bSJed Brown   ierr = DMDASetFieldName(da,2,"Omega");CHKERRQ(ierr);
138c4762a1bSJed Brown   ierr = DMDASetFieldName(da,3,"temperature");CHKERRQ(ierr);
139c4762a1bSJed Brown 
140c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
141c4762a1bSJed Brown      Create user context, set problem data, create vector data structures.
142c4762a1bSJed Brown      Also, compute the initial guess.
143c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
144c4762a1bSJed Brown 
145c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
146c4762a1bSJed Brown      Create nonlinear solver context
147c4762a1bSJed Brown 
148c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
149c4762a1bSJed Brown   ierr = DMSetApplicationContext(da,&user);CHKERRQ(ierr);
150c4762a1bSJed Brown   ierr = DMDASNESSetFunctionLocal(da,INSERT_VALUES,(PetscErrorCode (*)(DMDALocalInfo*,void*,void*,void*))FormFunctionLocal,&user);CHKERRQ(ierr);
151c4762a1bSJed Brown   ierr = SNESSetFromOptions(snes);CHKERRQ(ierr);
152c4762a1bSJed Brown   ierr = PetscPrintf(comm,"lid velocity = %g, prandtl # = %g, grashof # = %g\n",(double)user.lidvelocity,(double)user.prandtl,(double)user.grashof);CHKERRQ(ierr);
153c4762a1bSJed Brown 
154c4762a1bSJed Brown 
155c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
156c4762a1bSJed Brown      Solve the nonlinear system
157c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
158c4762a1bSJed Brown   ierr = DMCreateGlobalVector(da,&x);CHKERRQ(ierr);
159c4762a1bSJed Brown   ierr = FormInitialGuess(&user,da,x);CHKERRQ(ierr);
160c4762a1bSJed Brown 
161c4762a1bSJed Brown   ierr = SNESSolve(snes,NULL,x);CHKERRQ(ierr);
162c4762a1bSJed Brown 
163c4762a1bSJed Brown   ierr = SNESGetIterationNumber(snes,&its);CHKERRQ(ierr);
164c4762a1bSJed Brown   ierr = PetscPrintf(comm,"Number of SNES iterations = %D\n", its);CHKERRQ(ierr);
165c4762a1bSJed Brown 
166c4762a1bSJed Brown   /*
167c4762a1bSJed Brown      Visualize solution
168c4762a1bSJed Brown   */
169c4762a1bSJed Brown   if (user.draw_contours) {
170c4762a1bSJed Brown     ierr = VecView(x,PETSC_VIEWER_DRAW_WORLD);CHKERRQ(ierr);
171c4762a1bSJed Brown   }
172c4762a1bSJed Brown 
173c4762a1bSJed Brown   /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
174c4762a1bSJed Brown      Free work space.  All PETSc objects should be destroyed when they
175c4762a1bSJed Brown      are no longer needed.
176c4762a1bSJed Brown      - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
177c4762a1bSJed Brown   ierr = VecDestroy(&x);CHKERRQ(ierr);
178c4762a1bSJed Brown   ierr = DMDestroy(&da);CHKERRQ(ierr);
179c4762a1bSJed Brown   ierr = SNESDestroy(&snes);CHKERRQ(ierr);
180c4762a1bSJed Brown   ierr = PetscFinalize();
181c4762a1bSJed Brown   return ierr;
182c4762a1bSJed Brown }
183c4762a1bSJed Brown 
184c4762a1bSJed Brown /* ------------------------------------------------------------------- */
185c4762a1bSJed Brown 
186c4762a1bSJed Brown /*
187c4762a1bSJed Brown    FormInitialGuess - Forms initial approximation.
188c4762a1bSJed Brown 
189c4762a1bSJed Brown    Input Parameters:
190c4762a1bSJed Brown    user - user-defined application context
191c4762a1bSJed Brown    X - vector
192c4762a1bSJed Brown 
193c4762a1bSJed Brown    Output Parameter:
194c4762a1bSJed Brown    X - vector
195c4762a1bSJed Brown */
196c4762a1bSJed Brown PetscErrorCode FormInitialGuess(AppCtx *user,DM da,Vec X)
197c4762a1bSJed Brown {
198c4762a1bSJed Brown   PetscInt       i,j,mx,xs,ys,xm,ym;
199c4762a1bSJed Brown   PetscErrorCode ierr;
200c4762a1bSJed Brown   PetscReal      grashof,dx;
201c4762a1bSJed Brown   Field          **x;
202c4762a1bSJed Brown 
203c4762a1bSJed Brown   PetscFunctionBeginUser;
204c4762a1bSJed Brown   grashof = user->grashof;
205c4762a1bSJed Brown 
206c4762a1bSJed Brown   ierr = DMDAGetInfo(da,0,&mx,0,0,0,0,0,0,0,0,0,0,0);CHKERRQ(ierr);
207c4762a1bSJed Brown   dx   = 1.0/(mx-1);
208c4762a1bSJed Brown 
209c4762a1bSJed Brown   /*
210c4762a1bSJed Brown      Get local grid boundaries (for 2-dimensional DMDA):
211c4762a1bSJed Brown        xs, ys   - starting grid indices (no ghost points)
212c4762a1bSJed Brown        xm, ym   - widths of local grid (no ghost points)
213c4762a1bSJed Brown   */
214c4762a1bSJed Brown   ierr = DMDAGetCorners(da,&xs,&ys,NULL,&xm,&ym,NULL);CHKERRQ(ierr);
215c4762a1bSJed Brown 
216c4762a1bSJed Brown   /*
217c4762a1bSJed Brown      Get a pointer to vector data.
218c4762a1bSJed Brown        - For default PETSc vectors, VecGetArray() returns a pointer to
219c4762a1bSJed Brown          the data array.  Otherwise, the routine is implementation dependent.
220c4762a1bSJed Brown        - You MUST call VecRestoreArray() when you no longer need access to
221c4762a1bSJed Brown          the array.
222c4762a1bSJed Brown   */
223c4762a1bSJed Brown   ierr = DMDAVecGetArrayWrite(da,X,&x);CHKERRQ(ierr);
224c4762a1bSJed Brown 
225c4762a1bSJed Brown   /*
226c4762a1bSJed Brown      Compute initial guess over the locally owned part of the grid
227c4762a1bSJed Brown      Initial condition is motionless fluid and equilibrium temperature
228c4762a1bSJed Brown   */
229c4762a1bSJed Brown   for (j=ys; j<ys+ym; j++) {
230c4762a1bSJed Brown     for (i=xs; i<xs+xm; i++) {
231c4762a1bSJed Brown       x[j][i].u     = 0.0;
232c4762a1bSJed Brown       x[j][i].v     = 0.0;
233c4762a1bSJed Brown       x[j][i].omega = 0.0;
234c4762a1bSJed Brown       x[j][i].temp  = (grashof>0)*i*dx;
235c4762a1bSJed Brown     }
236c4762a1bSJed Brown   }
237c4762a1bSJed Brown 
238c4762a1bSJed Brown   /*
239c4762a1bSJed Brown      Restore vector
240c4762a1bSJed Brown   */
241c4762a1bSJed Brown   ierr = DMDAVecRestoreArrayWrite(da,X,&x);CHKERRQ(ierr);
242c4762a1bSJed Brown   PetscFunctionReturn(0);
243c4762a1bSJed Brown }
244c4762a1bSJed Brown 
245c4762a1bSJed Brown PetscErrorCode FormFunctionLocal(DMDALocalInfo *info,Field **x,Field **f,void *ptr)
246c4762a1bSJed Brown {
247c4762a1bSJed Brown   AppCtx         *user = (AppCtx*)ptr;
248c4762a1bSJed Brown   PetscErrorCode ierr;
249c4762a1bSJed Brown   PetscInt       xints,xinte,yints,yinte,i,j;
250c4762a1bSJed Brown   PetscReal      hx,hy,dhx,dhy,hxdhy,hydhx;
251c4762a1bSJed Brown   PetscReal      grashof,prandtl,lid;
252c4762a1bSJed Brown   PetscScalar    u,uxx,uyy,vx,vy,avx,avy,vxp,vxm,vyp,vym;
253c4762a1bSJed Brown 
254c4762a1bSJed Brown   PetscFunctionBeginUser;
255c4762a1bSJed Brown   grashof = user->grashof;
256c4762a1bSJed Brown   prandtl = user->prandtl;
257c4762a1bSJed Brown   lid     = user->lidvelocity;
258c4762a1bSJed Brown 
259c4762a1bSJed Brown   /*
260c4762a1bSJed Brown      Define mesh intervals ratios for uniform grid.
261c4762a1bSJed Brown 
262c4762a1bSJed Brown      Note: FD formulae below are normalized by multiplying through by
263c4762a1bSJed Brown      local volume element (i.e. hx*hy) to obtain coefficients O(1) in two dimensions.
264c4762a1bSJed Brown 
265c4762a1bSJed Brown 
266c4762a1bSJed Brown   */
267c4762a1bSJed Brown   dhx   = (PetscReal)(info->mx-1);  dhy = (PetscReal)(info->my-1);
268c4762a1bSJed Brown   hx    = 1.0/dhx;                   hy = 1.0/dhy;
269c4762a1bSJed Brown   hxdhy = hx*dhy;                 hydhx = hy*dhx;
270c4762a1bSJed Brown 
271c4762a1bSJed Brown   xints = info->xs; xinte = info->xs+info->xm; yints = info->ys; yinte = info->ys+info->ym;
272c4762a1bSJed Brown 
273c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
274c4762a1bSJed Brown   if (yints == 0) {
275c4762a1bSJed Brown     j     = 0;
276c4762a1bSJed Brown     yints = yints + 1;
277c4762a1bSJed Brown     /* bottom edge */
278c4762a1bSJed Brown     for (i=info->xs; i<info->xs+info->xm; i++) {
279c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
280c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
281c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j+1][i].u - x[j][i].u)*dhy;
282c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp-x[j+1][i].temp;
283c4762a1bSJed Brown     }
284c4762a1bSJed Brown   }
285c4762a1bSJed Brown 
286c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
287c4762a1bSJed Brown   if (yinte == info->my) {
288c4762a1bSJed Brown     j     = info->my - 1;
289c4762a1bSJed Brown     yinte = yinte - 1;
290c4762a1bSJed Brown     /* top edge */
291c4762a1bSJed Brown     for (i=info->xs; i<info->xs+info->xm; i++) {
292c4762a1bSJed Brown       f[j][i].u     = x[j][i].u - lid;
293c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
294c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega + (x[j][i].u - x[j-1][i].u)*dhy;
295c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp-x[j-1][i].temp;
296c4762a1bSJed Brown     }
297c4762a1bSJed Brown   }
298c4762a1bSJed Brown 
299c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
300c4762a1bSJed Brown   if (xints == 0) {
301c4762a1bSJed Brown     i     = 0;
302c4762a1bSJed Brown     xints = xints + 1;
303c4762a1bSJed Brown     /* left edge */
304c4762a1bSJed Brown     for (j=info->ys; j<info->ys+info->ym; j++) {
305c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
306c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
307c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i+1].v - x[j][i].v)*dhx;
308c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp;
309c4762a1bSJed Brown     }
310c4762a1bSJed Brown   }
311c4762a1bSJed Brown 
312c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
313c4762a1bSJed Brown   if (xinte == info->mx) {
314c4762a1bSJed Brown     i     = info->mx - 1;
315c4762a1bSJed Brown     xinte = xinte - 1;
316c4762a1bSJed Brown     /* right edge */
317c4762a1bSJed Brown     for (j=info->ys; j<info->ys+info->ym; j++) {
318c4762a1bSJed Brown       f[j][i].u     = x[j][i].u;
319c4762a1bSJed Brown       f[j][i].v     = x[j][i].v;
320c4762a1bSJed Brown       f[j][i].omega = x[j][i].omega - (x[j][i].v - x[j][i-1].v)*dhx;
321c4762a1bSJed Brown       f[j][i].temp  = x[j][i].temp - (PetscReal)(grashof>0);
322c4762a1bSJed Brown     }
323c4762a1bSJed Brown   }
324c4762a1bSJed Brown 
325c4762a1bSJed Brown   /* Compute over the interior points */
326c4762a1bSJed Brown   for (j=yints; j<yinte; j++) {
327c4762a1bSJed Brown     for (i=xints; i<xinte; i++) {
328c4762a1bSJed Brown 
329c4762a1bSJed Brown       /*
330c4762a1bSJed Brown        convective coefficients for upwinding
331c4762a1bSJed Brown       */
332c4762a1bSJed Brown       vx  = x[j][i].u; avx = PetscAbsScalar(vx);
333c4762a1bSJed Brown       vxp = .5*(vx+avx); vxm = .5*(vx-avx);
334c4762a1bSJed Brown       vy  = x[j][i].v; avy = PetscAbsScalar(vy);
335c4762a1bSJed Brown       vyp = .5*(vy+avy); vym = .5*(vy-avy);
336c4762a1bSJed Brown 
337c4762a1bSJed Brown       /* U velocity */
338c4762a1bSJed Brown       u         = x[j][i].u;
339c4762a1bSJed Brown       uxx       = (2.0*u - x[j][i-1].u - x[j][i+1].u)*hydhx;
340c4762a1bSJed Brown       uyy       = (2.0*u - x[j-1][i].u - x[j+1][i].u)*hxdhy;
341c4762a1bSJed Brown       f[j][i].u = uxx + uyy - .5*(x[j+1][i].omega-x[j-1][i].omega)*hx;
342c4762a1bSJed Brown 
343c4762a1bSJed Brown       /* V velocity */
344c4762a1bSJed Brown       u         = x[j][i].v;
345c4762a1bSJed Brown       uxx       = (2.0*u - x[j][i-1].v - x[j][i+1].v)*hydhx;
346c4762a1bSJed Brown       uyy       = (2.0*u - x[j-1][i].v - x[j+1][i].v)*hxdhy;
347c4762a1bSJed Brown       f[j][i].v = uxx + uyy + .5*(x[j][i+1].omega-x[j][i-1].omega)*hy;
348c4762a1bSJed Brown 
349c4762a1bSJed Brown       /* Omega */
350c4762a1bSJed Brown       u             = x[j][i].omega;
351c4762a1bSJed Brown       uxx           = (2.0*u - x[j][i-1].omega - x[j][i+1].omega)*hydhx;
352c4762a1bSJed Brown       uyy           = (2.0*u - x[j-1][i].omega - x[j+1][i].omega)*hxdhy;
353c4762a1bSJed Brown       f[j][i].omega = uxx + uyy + (vxp*(u - x[j][i-1].omega) + vxm*(x[j][i+1].omega - u))*hy +
354c4762a1bSJed Brown                       (vyp*(u - x[j-1][i].omega) + vym*(x[j+1][i].omega - u))*hx -
355c4762a1bSJed Brown                       .5*grashof*(x[j][i+1].temp - x[j][i-1].temp)*hy;
356c4762a1bSJed Brown 
357c4762a1bSJed Brown       /* Temperature */
358c4762a1bSJed Brown       u            = x[j][i].temp;
359c4762a1bSJed Brown       uxx          = (2.0*u - x[j][i-1].temp - x[j][i+1].temp)*hydhx;
360c4762a1bSJed Brown       uyy          = (2.0*u - x[j-1][i].temp - x[j+1][i].temp)*hxdhy;
361c4762a1bSJed Brown       f[j][i].temp =  uxx + uyy  + prandtl*((vxp*(u - x[j][i-1].temp) + vxm*(x[j][i+1].temp - u))*hy +
362c4762a1bSJed Brown                                             (vyp*(u - x[j-1][i].temp) + vym*(x[j+1][i].temp - u))*hx);
363c4762a1bSJed Brown     }
364c4762a1bSJed Brown   }
365c4762a1bSJed Brown 
366c4762a1bSJed Brown   /*
367c4762a1bSJed Brown      Flop count (multiply-adds are counted as 2 operations)
368c4762a1bSJed Brown   */
369c4762a1bSJed Brown   ierr = PetscLogFlops(84.0*info->ym*info->xm);CHKERRQ(ierr);
370c4762a1bSJed Brown   PetscFunctionReturn(0);
371c4762a1bSJed Brown }
372c4762a1bSJed Brown 
373c4762a1bSJed Brown /*
374c4762a1bSJed Brown     Performs sweeps of point block nonlinear Gauss-Seidel on all the local grid points
375c4762a1bSJed Brown */
376c4762a1bSJed Brown PetscErrorCode NonlinearGS(SNES snes, Vec X, Vec B, void *ctx)
377c4762a1bSJed Brown {
378c4762a1bSJed Brown   DMDALocalInfo  info;
379c4762a1bSJed Brown   Field          **x,**b;
380c4762a1bSJed Brown   PetscErrorCode ierr;
381c4762a1bSJed Brown   Vec            localX, localB;
382c4762a1bSJed Brown   DM             da;
383c4762a1bSJed Brown   PetscInt       xints,xinte,yints,yinte,i,j,k,l;
384c4762a1bSJed Brown   PetscInt       max_its,tot_its;
385c4762a1bSJed Brown   PetscInt       sweeps;
386c4762a1bSJed Brown   PetscReal      rtol,atol,stol;
387c4762a1bSJed Brown   PetscReal      hx,hy,dhx,dhy,hxdhy,hydhx;
388c4762a1bSJed Brown   PetscReal      grashof,prandtl,lid;
389c4762a1bSJed Brown   PetscScalar    u,uxx,uyy,vx,vy,avx,avy,vxp,vxm,vyp,vym;
390c4762a1bSJed Brown   PetscScalar    fu, fv, fomega, ftemp;
391c4762a1bSJed Brown   PetscScalar    dfudu;
392c4762a1bSJed Brown   PetscScalar    dfvdv;
393c4762a1bSJed Brown   PetscScalar    dfodu, dfodv, dfodo;
394c4762a1bSJed Brown   PetscScalar    dftdu, dftdv, dftdt;
395c4762a1bSJed Brown   PetscScalar    yu=0, yv=0, yo=0, yt=0;
396c4762a1bSJed Brown   PetscScalar    bjiu, bjiv, bjiomega, bjitemp;
397c4762a1bSJed Brown   PetscBool      ptconverged;
398c4762a1bSJed Brown   PetscReal      pfnorm,pfnorm0,pynorm,pxnorm;
399c4762a1bSJed Brown   AppCtx         *user = (AppCtx*)ctx;
400c4762a1bSJed Brown 
401c4762a1bSJed Brown   PetscFunctionBeginUser;
402c4762a1bSJed Brown   grashof = user->grashof;
403c4762a1bSJed Brown   prandtl = user->prandtl;
404c4762a1bSJed Brown   lid     = user->lidvelocity;
405c4762a1bSJed Brown   tot_its = 0;
406c4762a1bSJed Brown   ierr    = SNESNGSGetTolerances(snes,&rtol,&atol,&stol,&max_its);CHKERRQ(ierr);
407c4762a1bSJed Brown   ierr    = SNESNGSGetSweeps(snes,&sweeps);CHKERRQ(ierr);
408c4762a1bSJed Brown   ierr    = SNESGetDM(snes,(DM*)&da);CHKERRQ(ierr);
409c4762a1bSJed Brown   ierr    = DMGetLocalVector(da,&localX);CHKERRQ(ierr);
410c4762a1bSJed Brown   if (B) {
411c4762a1bSJed Brown     ierr = DMGetLocalVector(da,&localB);CHKERRQ(ierr);
412c4762a1bSJed Brown   }
413c4762a1bSJed Brown   /*
414c4762a1bSJed Brown      Scatter ghost points to local vector, using the 2-step process
415c4762a1bSJed Brown         DMGlobalToLocalBegin(), DMGlobalToLocalEnd().
416c4762a1bSJed Brown   */
417c4762a1bSJed Brown   ierr = DMGlobalToLocalBegin(da,X,INSERT_VALUES,localX);CHKERRQ(ierr);
418c4762a1bSJed Brown   ierr = DMGlobalToLocalEnd(da,X,INSERT_VALUES,localX);CHKERRQ(ierr);
419c4762a1bSJed Brown   if (B) {
420c4762a1bSJed Brown     ierr = DMGlobalToLocalBegin(da,B,INSERT_VALUES,localB);CHKERRQ(ierr);
421c4762a1bSJed Brown     ierr = DMGlobalToLocalEnd(da,B,INSERT_VALUES,localB);CHKERRQ(ierr);
422c4762a1bSJed Brown   }
423c4762a1bSJed Brown   ierr = DMDAGetLocalInfo(da,&info);CHKERRQ(ierr);
424c4762a1bSJed Brown   ierr = DMDAVecGetArrayWrite(da,localX,&x);CHKERRQ(ierr);
425c4762a1bSJed Brown   if (B) {
426c4762a1bSJed Brown     ierr = DMDAVecGetArrayRead(da,localB,&b);CHKERRQ(ierr);
427c4762a1bSJed Brown   }
428c4762a1bSJed Brown   /* looks like a combination of the formfunction / formjacobian routines */
429c4762a1bSJed Brown   dhx   = (PetscReal)(info.mx-1);dhy   = (PetscReal)(info.my-1);
430c4762a1bSJed Brown   hx    = 1.0/dhx;               hy    = 1.0/dhy;
431c4762a1bSJed Brown   hxdhy = hx*dhy;                hydhx = hy*dhx;
432c4762a1bSJed Brown 
433c4762a1bSJed Brown   xints = info.xs; xinte = info.xs+info.xm; yints = info.ys; yinte = info.ys+info.ym;
434c4762a1bSJed Brown 
435c4762a1bSJed Brown   /* Set the boundary conditions on the momentum equations */
436c4762a1bSJed Brown   /* Test whether we are on the bottom edge of the global array */
437c4762a1bSJed Brown   if (yints == 0) {
438c4762a1bSJed Brown     j     = 0;
439c4762a1bSJed Brown     /* bottom edge */
440c4762a1bSJed Brown     for (i=info.xs; i<info.xs+info.xm; i++) {
441c4762a1bSJed Brown 
442c4762a1bSJed Brown       if (B) {
443c4762a1bSJed Brown         bjiu = b[j][i].u;
444c4762a1bSJed Brown         bjiv = b[j][i].v;
445c4762a1bSJed Brown       } else {
446c4762a1bSJed Brown         bjiu = 0.0;
447c4762a1bSJed Brown         bjiv = 0.0;
448c4762a1bSJed Brown       }
449c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
450c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
451c4762a1bSJed Brown     }
452c4762a1bSJed Brown   }
453c4762a1bSJed Brown 
454c4762a1bSJed Brown   /* Test whether we are on the top edge of the global array */
455c4762a1bSJed Brown   if (yinte == info.my) {
456c4762a1bSJed Brown     j     = info.my - 1;
457c4762a1bSJed Brown     /* top edge */
458c4762a1bSJed Brown     for (i=info.xs; i<info.xs+info.xm; i++) {
459c4762a1bSJed Brown       if (B) {
460c4762a1bSJed Brown         bjiu = b[j][i].u;
461c4762a1bSJed Brown         bjiv = b[j][i].v;
462c4762a1bSJed Brown       } else {
463c4762a1bSJed Brown         bjiu = 0.0;
464c4762a1bSJed Brown         bjiv = 0.0;
465c4762a1bSJed Brown       }
466c4762a1bSJed Brown       x[j][i].u = lid + bjiu;
467c4762a1bSJed Brown       x[j][i].v = bjiv;
468c4762a1bSJed Brown     }
469c4762a1bSJed Brown   }
470c4762a1bSJed Brown 
471c4762a1bSJed Brown   /* Test whether we are on the left edge of the global array */
472c4762a1bSJed Brown   if (xints == 0) {
473c4762a1bSJed Brown     i     = 0;
474c4762a1bSJed Brown     /* left edge */
475c4762a1bSJed Brown     for (j=info.ys; j<info.ys+info.ym; j++) {
476c4762a1bSJed Brown       if (B) {
477c4762a1bSJed Brown         bjiu = b[j][i].u;
478c4762a1bSJed Brown         bjiv = b[j][i].v;
479c4762a1bSJed Brown       } else {
480c4762a1bSJed Brown         bjiu = 0.0;
481c4762a1bSJed Brown         bjiv = 0.0;
482c4762a1bSJed Brown       }
483c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
484c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
485c4762a1bSJed Brown     }
486c4762a1bSJed Brown   }
487c4762a1bSJed Brown 
488c4762a1bSJed Brown   /* Test whether we are on the right edge of the global array */
489c4762a1bSJed Brown   if (xinte == info.mx) {
490c4762a1bSJed Brown     i     = info.mx - 1;
491c4762a1bSJed Brown     /* right edge */
492c4762a1bSJed Brown     for (j=info.ys; j<info.ys+info.ym; j++) {
493c4762a1bSJed Brown       if (B) {
494c4762a1bSJed Brown         bjiu = b[j][i].u;
495c4762a1bSJed Brown         bjiv = b[j][i].v;
496c4762a1bSJed Brown       } else {
497c4762a1bSJed Brown         bjiu = 0.0;
498c4762a1bSJed Brown         bjiv = 0.0;
499c4762a1bSJed Brown       }
500c4762a1bSJed Brown       x[j][i].u = 0.0 + bjiu;
501c4762a1bSJed Brown       x[j][i].v = 0.0 + bjiv;
502c4762a1bSJed Brown     }
503c4762a1bSJed Brown   }
504c4762a1bSJed Brown 
505c4762a1bSJed Brown   for (k=0; k < sweeps; k++) {
506c4762a1bSJed Brown     for (j=info.ys; j<info.ys + info.ym; j++) {
507c4762a1bSJed Brown       for (i=info.xs; i<info.xs + info.xm; i++) {
508c4762a1bSJed Brown         ptconverged = PETSC_FALSE;
509c4762a1bSJed Brown         pfnorm0     = 0.0;
510c4762a1bSJed Brown         fu          = 0.0;
511c4762a1bSJed Brown         fv          = 0.0;
512c4762a1bSJed Brown         fomega      = 0.0;
513c4762a1bSJed Brown         ftemp       = 0.0;
514c4762a1bSJed Brown         /*  Run Newton's method on a single grid point */
515c4762a1bSJed Brown         for (l = 0; l < max_its && !ptconverged; l++) {
516c4762a1bSJed Brown           if (B) {
517c4762a1bSJed Brown             bjiu     = b[j][i].u;
518c4762a1bSJed Brown             bjiv     = b[j][i].v;
519c4762a1bSJed Brown             bjiomega = b[j][i].omega;
520c4762a1bSJed Brown             bjitemp  = b[j][i].temp;
521c4762a1bSJed Brown           } else {
522c4762a1bSJed Brown             bjiu     = 0.0;
523c4762a1bSJed Brown             bjiv     = 0.0;
524c4762a1bSJed Brown             bjiomega = 0.0;
525c4762a1bSJed Brown             bjitemp  = 0.0;
526c4762a1bSJed Brown           }
527c4762a1bSJed Brown 
528c4762a1bSJed Brown           if (i != 0 && i != info.mx - 1 && j != 0 && j != info.my-1) {
529c4762a1bSJed Brown             /* U velocity */
530c4762a1bSJed Brown             u     = x[j][i].u;
531c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].u - x[j][i+1].u)*hydhx;
532c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].u - x[j+1][i].u)*hxdhy;
533c4762a1bSJed Brown             fu    = uxx + uyy - .5*(x[j+1][i].omega-x[j-1][i].omega)*hx - bjiu;
534c4762a1bSJed Brown             dfudu = 2.0*(hydhx + hxdhy);
535c4762a1bSJed Brown             /* V velocity */
536c4762a1bSJed Brown             u     = x[j][i].v;
537c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].v - x[j][i+1].v)*hydhx;
538c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].v - x[j+1][i].v)*hxdhy;
539c4762a1bSJed Brown             fv    = uxx + uyy + .5*(x[j][i+1].omega-x[j][i-1].omega)*hy - bjiv;
540c4762a1bSJed Brown             dfvdv = 2.0*(hydhx + hxdhy);
541c4762a1bSJed Brown             /*
542c4762a1bSJed Brown              convective coefficients for upwinding
543c4762a1bSJed Brown              */
544c4762a1bSJed Brown             vx  = x[j][i].u; avx = PetscAbsScalar(vx);
545c4762a1bSJed Brown             vxp = .5*(vx+avx); vxm = .5*(vx-avx);
546c4762a1bSJed Brown             vy  = x[j][i].v; avy = PetscAbsScalar(vy);
547c4762a1bSJed Brown             vyp = .5*(vy+avy); vym = .5*(vy-avy);
548c4762a1bSJed Brown             /* Omega */
549c4762a1bSJed Brown             u      = x[j][i].omega;
550c4762a1bSJed Brown             uxx    = (2.0*u - x[j][i-1].omega - x[j][i+1].omega)*hydhx;
551c4762a1bSJed Brown             uyy    = (2.0*u - x[j-1][i].omega - x[j+1][i].omega)*hxdhy;
552c4762a1bSJed Brown             fomega = uxx + uyy +  (vxp*(u - x[j][i-1].omega) + vxm*(x[j][i+1].omega - u))*hy +
553c4762a1bSJed Brown                      (vyp*(u - x[j-1][i].omega) + vym*(x[j+1][i].omega - u))*hx -
554c4762a1bSJed Brown                      .5*grashof*(x[j][i+1].temp - x[j][i-1].temp)*hy - bjiomega;
555c4762a1bSJed Brown             /* convective coefficient derivatives */
556c4762a1bSJed Brown             dfodo = 2.0*(hydhx + hxdhy) + ((vxp - vxm)*hy + (vyp - vym)*hx);
557c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dfodu = (u - x[j][i-1].omega)*hy;
558c4762a1bSJed Brown             else dfodu = (x[j][i+1].omega - u)*hy;
559c4762a1bSJed Brown 
560c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dfodv = (u - x[j-1][i].omega)*hx;
561c4762a1bSJed Brown             else dfodv = (x[j+1][i].omega - u)*hx;
562c4762a1bSJed Brown 
563c4762a1bSJed Brown             /* Temperature */
564c4762a1bSJed Brown             u     = x[j][i].temp;
565c4762a1bSJed Brown             uxx   = (2.0*u - x[j][i-1].temp - x[j][i+1].temp)*hydhx;
566c4762a1bSJed Brown             uyy   = (2.0*u - x[j-1][i].temp - x[j+1][i].temp)*hxdhy;
567c4762a1bSJed Brown             ftemp =  uxx + uyy  + prandtl*((vxp*(u - x[j][i-1].temp) + vxm*(x[j][i+1].temp - u))*hy + (vyp*(u - x[j-1][i].temp) + vym*(x[j+1][i].temp - u))*hx) - bjitemp;
568c4762a1bSJed Brown             dftdt = 2.0*(hydhx + hxdhy) + prandtl*((vxp - vxm)*hy + (vyp - vym)*hx);
569c4762a1bSJed Brown             if (PetscRealPart(vx) > 0.0) dftdu = prandtl*(u - x[j][i-1].temp)*hy;
570c4762a1bSJed Brown             else dftdu = prandtl*(x[j][i+1].temp - u)*hy;
571c4762a1bSJed Brown 
572c4762a1bSJed Brown             if (PetscRealPart(vy) > 0.0) dftdv = prandtl*(u - x[j-1][i].temp)*hx;
573c4762a1bSJed Brown             else dftdv = prandtl*(x[j+1][i].temp - u)*hx;
574c4762a1bSJed Brown 
575c4762a1bSJed Brown             /* invert the system:
576c4762a1bSJed Brown              [ dfu / du     0        0        0    ][yu] = [fu]
577c4762a1bSJed Brown              [     0    dfv / dv     0        0    ][yv]   [fv]
578c4762a1bSJed Brown              [ dfo / du dfo / dv dfo / do     0    ][yo]   [fo]
579c4762a1bSJed Brown              [ dft / du dft / dv     0    dft / dt ][yt]   [ft]
580c4762a1bSJed Brown              by simple forward substitution (the matrix is lower triangular)
581c4762a1bSJed Brown            */
582c4762a1bSJed Brown             yu = fu / dfudu;
583c4762a1bSJed Brown             yv = fv / dfvdv;
584c4762a1bSJed Brown             yo = (fomega - (dfodu*yu + dfodv*yv)) / dfodo;
585c4762a1bSJed Brown             yt = (ftemp - (dftdu*yu + dftdv*yv)) / dftdt;
586c4762a1bSJed Brown 
587c4762a1bSJed Brown             x[j][i].u     = x[j][i].u - yu;
588c4762a1bSJed Brown             x[j][i].v     = x[j][i].v - yv;
589c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - yt;
590c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - yo;
591c4762a1bSJed Brown           }
592c4762a1bSJed Brown           if (i == 0) {
593c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i+1].v - x[j][i].v)*dhx - bjiomega;
594c4762a1bSJed Brown             ftemp         = x[j][i].temp - bjitemp;
595c4762a1bSJed Brown             yo            = fomega;
596c4762a1bSJed Brown             yt            = ftemp;
597c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
598c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
599c4762a1bSJed Brown           }
600c4762a1bSJed Brown           if (i == info.mx - 1) {
601c4762a1bSJed Brown             fomega        = x[j][i].omega - (x[j][i].v - x[j][i-1].v)*dhx - bjiomega;
602c4762a1bSJed Brown             ftemp         = x[j][i].temp - (PetscReal)(grashof>0) - bjitemp;
603c4762a1bSJed Brown             yo            = fomega;
604c4762a1bSJed Brown             yt            = ftemp;
605c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
606c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
607c4762a1bSJed Brown           }
608c4762a1bSJed Brown           if (j == 0) {
609c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j+1][i].u - x[j][i].u)*dhy - bjiomega;
610c4762a1bSJed Brown             ftemp         = x[j][i].temp-x[j+1][i].temp - bjitemp;
611c4762a1bSJed Brown             yo            = fomega;
612c4762a1bSJed Brown             yt            = ftemp;
613c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
614c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
615c4762a1bSJed Brown           }
616c4762a1bSJed Brown           if (j == info.my - 1) {
617c4762a1bSJed Brown             fomega        = x[j][i].omega + (x[j][i].u - x[j-1][i].u)*dhy - bjiomega;
618c4762a1bSJed Brown             ftemp         = x[j][i].temp-x[j-1][i].temp - bjitemp;
619c4762a1bSJed Brown             yo            = fomega;
620c4762a1bSJed Brown             yt            = ftemp;
621c4762a1bSJed Brown             x[j][i].omega = x[j][i].omega - fomega;
622c4762a1bSJed Brown             x[j][i].temp  = x[j][i].temp - ftemp;
623c4762a1bSJed Brown           }
624c4762a1bSJed Brown           tot_its++;
625c4762a1bSJed Brown           pfnorm = PetscRealPart(fu*fu + fv*fv + fomega*fomega + ftemp*ftemp);
626c4762a1bSJed Brown           pfnorm = PetscSqrtReal(pfnorm);
627c4762a1bSJed Brown           pynorm = PetscRealPart(yu*yu + yv*yv + yo*yo + yt*yt);
628c4762a1bSJed Brown           pynorm = PetscSqrtReal(pynorm);
629c4762a1bSJed Brown           pxnorm = PetscRealPart(x[j][i].u*x[j][i].u + x[j][i].v*x[j][i].v + x[j][i].omega*x[j][i].omega + x[j][i].temp*x[j][i].temp);
630c4762a1bSJed Brown           pxnorm = PetscSqrtReal(pxnorm);
631c4762a1bSJed Brown           if (l == 0) pfnorm0 = pfnorm;
632c4762a1bSJed Brown           if (rtol*pfnorm0 >pfnorm || atol > pfnorm || pxnorm*stol > pynorm) ptconverged = PETSC_TRUE;
633c4762a1bSJed Brown         }
634c4762a1bSJed Brown       }
635c4762a1bSJed Brown     }
636c4762a1bSJed Brown   }
637c4762a1bSJed Brown   ierr = DMDAVecRestoreArrayWrite(da,localX,&x);CHKERRQ(ierr);
638c4762a1bSJed Brown   if (B) {
639c4762a1bSJed Brown     ierr = DMDAVecRestoreArrayRead(da,localB,&b);CHKERRQ(ierr);
640c4762a1bSJed Brown   }
641c4762a1bSJed Brown   ierr = DMLocalToGlobalBegin(da,localX,INSERT_VALUES,X);CHKERRQ(ierr);
642c4762a1bSJed Brown   ierr = DMLocalToGlobalEnd(da,localX,INSERT_VALUES,X);CHKERRQ(ierr);
643c4762a1bSJed Brown   ierr = PetscLogFlops(tot_its*(84.0 + 41.0 + 26.0));CHKERRQ(ierr);
644c4762a1bSJed Brown   ierr = DMRestoreLocalVector(da,&localX);CHKERRQ(ierr);
645c4762a1bSJed Brown   if (B) {
646c4762a1bSJed Brown     ierr = DMRestoreLocalVector(da,&localB);CHKERRQ(ierr);
647c4762a1bSJed Brown   }
648c4762a1bSJed Brown   PetscFunctionReturn(0);
649c4762a1bSJed Brown }
650c4762a1bSJed Brown 
651c4762a1bSJed Brown 
652c4762a1bSJed Brown /*TEST
653c4762a1bSJed Brown 
654c4762a1bSJed Brown    test:
655c4762a1bSJed Brown       nsize: 2
656c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full
657c4762a1bSJed Brown       requires: !single
658c4762a1bSJed Brown 
659c4762a1bSJed Brown    test:
660c4762a1bSJed Brown       suffix: 10
661c4762a1bSJed Brown       nsize: 3
662c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type symmetric_multiplicative -snes_view -da_refine 1 -ksp_type fgmres
663c4762a1bSJed Brown       requires: !single
664c4762a1bSJed Brown 
665c4762a1bSJed Brown    test:
666c4762a1bSJed Brown       suffix: 11
667c4762a1bSJed Brown       nsize: 4
668c4762a1bSJed Brown       requires: pastix
669c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 2 -da_refine 4 -ksp_type fgmres
670c4762a1bSJed Brown 
671c4762a1bSJed Brown    test:
672c4762a1bSJed Brown       suffix: 12
673c4762a1bSJed Brown       nsize: 12
674c4762a1bSJed Brown       requires: pastix
675c4762a1bSJed Brown       args: -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_pc_factor_mat_solver_type pastix -pc_redundant_number 5 -da_refine 4 -ksp_type fgmres
676c4762a1bSJed Brown 
677c4762a1bSJed Brown    test:
678c4762a1bSJed Brown       suffix: 13
679c4762a1bSJed Brown       nsize: 3
680c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres -snes_mf_operator
681c4762a1bSJed Brown       requires: !single
682c4762a1bSJed Brown 
683c4762a1bSJed Brown    test:
684c4762a1bSJed Brown       suffix: 14
685c4762a1bSJed Brown       nsize: 4
686c4762a1bSJed Brown       args: -snes_monitor_short -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres
687c4762a1bSJed Brown       requires: !single
688c4762a1bSJed Brown 
689c4762a1bSJed Brown    test:
690c4762a1bSJed Brown       suffix: 14_ds
691c4762a1bSJed Brown       nsize: 4
692c4762a1bSJed Brown       args: -snes_converged_reason -pc_type mg -dm_mat_type baij -mg_coarse_pc_type bjacobi -da_refine 3 -ksp_type fgmres -mat_fd_type ds
693c4762a1bSJed Brown       output_file: output/ex19_2.out
694c4762a1bSJed Brown       requires: !single
695c4762a1bSJed Brown 
696c4762a1bSJed Brown    test:
697c4762a1bSJed Brown       suffix: 17
698c4762a1bSJed Brown       args: -snes_monitor_short -ksp_pc_side right
699c4762a1bSJed Brown       requires: !single
700c4762a1bSJed Brown 
701c4762a1bSJed Brown    test:
702c4762a1bSJed Brown       suffix: 18
703c4762a1bSJed Brown       args: -ksp_monitor_snes_lg -ksp_pc_side right
704c4762a1bSJed Brown       requires: x !single
705c4762a1bSJed Brown 
706c4762a1bSJed Brown    test:
707c4762a1bSJed Brown       suffix: 2
708c4762a1bSJed Brown       nsize: 4
709c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
710c4762a1bSJed Brown       requires: !single
711c4762a1bSJed Brown 
712c4762a1bSJed Brown    test:
713c4762a1bSJed Brown       suffix: 2_bcols1
714c4762a1bSJed Brown       nsize: 4
715c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols 1
716c4762a1bSJed Brown       output_file: output/ex19_2.out
717c4762a1bSJed Brown       requires: !single
718c4762a1bSJed Brown 
719c4762a1bSJed Brown    test:
720c4762a1bSJed Brown       suffix: 3
721c4762a1bSJed Brown       nsize: 4
722c4762a1bSJed Brown       requires: mumps
723c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 2
724c4762a1bSJed Brown 
725c4762a1bSJed Brown    test:
726c4762a1bSJed Brown       suffix: 4
727c4762a1bSJed Brown       nsize: 12
728c4762a1bSJed Brown       requires: mumps
729c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type redundant -dm_mat_type mpiaij -redundant_ksp_type preonly -redundant_pc_factor_mat_solver_type mumps -pc_redundant_number 5
730c4762a1bSJed Brown       output_file: output/ex19_3.out
731c4762a1bSJed Brown 
732c4762a1bSJed Brown    test:
733c4762a1bSJed Brown       suffix: 6
734c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -ksp_type fgmres -da_refine 1
735c4762a1bSJed Brown       requires: !single
736c4762a1bSJed Brown 
737c4762a1bSJed Brown    test:
738c4762a1bSJed Brown       suffix: 7
739c4762a1bSJed Brown       nsize: 3
740c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -snes_view -da_refine 1 -ksp_type fgmres
741c4762a1bSJed Brown       requires: !single
742c4762a1bSJed Brown 
743c4762a1bSJed Brown    test:
744c4762a1bSJed Brown       suffix: 8
745c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_block_size 2 -pc_fieldsplit_0_fields 0,1 -pc_fieldsplit_1_fields 0,1 -pc_fieldsplit_type multiplicative -snes_view -fieldsplit_pc_type lu -da_refine 1 -ksp_type fgmres
746c4762a1bSJed Brown       requires: !single
747c4762a1bSJed Brown 
748c4762a1bSJed Brown    test:
749c4762a1bSJed Brown       suffix: 9
750c4762a1bSJed Brown       nsize: 3
751c4762a1bSJed Brown       args: -snes_monitor_short -ksp_monitor_short -pc_type fieldsplit -pc_fieldsplit_type multiplicative -snes_view -da_refine 1 -ksp_type fgmres
752c4762a1bSJed Brown       requires: !single
753c4762a1bSJed Brown 
754c4762a1bSJed Brown    test:
755c4762a1bSJed Brown       suffix: aspin
756c4762a1bSJed Brown       nsize: 4
757c4762a1bSJed Brown       args: -da_refine 3 -da_overlap 2 -snes_monitor_short -snes_type aspin -grashof 4e4 -lidvelocity 100 -ksp_monitor_short
758c4762a1bSJed Brown       requires: !single
759c4762a1bSJed Brown 
760c4762a1bSJed Brown    test:
761c4762a1bSJed Brown       suffix: bcgsl
762c4762a1bSJed Brown       nsize: 2
763c4762a1bSJed Brown       args: -ksp_type bcgsl -ksp_monitor_short -da_refine 2 -ksp_bcgsl_ell 3 -snes_view
764c4762a1bSJed Brown       requires: !single
765c4762a1bSJed Brown 
766c4762a1bSJed Brown    test:
767c4762a1bSJed Brown       suffix: bcols1
768c4762a1bSJed Brown       nsize: 2
769c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -ksp_type fgmres -pc_mg_type full -mat_fd_coloring_bcols 1
770c4762a1bSJed Brown       output_file: output/ex19_1.out
771c4762a1bSJed Brown       requires: !single
772c4762a1bSJed Brown 
773c4762a1bSJed Brown    test:
774c4762a1bSJed Brown       suffix: bjacobi
775c4762a1bSJed Brown       nsize: 4
776c4762a1bSJed Brown       args: -da_refine 4 -ksp_type fgmres -pc_type bjacobi -pc_bjacobi_blocks 2 -sub_ksp_type gmres -sub_ksp_max_it 2 -sub_pc_type bjacobi -sub_sub_ksp_type preonly -sub_sub_pc_type ilu -snes_monitor_short
777c4762a1bSJed Brown       requires: !single
778c4762a1bSJed Brown 
779c4762a1bSJed Brown    test:
780c4762a1bSJed Brown       suffix: cgne
781c4762a1bSJed Brown       args: -da_refine 2 -pc_type lu -ksp_type cgne -ksp_monitor_short -ksp_converged_reason -ksp_view -ksp_norm_type unpreconditioned
782c4762a1bSJed Brown       filter: grep -v HERMITIAN
783c4762a1bSJed Brown       requires: !single
784c4762a1bSJed Brown 
785c4762a1bSJed Brown    test:
786c4762a1bSJed Brown       suffix: cgs
787c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type cgs
788c4762a1bSJed Brown       requires: !single
789c4762a1bSJed Brown 
790c4762a1bSJed Brown    test:
791c4762a1bSJed Brown       suffix: composite_fieldsplit
792c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,none -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
793c4762a1bSJed Brown       requires: !single
794c4762a1bSJed Brown 
795c4762a1bSJed Brown    test:
796c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi
797c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
798c4762a1bSJed Brown       requires: !single
799c4762a1bSJed Brown 
800c4762a1bSJed Brown    test:
801c4762a1bSJed Brown       suffix: composite_fieldsplit_bjacobi_2
802c4762a1bSJed Brown       nsize: 4
803c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type composite -pc_composite_type MULTIPLICATIVE -pc_composite_pcs fieldsplit,bjacobi -sub_0_pc_fieldsplit_block_size 4 -sub_0_pc_fieldsplit_type additive -sub_0_pc_fieldsplit_0_fields 0,1,2 -sub_0_pc_fieldsplit_1_fields 3 -sub_1_pc_bjacobi_blocks 16 -sub_1_sub_pc_type lu -snes_monitor_short -ksp_monitor_short
804c4762a1bSJed Brown       requires: !single
805c4762a1bSJed Brown 
806c4762a1bSJed Brown    test:
807c4762a1bSJed Brown       suffix: composite_gs_newton
808c4762a1bSJed Brown       nsize: 2
809c4762a1bSJed Brown       args: -da_refine 3 -grashof 4e4 -lidvelocity 100 -snes_monitor_short -snes_type composite -snes_composite_type additiveoptimal -snes_composite_sneses ngs,newtonls -sub_0_snes_max_it 20 -sub_1_pc_type mg
810c4762a1bSJed Brown       requires: !single
811c4762a1bSJed Brown 
812c4762a1bSJed Brown    test:
813c4762a1bSJed Brown       suffix: cuda
814c4762a1bSJed Brown       requires: cuda !single
815c4762a1bSJed Brown       args: -dm_vec_type cuda -dm_mat_type aijcusparse -pc_type none -ksp_type fgmres -snes_monitor_short -snes_rtol 1.e-5
816c4762a1bSJed Brown 
817c4762a1bSJed Brown    test:
818c4762a1bSJed Brown       suffix: draw
819c4762a1bSJed Brown       args: -pc_type fieldsplit -snes_view draw -fieldsplit_x_velocity_pc_type mg -fieldsplit_x_velocity_pc_mg_galerkin pmat -fieldsplit_x_velocity_pc_mg_levels 2 -da_refine 1 -fieldsplit_x_velocity_mg_coarse_pc_type svd
820c4762a1bSJed Brown       requires: x !single
821c4762a1bSJed Brown 
822c4762a1bSJed Brown    test:
823c4762a1bSJed Brown       suffix: drawports
824c4762a1bSJed Brown       args: -snes_monitor_solution draw::draw_ports -da_refine 1
825c4762a1bSJed Brown       output_file: output/ex19_draw.out
826c4762a1bSJed Brown       requires: x !single
827c4762a1bSJed Brown 
828c4762a1bSJed Brown    test:
829c4762a1bSJed Brown       suffix: fas
830c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
831c4762a1bSJed Brown       requires: !single
832c4762a1bSJed Brown 
833c4762a1bSJed Brown    test:
834c4762a1bSJed Brown       suffix: fas_full
835c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type fas -snes_fas_type full -snes_fas_full_downsweep -fas_levels_snes_type ngs -fas_levels_snes_ngs_sweeps 3 -fas_levels_snes_ngs_atol 0.0 -fas_levels_snes_ngs_stol 0.0 -grashof 4e4 -snes_fas_smoothup 6 -snes_fas_smoothdown 6 -lidvelocity 100
836c4762a1bSJed Brown       requires: !single
837c4762a1bSJed Brown 
838c4762a1bSJed Brown    test:
839c4762a1bSJed Brown       suffix: fdcoloring_ds
840c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds
841c4762a1bSJed Brown       output_file: output/ex19_2.out
842c4762a1bSJed Brown       requires: !single
843c4762a1bSJed Brown 
844c4762a1bSJed Brown    test:
845c4762a1bSJed Brown       suffix: fdcoloring_ds_baij
846c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -dm_mat_type baij
847c4762a1bSJed Brown       output_file: output/ex19_2.out
848c4762a1bSJed Brown       requires: !single
849c4762a1bSJed Brown 
850c4762a1bSJed Brown    test:
851c4762a1bSJed Brown       suffix: fdcoloring_ds_bcols1
852c4762a1bSJed Brown       args: -da_refine 3 -snes_converged_reason -pc_type mg -mat_fd_type ds -mat_fd_coloring_bcols 1
853c4762a1bSJed Brown       output_file: output/ex19_2.out
854c4762a1bSJed Brown       requires: !single
855c4762a1bSJed Brown 
856c4762a1bSJed Brown    test:
857c4762a1bSJed Brown       suffix: fdcoloring_wp
858c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg
859c4762a1bSJed Brown       requires: !single
860c4762a1bSJed Brown 
861c4762a1bSJed Brown    test:
862c4762a1bSJed Brown       suffix: fdcoloring_wp_baij
863c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -dm_mat_type baij
864c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
865c4762a1bSJed Brown       requires: !single
866c4762a1bSJed Brown 
867c4762a1bSJed Brown    test:
868c4762a1bSJed Brown       suffix: fdcoloring_wp_bcols1
869c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type mg -mat_fd_coloring_bcols 1
870c4762a1bSJed Brown       output_file: output/ex19_fdcoloring_wp.out
871c4762a1bSJed Brown       requires: !single
872c4762a1bSJed Brown 
873c4762a1bSJed Brown    test:
874c4762a1bSJed Brown       suffix: fieldsplit_2
875c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -snes_monitor_short -ksp_monitor_short
876c4762a1bSJed Brown       requires: !single
877c4762a1bSJed Brown 
878c4762a1bSJed Brown    test:
879c4762a1bSJed Brown       suffix: fieldsplit_3
880c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type additive -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
881c4762a1bSJed Brown       requires: !single
882c4762a1bSJed Brown 
883c4762a1bSJed Brown    test:
884c4762a1bSJed Brown       suffix: fieldsplit_4
885c4762a1bSJed Brown       args: -ksp_type fgmres -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short
886c4762a1bSJed Brown       requires: !single
887c4762a1bSJed Brown 
888c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
889c4762a1bSJed Brown    test:
890c4762a1bSJed Brown       suffix: fieldsplit_hypre
891c4762a1bSJed Brown       nsize: 2
892c4762a1bSJed Brown       requires: hypre mumps !complex
893c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_type hypre -fieldsplit_1_pc_hypre_type boomeramg -snes_monitor_short -ksp_monitor_short
894c4762a1bSJed Brown 
895c4762a1bSJed Brown    test:
896c4762a1bSJed Brown       suffix: fieldsplit_mumps
897c4762a1bSJed Brown       nsize: 2
898c4762a1bSJed Brown       requires: mumps
899c4762a1bSJed Brown       args: -pc_type fieldsplit -pc_fieldsplit_block_size 4 -pc_fieldsplit_type SCHUR -pc_fieldsplit_0_fields 0,1,2 -pc_fieldsplit_1_fields 3 -fieldsplit_0_pc_type lu -fieldsplit_1_pc_type lu -snes_monitor_short -ksp_monitor_short -fieldsplit_0_pc_factor_mat_solver_type mumps -fieldsplit_1_pc_factor_mat_solver_type mumps
900c4762a1bSJed Brown       output_file: output/ex19_fieldsplit_5.out
901c4762a1bSJed Brown 
902c4762a1bSJed Brown    test:
903c4762a1bSJed Brown       suffix: greedy_coloring
904c4762a1bSJed Brown       nsize: 2
905c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_fd_color -snes_fd_color_use_mat -mat_coloring_type greedy -mat_coloring_weight_type lf -mat_coloring_view> ex19_greedy_coloring.tmp 2>&1
906c4762a1bSJed Brown       requires: !single
907c4762a1bSJed Brown 
908c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
909c4762a1bSJed Brown    test:
910c4762a1bSJed Brown       suffix: hypre
911c4762a1bSJed Brown       nsize: 2
912c4762a1bSJed Brown       requires: hypre !complex
913c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type hypre
914c4762a1bSJed Brown 
915c4762a1bSJed Brown    test:
916c4762a1bSJed Brown       suffix: ibcgs
917c4762a1bSJed Brown       nsize: 2
918c4762a1bSJed Brown       args: -ksp_type ibcgs -ksp_monitor_short -da_refine 2 -snes_view
919c4762a1bSJed Brown       requires: !complex !single
920c4762a1bSJed Brown 
921c4762a1bSJed Brown    test:
922c4762a1bSJed Brown       suffix: kaczmarz
923c4762a1bSJed Brown       nsize: 2
924c4762a1bSJed Brown       args: -pc_type kaczmarz -ksp_monitor_short -snes_monitor_short -snes_view
925c4762a1bSJed Brown       requires: !single
926c4762a1bSJed Brown 
927c4762a1bSJed Brown    test:
928c4762a1bSJed Brown       suffix: klu
929c4762a1bSJed Brown       requires: suitesparse
930c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu
931c4762a1bSJed Brown       output_file: output/ex19_superlu.out
932c4762a1bSJed Brown 
933c4762a1bSJed Brown    test:
934c4762a1bSJed Brown       suffix: klu_2
935c4762a1bSJed Brown       requires: suitesparse
936c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -mat_klu_ordering PETSC
937c4762a1bSJed Brown       output_file: output/ex19_superlu.out
938c4762a1bSJed Brown 
939c4762a1bSJed Brown    test:
940c4762a1bSJed Brown       suffix: klu_3
941c4762a1bSJed Brown       requires: suitesparse
942c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type klu -mat_klu_use_btf 0
943c4762a1bSJed Brown       output_file: output/ex19_superlu.out
944c4762a1bSJed Brown 
945c4762a1bSJed Brown    test:
946c4762a1bSJed Brown       suffix: ml
947c4762a1bSJed Brown       nsize: 2
948c4762a1bSJed Brown       requires: ml
949c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -pc_type ml
950c4762a1bSJed Brown 
951c4762a1bSJed Brown    test:
952c4762a1bSJed Brown       suffix: ngmres_fas
953c4762a1bSJed Brown       args: -da_refine 4 -snes_monitor_short -snes_type ngmres -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_ngs_sweeps 3 -npc_fas_levels_snes_ngs_atol 0.0 -npc_fas_levels_snes_ngs_stol 0.0 -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_snes_max_it 1 -npc_snes_fas_smoothup 6 -npc_snes_fas_smoothdown 6 -lidvelocity 100 -grashof 4e4
954c4762a1bSJed Brown       requires: !single
955c4762a1bSJed Brown 
956c4762a1bSJed Brown    test:
957c4762a1bSJed Brown       suffix: ngmres_fas_gssecant
958c4762a1bSJed Brown       args: -da_refine 3 -snes_monitor_short -snes_type ngmres -npc_snes_type fas -npc_fas_levels_snes_type ngs -npc_fas_levels_snes_max_it 6 -npc_fas_levels_snes_ngs_secant -npc_fas_levels_snes_ngs_max_it 1 -npc_fas_coarse_snes_max_it 1 -lidvelocity 100 -grashof 4e4
959c4762a1bSJed Brown       requires: !single
960c4762a1bSJed Brown 
961c4762a1bSJed Brown    test:
962c4762a1bSJed Brown       suffix: ngmres_fas_ms
963c4762a1bSJed Brown       nsize: 2
964c4762a1bSJed Brown       args: -snes_grid_sequence 2 -lidvelocity 200 -grashof 1e4 -snes_monitor_short -snes_view -snes_converged_reason -snes_type ngmres -npc_snes_type fas -npc_fas_coarse_snes_type newtonls -npc_fas_coarse_ksp_type preonly -npc_snes_max_it 1
965c4762a1bSJed Brown       requires: !single
966c4762a1bSJed Brown 
967c4762a1bSJed Brown    test:
968c4762a1bSJed Brown       suffix: ngmres_nasm
969c4762a1bSJed Brown       nsize: 4
970c4762a1bSJed Brown       args: -da_refine 4 -da_overlap 2 -snes_monitor_short -snes_type ngmres -snes_max_it 10 -npc_snes_type nasm -npc_snes_nasm_type basic -grashof 4e4 -lidvelocity 100
971c4762a1bSJed Brown       requires: !single
972c4762a1bSJed Brown 
973c4762a1bSJed Brown    test:
974c4762a1bSJed Brown       suffix: ngs
975c4762a1bSJed Brown       args: -snes_type ngs -snes_view -snes_monitor -snes_rtol 1e-4
976c4762a1bSJed Brown       requires: !single
977c4762a1bSJed Brown 
978c4762a1bSJed Brown    test:
979c4762a1bSJed Brown       suffix: ngs_fd
980c4762a1bSJed Brown       args: -snes_type ngs -snes_ngs_secant -snes_view -snes_monitor -snes_rtol 1e-4
981c4762a1bSJed Brown       requires: !single
982c4762a1bSJed Brown 
983c4762a1bSJed Brown    test:
984c4762a1bSJed Brown       suffix: parms
985c4762a1bSJed Brown       nsize: 2
986c4762a1bSJed Brown       requires: parms
987c4762a1bSJed Brown       args: -pc_type parms -ksp_monitor_short -snes_view
988c4762a1bSJed Brown 
989c4762a1bSJed Brown    test:
990c4762a1bSJed Brown       suffix: superlu
991c4762a1bSJed Brown       requires: superlu
992c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu
993c4762a1bSJed Brown 
994c4762a1bSJed Brown    test:
995c4762a1bSJed Brown       suffix: superlu_sell
996c4762a1bSJed Brown       requires: superlu
997c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu -dm_mat_type sell -pc_factor_mat_ordering_type natural
998c4762a1bSJed Brown       output_file: output/ex19_superlu.out
999c4762a1bSJed Brown 
1000c4762a1bSJed Brown    test:
1001c4762a1bSJed Brown       suffix: superlu_dist
1002c4762a1bSJed Brown       requires: superlu_dist
1003c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1004c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1005c4762a1bSJed Brown 
1006c4762a1bSJed Brown    test:
1007c4762a1bSJed Brown       suffix: superlu_dist_2
1008c4762a1bSJed Brown       nsize: 2
1009c4762a1bSJed Brown       requires: superlu_dist
1010c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -pc_type lu -pc_factor_mat_solver_type superlu_dist
1011c4762a1bSJed Brown       output_file: output/ex19_superlu.out
1012c4762a1bSJed Brown 
1013c4762a1bSJed Brown    test:
1014c4762a1bSJed Brown       suffix: superlu_equil
1015c4762a1bSJed Brown       requires: superlu
1016c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil
1017c4762a1bSJed Brown 
1018c4762a1bSJed Brown    test:
1019c4762a1bSJed Brown       suffix: superlu_equil_sell
1020c4762a1bSJed Brown       requires: superlu
1021c4762a1bSJed Brown       args: -da_grid_x 20 -da_grid_y 20 -{snes,ksp}_monitor_short -pc_type lu -pc_factor_mat_solver_type superlu -mat_superlu_equil -dm_mat_type sell -pc_factor_mat_ordering_type natural
1022c4762a1bSJed Brown       output_file: output/ex19_superlu_equil.out
1023c4762a1bSJed Brown 
1024c4762a1bSJed Brown    test:
1025c4762a1bSJed Brown       suffix: tcqmr
1026c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tcqmr
1027c4762a1bSJed Brown       requires: !single
1028c4762a1bSJed Brown 
1029c4762a1bSJed Brown    test:
1030c4762a1bSJed Brown       suffix: tfqmr
1031c4762a1bSJed Brown       args: -da_refine 1 -ksp_monitor_short -ksp_type tfqmr
1032c4762a1bSJed Brown       requires: !single
1033c4762a1bSJed Brown 
1034c4762a1bSJed Brown    test:
1035c4762a1bSJed Brown       suffix: umfpack
1036c4762a1bSJed Brown       requires: suitesparse
1037*2c7c0729SBarry Smith       args: -da_refine 2 -pc_type lu -pc_factor_mat_solver_type umfpack -snes_view -snes_monitor_short -ksp_monitor_short -pc_factor_mat_ordering_type external
1038c4762a1bSJed Brown 
1039c4762a1bSJed Brown    test:
1040c4762a1bSJed Brown       suffix: tut_1
1041c4762a1bSJed Brown       nsize: 4
1042c4762a1bSJed Brown       requires: !single
1043c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view
1044c4762a1bSJed Brown 
1045c4762a1bSJed Brown    test:
1046c4762a1bSJed Brown       suffix: tut_2
1047c4762a1bSJed Brown       nsize: 4
1048c4762a1bSJed Brown       requires: !single
1049c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type mg
1050c4762a1bSJed Brown 
1051c4762a1bSJed Brown    # HYPRE PtAP broken with complex numbers
1052c4762a1bSJed Brown    test:
1053c4762a1bSJed Brown       suffix: tut_3
1054c4762a1bSJed Brown       nsize: 4
1055c4762a1bSJed Brown       requires: hypre !single !complex
1056c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type hypre
1057c4762a1bSJed Brown 
1058c4762a1bSJed Brown    test:
1059c4762a1bSJed Brown       suffix: tut_8
1060c4762a1bSJed Brown       nsize: 4
1061c4762a1bSJed Brown       requires: ml !single
1062c4762a1bSJed Brown       args: -da_refine 5 -snes_monitor -ksp_monitor -snes_view -pc_type ml
1063c4762a1bSJed Brown 
1064c4762a1bSJed Brown    test:
1065c4762a1bSJed Brown       suffix: tut_4
1066c4762a1bSJed Brown       nsize: 1
1067c4762a1bSJed Brown       requires: !single
1068c4762a1bSJed Brown       args: -da_refine 5 -log_view
1069c4762a1bSJed Brown       filter: head -n 2
1070c4762a1bSJed Brown       filter_output: head -n 2
1071c4762a1bSJed Brown 
1072c4762a1bSJed Brown    test:
1073c4762a1bSJed Brown       suffix: tut_5
1074c4762a1bSJed Brown       nsize: 1
1075c4762a1bSJed Brown       requires: !single
1076c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1077c4762a1bSJed Brown       filter: head -n 2
1078c4762a1bSJed Brown       filter_output: head -n 2
1079c4762a1bSJed Brown 
1080c4762a1bSJed Brown    test:
1081c4762a1bSJed Brown       suffix: tut_6
1082c4762a1bSJed Brown       nsize: 4
1083c4762a1bSJed Brown       requires: !single
1084c4762a1bSJed Brown       args: -da_refine 5 -log_view
1085c4762a1bSJed Brown       filter: head -n 2
1086c4762a1bSJed Brown       filter_output: head -n 2
1087c4762a1bSJed Brown 
1088c4762a1bSJed Brown    test:
1089c4762a1bSJed Brown       suffix: tut_7
1090c4762a1bSJed Brown       nsize: 4
1091c4762a1bSJed Brown       requires: !single
1092c4762a1bSJed Brown       args: -da_refine 5 -log_view -pc_type mg
1093c4762a1bSJed Brown       filter: head -n 2
1094c4762a1bSJed Brown       filter_output: head -n 2
1095c4762a1bSJed Brown 
1096c4762a1bSJed Brown    test:
1097c4762a1bSJed Brown       suffix: cuda_1
1098c4762a1bSJed Brown       nsize: 1
1099c4762a1bSJed Brown       requires: cuda
1100c4762a1bSJed Brown       args: -snes_monitor -dm_mat_type seqaijcusparse -dm_vec_type seqcuda -pc_type gamg -ksp_monitor -mg_levels_ksp_max_it 3
1101c4762a1bSJed Brown 
1102c4762a1bSJed Brown 
1103c4762a1bSJed Brown    test:
1104c4762a1bSJed Brown       suffix: cuda_2
1105c4762a1bSJed Brown       nsize: 3
1106c4762a1bSJed Brown       requires: cuda !single
1107c4762a1bSJed Brown       args: -snes_monitor -dm_mat_type mpiaijcusparse -dm_vec_type mpicuda -pc_type gamg -ksp_monitor  -mg_levels_ksp_max_it 3
1108c4762a1bSJed Brown 
1109c4762a1bSJed Brown    test:
1110c4762a1bSJed Brown       suffix: seqbaijmkl
1111c4762a1bSJed Brown       nsize: 1
1112c4762a1bSJed Brown       requires: define(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1113c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1114c4762a1bSJed Brown 
1115c4762a1bSJed Brown    test:
1116c4762a1bSJed Brown       suffix: mpibaijmkl
1117c4762a1bSJed Brown       nsize: 2
1118c4762a1bSJed Brown       requires: define(PETSC_HAVE_MKL_SPARSE_OPTIMIZE)
1119c4762a1bSJed Brown       args: -dm_mat_type baij -snes_monitor -ksp_monitor -snes_view
1120c4762a1bSJed Brown 
1121c4762a1bSJed Brown    test:
1122c4762a1bSJed Brown      suffix: cpardiso
1123c4762a1bSJed Brown      nsize: 4
1124c4762a1bSJed Brown      requires: mkl_cpardiso
1125c4762a1bSJed Brown      args: -pc_type lu -pc_factor_mat_solver_type mkl_cpardiso -ksp_monitor
1126c4762a1bSJed Brown 
1127c4762a1bSJed Brown    test:
1128c4762a1bSJed Brown      suffix: logviewmemory
1129c4762a1bSJed Brown      requires: define(PETSC_USE_LOG) !define(PETSC_HAVE_VALGRIND)
1130c4762a1bSJed Brown      args: -log_view -log_view_memory -da_refine 4
1131c4762a1bSJed Brown      filter: grep MatFDColorSetUp | wc -w | xargs  -I % sh -c "expr % \> 21"
1132c4762a1bSJed Brown 
1133c4762a1bSJed Brown TEST*/
1134