/*
   Provides an interface to the ML 3.0 smoothed aggregation preconditioner
*/
#include "src/ksp/pc/pcimpl.h"   /*I "petscpc.h" I*/
#include "src/ksp/pc/impls/mg/mgimpl.h"                    /*I "petscmg.h" I*/
#include "src/mat/impls/aij/seq/aij.h"
#include "src/mat/impls/aij/mpi/mpiaij.h"

EXTERN_C_BEGIN
#include <math.h>
#include "ml_include.h"
EXTERN_C_END

/* The context (data structure) at each grid level */
typedef struct {
  Vec        x,b,r;            /* global vectors */
  Mat        A,P,R;
  KSP        ksp;
} GridCtx;

/* The context used to pass the PETSc fine-grid matrix to ML */
typedef struct {
  Mat          A,Aloc;
  Vec          x,y;
  ML_Operator  *mlmat;
  PetscScalar  *pwork; /* tmp array used by PetscML_comm() */
} FineGridCtx;

/* The context that associates an ML matrix with a PETSc shell matrix */
typedef struct {
  Mat          A;       /* PETSc shell matrix associated with mlmat */
  ML_Operator  *mlmat;  /* ML matrix associated with A */
  Vec          y;
} Mat_MLShell;

/* Private context for the ML preconditioner */
typedef struct {
  ML           *ml_object;
  ML_Aggregate *agg_object;
  GridCtx      *gridctx;
  FineGridCtx  *PetscMLdata;
  PetscInt     fine_level,MaxNlevels,MaxCoarseSize,CoarsenScheme;
  PetscReal    Threshold,DampingFactor;
  PetscTruth   SpectralNormScheme_Anorm;
  PetscMPIInt  size;
  PetscErrorCode (*PCSetUp)(PC);
  PetscErrorCode (*PCDestroy)(PC);
} PC_ML;

extern int PetscML_getrow(void *ML_data,int N_requested_rows,int requested_rows[],
            int allocated_space,int columns[],double values[],int row_lengths[]);
extern int PetscML_matvec(void *ML_data,int in_length,double p[],int out_length,double ap[]);
extern int PetscML_comm(double x[],void *ML_data);
extern PetscErrorCode MatMult_ML(Mat,Vec,Vec);
extern PetscErrorCode MatMultAdd_ML(Mat,Vec,Vec,Vec);
extern PetscErrorCode MatConvert_MPIAIJ_ML(Mat,const MatType,MatReuse,Mat*);
extern PetscErrorCode MatDestroy_ML(Mat);
extern PetscErrorCode MatWrapML_SeqAIJ(ML_Operator*,Mat*);
extern PetscErrorCode MatWrapML_MPIAIJ(ML_Operator*,Mat*);
extern PetscErrorCode MatWrapML_SHELL(ML_Operator*,Mat*);

/* -------------------------------------------------------------------------- */
/*
   PCSetUp_ML - Prepares for the use of the ML preconditioner
                by setting up the data structures and options.

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCSetUp()

   Notes:
   The interface routine PCSetUp() is not usually called directly by
   the user, but instead is called by PCApply() if necessary.
*/

#undef __FUNCT__
#define __FUNCT__ "PCSetUp_ML"
static PetscErrorCode PCSetUp_ML(PC pc)
{
  PetscErrorCode       ierr;
  PetscMPIInt          size;
  FineGridCtx          *PetscMLdata;
  ML                   *ml_object;
  ML_Aggregate         *agg_object;
  ML_Operator          *mlmat;
  PetscInt             nlocal_allcols,Nlevels,mllevel,level,m,fine_level;
  Mat                  A,Aloc;
  GridCtx              *gridctx;
  PC_ML                *pc_ml=PETSC_NULL;
  PetscObjectContainer container;

  PetscFunctionBegin;
  ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr);
  if (container) {
    ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr);
  } else {
    SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exist");
  }

  /* set up the special features of PCML */
  /*--------------------------------*/
  /* convert A to Aloc to be used by ML at the fine grid */
  A = pc->pmat;
  ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr);
  pc_ml->size = size;
  if (size > 1){
    ierr = MatConvert_MPIAIJ_ML(A,PETSC_NULL,MAT_INITIAL_MATRIX,&Aloc);CHKERRQ(ierr);
  } else {
    Aloc = A;
  }

  /* create and initialize struct 'PetscMLdata' */
  ierr = PetscNew(FineGridCtx,&PetscMLdata);CHKERRQ(ierr);
  PetscMLdata->A    = A;
  PetscMLdata->Aloc = Aloc;
  ierr = PetscMalloc((Aloc->n+1)*sizeof(PetscScalar),&PetscMLdata->pwork);CHKERRQ(ierr);
  pc_ml->PetscMLdata = PetscMLdata;

  ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->x);CHKERRQ(ierr);
  if (size == 1){
    ierr = VecSetSizes(PetscMLdata->x,A->n,PETSC_DECIDE);CHKERRQ(ierr);
  } else {
    ierr = VecSetSizes(PetscMLdata->x,Aloc->n,PETSC_DECIDE);CHKERRQ(ierr);
  }
  ierr = VecSetType(PetscMLdata->x,VECSEQ);CHKERRQ(ierr);

  ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->y);CHKERRQ(ierr);
  ierr = VecSetSizes(PetscMLdata->y,A->m,PETSC_DECIDE);CHKERRQ(ierr);
  ierr = VecSetType(PetscMLdata->y,VECSEQ);CHKERRQ(ierr);

  /* create ML discretization matrix at fine grid */
  ierr = MatGetSize(Aloc,&m,&nlocal_allcols);CHKERRQ(ierr);
  ML_Create(&ml_object,pc_ml->MaxNlevels);
  ML_Init_Amatrix(ml_object,0,m,m,PetscMLdata);
  ML_Set_Amatrix_Getrow(ml_object,0,PetscML_getrow,PetscML_comm,nlocal_allcols);
  ML_Set_Amatrix_Matvec(ml_object,0,PetscML_matvec);

  /* aggregation */
  ML_Aggregate_Create(&agg_object);
  ML_Aggregate_Set_MaxCoarseSize(agg_object,pc_ml->MaxCoarseSize);
  /* set options */
  switch (pc_ml->CoarsenScheme) {
  case 1:
    ML_Aggregate_Set_CoarsenScheme_Coupled(agg_object);break;
  case 2:
    ML_Aggregate_Set_CoarsenScheme_MIS(agg_object);break;
  case 3:
    ML_Aggregate_Set_CoarsenScheme_METIS(agg_object);break;
  }
  ML_Aggregate_Set_Threshold(agg_object,pc_ml->Threshold);
  ML_Aggregate_Set_DampingFactor(agg_object,pc_ml->DampingFactor);
  if (pc_ml->SpectralNormScheme_Anorm){
    ML_Aggregate_Set_SpectralNormScheme_Anorm(agg_object);
  }

  Nlevels = ML_Gen_MGHierarchy_UsingAggregation(ml_object,0,ML_INCREASING,agg_object);
  if (Nlevels<=0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Nlevels %d must be > 0",Nlevels);
  ierr = MGSetLevels(pc,Nlevels,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->ml_object  = ml_object;
  pc_ml->agg_object = agg_object;

  ierr = PetscMalloc(Nlevels*sizeof(GridCtx),&gridctx);CHKERRQ(ierr);
  fine_level = Nlevels - 1;
  pc_ml->gridctx = gridctx;
  pc_ml->fine_level = fine_level;

  /* wrap the ML matrices in PETSc matrices on the coarsened grids.
     Level 0 is the finest grid for ML, but the coarsest for PETSc! */
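  /* Added illustration: with, say, Nlevels = 4 and fine_level = 3, ML level
     mllevel corresponds to PETSc level = fine_level - mllevel:
         mllevel:      0   1   2   3    (0 = ML's finest)
         PETSc level:  3   2   1   0    (0 = PETSc's coarsest)
     which is why the loops below advance mllevel upward while level counts down. */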
  gridctx[fine_level].A = A;
  level = fine_level - 1;
  if (size == 1){ /* convert ML P, R and A into seqaij format */
    for (mllevel=1; mllevel<Nlevels; mllevel++){
      mlmat  = &(ml_object->Pmat[mllevel]);
      ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].P);CHKERRQ(ierr);
      mlmat  = &(ml_object->Amat[mllevel]);
      ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].A);CHKERRQ(ierr);
      mlmat  = &(ml_object->Rmat[mllevel-1]);
      ierr = MatWrapML_SeqAIJ(mlmat,&gridctx[level].R);CHKERRQ(ierr);
      level--;
    }
  } else { /* convert ML P and R into shell format, ML A into mpiaij format */
    for (mllevel=1; mllevel<Nlevels; mllevel++){
      mlmat  = &(ml_object->Pmat[mllevel]);
      ierr = MatWrapML_SHELL(mlmat,&gridctx[level].P);CHKERRQ(ierr);
      mlmat  = &(ml_object->Rmat[mllevel-1]);
      ierr = MatWrapML_SHELL(mlmat,&gridctx[level].R);CHKERRQ(ierr);
      mlmat  = &(ml_object->Amat[mllevel]);
      ierr = MatWrapML_MPIAIJ(mlmat,&gridctx[level].A);CHKERRQ(ierr);
      level--;
    }
  }

  /* create the work vectors and smoothers on each level, and the interpolation between the levels */
  level = fine_level;
  while (level >= 0){
    if (level != fine_level){
      ierr = VecCreate(gridctx[level].A->comm,&gridctx[level].x);CHKERRQ(ierr);
      ierr = VecSetSizes(gridctx[level].x,gridctx[level].A->n,PETSC_DECIDE);CHKERRQ(ierr);
      ierr = VecSetType(gridctx[level].x,VECMPI);CHKERRQ(ierr);
      ierr = MGSetX(pc,level,gridctx[level].x);CHKERRQ(ierr);

      ierr = VecCreate(gridctx[level].A->comm,&gridctx[level].b);CHKERRQ(ierr);
      ierr = VecSetSizes(gridctx[level].b,gridctx[level].A->m,PETSC_DECIDE);CHKERRQ(ierr);
      ierr = VecSetType(gridctx[level].b,VECMPI);CHKERRQ(ierr);
      ierr = MGSetRhs(pc,level,gridctx[level].b);CHKERRQ(ierr);
    }
    ierr = VecCreate(gridctx[level].A->comm,&gridctx[level].r);CHKERRQ(ierr);
    ierr = VecSetSizes(gridctx[level].r,gridctx[level].A->m,PETSC_DECIDE);CHKERRQ(ierr);
    ierr = VecSetType(gridctx[level].r,VECMPI);CHKERRQ(ierr);
    ierr = MGSetR(pc,level,gridctx[level].r);CHKERRQ(ierr);

    if (level == 0){
      ierr = MGGetCoarseSolve(pc,&gridctx[level].ksp);CHKERRQ(ierr);
    } else {
      ierr = MGGetSmoother(pc,level,&gridctx[level].ksp);CHKERRQ(ierr);
      ierr = MGSetResidual(pc,level,MGDefaultResidual,gridctx[level].A);CHKERRQ(ierr);
      if (level == fine_level){
        ierr = KSPSetOptionsPrefix(gridctx[level].ksp,"mg_fine_");CHKERRQ(ierr);
        ierr = MGSetR(pc,level,gridctx[level].r);CHKERRQ(ierr);
      }
    }
    ierr = KSPSetOperators(gridctx[level].ksp,gridctx[level].A,gridctx[level].A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);

    if (level < fine_level){
      ierr = MGSetInterpolate(pc,level+1,gridctx[level].P);CHKERRQ(ierr);
      ierr = MGSetRestriction(pc,level+1,gridctx[level].R);CHKERRQ(ierr);
    }
    level--;
  }

  /* now call PCSetUp_MG() */
  /*-----------------------*/
  ierr = (*pc_ml->PCSetUp)(pc);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "PetscObjectContainerDestroy_PC_ML"
PetscErrorCode PetscObjectContainerDestroy_PC_ML(void *ptr)
{
  PetscErrorCode       ierr;
  PC_ML                *pc_ml = (PC_ML*)ptr;
  PetscInt             level;

  PetscFunctionBegin;
  if (pc_ml->size > 1){ierr = MatDestroy(pc_ml->PetscMLdata->Aloc);CHKERRQ(ierr);}
  ML_Aggregate_Destroy(&pc_ml->agg_object);
  ML_Destroy(&pc_ml->ml_object);

  ierr = PetscFree(pc_ml->PetscMLdata->pwork);CHKERRQ(ierr);
  ierr = VecDestroy(pc_ml->PetscMLdata->x);CHKERRQ(ierr);
  ierr = VecDestroy(pc_ml->PetscMLdata->y);CHKERRQ(ierr);
  ierr = PetscFree(pc_ml->PetscMLdata);CHKERRQ(ierr);

  level = pc_ml->fine_level;
  while (level >= 0){
    if (level != pc_ml->fine_level){
      ierr = MatDestroy(pc_ml->gridctx[level].A);CHKERRQ(ierr);
      ierr = MatDestroy(pc_ml->gridctx[level].P);CHKERRQ(ierr);
      ierr = MatDestroy(pc_ml->gridctx[level].R);CHKERRQ(ierr);
      ierr = VecDestroy(pc_ml->gridctx[level].x);CHKERRQ(ierr);
      ierr = VecDestroy(pc_ml->gridctx[level].b);CHKERRQ(ierr);
    }
    ierr = VecDestroy(pc_ml->gridctx[level].r);CHKERRQ(ierr);
    level--;
  }
  ierr = PetscFree(pc_ml->gridctx);CHKERRQ(ierr);
  ierr = PetscFree(pc_ml);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
/* -------------------------------------------------------------------------- */
/*
   PCDestroy_ML - Destroys the private context for the ML preconditioner
   that was created with PCCreate_ML().

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCDestroy()
*/
#undef __FUNCT__
#define __FUNCT__ "PCDestroy_ML"
static PetscErrorCode PCDestroy_ML(PC pc)
{
  PetscErrorCode       ierr;
  PC_ML                *pc_ml=PETSC_NULL;
  PetscObjectContainer container;

  PetscFunctionBegin;
  ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr);
  if (container) {
    ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr);
    pc->ops->destroy = pc_ml->PCDestroy;
  } else {
    SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exist");
  }
  /* detach pc from PC_ML and dereference the container */
  ierr = PetscObjectCompose((PetscObject)pc,"PC_ML",0);CHKERRQ(ierr);
  ierr = (*pc->ops->destroy)(pc);CHKERRQ(ierr);

  ierr = PetscObjectContainerDestroy(container);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "PCSetFromOptions_ML"
static PetscErrorCode PCSetFromOptions_ML(PC pc)
{
  PetscErrorCode ierr;
  PetscInt       indx,m,PrintLevel,MaxNlevels,MaxCoarseSize;
  PetscReal      Threshold,DampingFactor;
  PetscTruth     flg;
  const char     *type[] = {"additive","multiplicative","full","cascade","kascade"};
  const char     *scheme[] = {"Uncoupled","Coupled","MIS","METIS"};
  PC_ML          *pc_ml=PETSC_NULL;
  PetscObjectContainer container;

  PetscFunctionBegin;
  ierr = PetscObjectQuery((PetscObject)pc,"PC_ML",(PetscObject *)&container);CHKERRQ(ierr);
  if (container) {
    ierr = PetscObjectContainerGetPointer(container,(void **)&pc_ml);CHKERRQ(ierr);
  } else {
    SETERRQ(PETSC_ERR_ARG_NULL,"Container does not exist");
  }
  ierr = PetscOptionsHead("MG options");CHKERRQ(ierr);
  /* inherited MG options */
  ierr = PetscOptionsInt("-pc_mg_cycles","1 for V cycle, 2 for W-cycle","MGSetCycles",1,&m,&flg);CHKERRQ(ierr);
  if (flg) {
    ierr = MGSetCycles(pc,m);CHKERRQ(ierr);
  }
  ierr = PetscOptionsInt("-pc_mg_smoothup","Number of post-smoothing steps","MGSetNumberSmoothUp",1,&m,&flg);CHKERRQ(ierr);
  if (flg) {
    ierr = MGSetNumberSmoothUp(pc,m);CHKERRQ(ierr);
  }
  ierr = PetscOptionsInt("-pc_mg_smoothdown","Number of pre-smoothing steps","MGSetNumberSmoothDown",1,&m,&flg);CHKERRQ(ierr);
  if (flg) {
    ierr = MGSetNumberSmoothDown(pc,m);CHKERRQ(ierr);
  }
  ierr = PetscOptionsEList("-pc_mg_type","Multigrid type","MGSetType",type,5,type[1],&indx,&flg);CHKERRQ(ierr);
  if (flg) {
    MGType mg = (MGType) 0;
    switch (indx) {
    case 0:
      mg = MGADDITIVE;
      break;
    case 1:
      mg = MGMULTIPLICATIVE;
      break;
    case 2:
      mg = MGFULL;
      break;
    case 3:
      mg = MGKASKADE;
      break;
    case 4:
      mg = MGKASKADE;
      break;
    }
    ierr = MGSetType(pc,mg);CHKERRQ(ierr);
  }
  ierr = PetscOptionsTail();CHKERRQ(ierr);

  /* ML options */
  ierr = PetscOptionsHead("ML options");CHKERRQ(ierr);
  /* set defaults */
  PrintLevel    = 0;
  MaxNlevels    = 10;
  MaxCoarseSize = 1;
  indx          = 0;
  Threshold     = 0.0;
  DampingFactor = 4.0/3.0;
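  /* Note (added commentary): 4/3 is the customary smoothed-aggregation damping;
     ML divides DampingFactor by its estimate of the spectral radius of D^{-1}A
     when smoothing the tentative prolongator. */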

  ierr = PetscOptionsInt("-pc_ml_PrintLevel","Print level","ML_Set_PrintLevel",PrintLevel,&PrintLevel,PETSC_NULL);CHKERRQ(ierr);
  ML_Set_PrintLevel(PrintLevel);

  ierr = PetscOptionsInt("-pc_ml_maxNlevels","Maximum number of levels","None",MaxNlevels,&MaxNlevels,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->MaxNlevels = MaxNlevels;

  ierr = PetscOptionsInt("-pc_ml_maxCoarseSize","Maximum coarsest mesh size","ML_Aggregate_Set_MaxCoarseSize",MaxCoarseSize,&MaxCoarseSize,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->MaxCoarseSize = MaxCoarseSize;

  ierr = PetscOptionsEList("-pc_ml_CoarsenScheme","Aggregate coarsening scheme","ML_Aggregate_Set_CoarsenScheme_*",scheme,4,scheme[0],&indx,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->CoarsenScheme = indx;

  ierr = PetscOptionsReal("-pc_ml_DampingFactor","P damping factor","ML_Aggregate_Set_DampingFactor",DampingFactor,&DampingFactor,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->DampingFactor = DampingFactor;

  ierr = PetscOptionsReal("-pc_ml_Threshold","Smoother drop tolerance","ML_Aggregate_Set_Threshold",Threshold,&Threshold,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->Threshold = Threshold;

  ierr = PetscOptionsLogical("-pc_ml_SpectralNormScheme_Anorm","Method used for estimating spectral radius","ML_Aggregate_Set_SpectralNormScheme_Anorm",PETSC_FALSE,&pc_ml->SpectralNormScheme_Anorm,PETSC_NULL);CHKERRQ(ierr);

  ierr = PetscOptionsTail();CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* -------------------------------------------------------------------------- */
/*
   PCCreate_ML - Creates an ML preconditioner context, PC_ML,
   and sets this as the private data within the generic preconditioning
   context, PC, that was created within PCCreate().

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCCreate()
*/

/*MC
     PCML - Use algebraic multigrid (smoothed aggregation) preconditioning from the
       ML library. This preconditioner requires you to provide the fine grid
       discretization matrix. The coarser grid matrices and restriction/interpolation
       operators are computed by ML and wrapped as PETSc matrices.

   Options Database Keys: (not done yet!)
+  -pc_mg_maxlevels <nlevels> - maximum number of levels including finest
.  -pc_mg_cycles 1 or 2 - for V or W-cycle
.  -pc_mg_smoothup <n> - number of smoothing steps after interpolation
.  -pc_mg_smoothdown <n> - number of smoothing steps before applying restriction operator
.  -pc_mg_type <additive,multiplicative,full,cascade> - multiplicative is the default
.  -pc_mg_monitor - print information on the multigrid convergence
-  -pc_mg_dump_matlab - dumps the matrices for each level and the restriction/interpolation matrices
                        to the Socket viewer for reading from Matlab.

   Level: intermediate

  Concepts: multigrid

.seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC, PCMGType,
           MGSetLevels(), MGGetLevels(), MGSetType(), MGSetCycles(), MGSetNumberSmoothDown(),
           MGSetNumberSmoothUp(), MGGetCoarseSolve(), MGSetResidual(), MGSetInterpolation(),
           MGSetRestriction(), MGGetSmoother(), MGGetSmootherUp(), MGGetSmootherDown(),
           MGSetCyclesOnLevel(), MGSetRhs(), MGSetX(), MGSetR()
M*/
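
/*
   Example usage (a sketch, not part of the original source): assuming PCCreate_ML()
   has been registered under the type name "ml", the preconditioner is selected and
   tuned like any other PC:

      KSP ksp;
      PC  pc;
      ierr = KSPCreate(PETSC_COMM_WORLD,&ksp);CHKERRQ(ierr);
      ierr = KSPSetOperators(ksp,A,A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
      ierr = KSPGetPC(ksp,&pc);CHKERRQ(ierr);
      ierr = PCSetType(pc,"ml");CHKERRQ(ierr);
      ierr = KSPSetFromOptions(ksp);CHKERRQ(ierr);
      ierr = KSPSolve(ksp,b,x);CHKERRQ(ierr);

   together with the ML options implemented in PCSetFromOptions_ML() below, e.g.
      -pc_ml_maxNlevels 10 -pc_ml_CoarsenScheme Uncoupled -pc_ml_DampingFactor 1.33333
*/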

EXTERN_C_BEGIN
#undef __FUNCT__
#define __FUNCT__ "PCCreate_ML"
PetscErrorCode PCCreate_ML(PC pc)
{
  PetscErrorCode       ierr;
  PC_ML                *pc_ml;
  PetscObjectContainer container;

  PetscFunctionBegin;
  /* initialize pc as PCMG */
  ierr = PCSetType(pc,PCMG);CHKERRQ(ierr); /* calls PCCreate_MG() and MGCreate_Private() */

  /* create a supporting struct and attach it to pc */
  ierr = PetscNew(PC_ML,&pc_ml);CHKERRQ(ierr);
  ierr = PetscObjectContainerCreate(PETSC_COMM_SELF,&container);CHKERRQ(ierr);
  ierr = PetscObjectContainerSetPointer(container,pc_ml);CHKERRQ(ierr);
  ierr = PetscObjectContainerSetUserDestroy(container,PetscObjectContainerDestroy_PC_ML);CHKERRQ(ierr);
  ierr = PetscObjectCompose((PetscObject)pc,"PC_ML",(PetscObject)container);CHKERRQ(ierr);

  pc_ml->PCSetUp   = pc->ops->setup;
  pc_ml->PCDestroy = pc->ops->destroy;

  /* overwrite the PCMG function pointers with those of PCML */
  pc->ops->setfromoptions = PCSetFromOptions_ML;
  pc->ops->setup          = PCSetUp_ML;
  pc->ops->destroy        = PCDestroy_ML;
  PetscFunctionReturn(0);
}
EXTERN_C_END

int PetscML_getrow(void *ML_data,int N_requested_rows,int requested_rows[],
   int allocated_space,int columns[],double values[],int row_lengths[])
{
  PetscErrorCode ierr;
  Mat            Aloc;
  Mat_SeqAIJ     *a;
  PetscInt       m,i,j,k=0,row,*aj;
  PetscScalar    *aa;
  FineGridCtx    *ml=(FineGridCtx*)ML_data;

  Aloc = ml->Aloc;
  a    = (Mat_SeqAIJ*)Aloc->data;
  ierr = MatGetSize(Aloc,&m,PETSC_NULL);CHKERRQ(ierr);

  for (i = 0; i<N_requested_rows; i++) {
    row            = requested_rows[i];
    row_lengths[i] = a->ilen[row];
    if (allocated_space < k+row_lengths[i]) return(0);
    if (row >= 0 && row <= m-1) { /* bounds check; the original || made this always true */
      aj = a->j + a->i[row];
      aa = a->a + a->i[row];
      for (j=0; j<row_lengths[i]; j++){
        columns[k]  = aj[j];
        values[k++] = aa[j];
      }
    }
  }
  return(1);
}

int PetscML_matvec(void *ML_data,int in_length,double p[],int out_length,double ap[])
{
  PetscErrorCode ierr;
  FineGridCtx    *ml=(FineGridCtx*)ML_data;
  Mat            A=ml->A, Aloc=ml->Aloc;
  PetscMPIInt    size;
  PetscScalar    *pwork=ml->pwork;
  PetscInt       i;

  ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr);
  if (size == 1){
    ierr = VecPlaceArray(ml->x,p);CHKERRQ(ierr);
  } else {
    for (i=0; i<in_length; i++) pwork[i] = p[i];
    PetscML_comm(pwork,ml);
    ierr = VecPlaceArray(ml->x,pwork);CHKERRQ(ierr);
  }
  ierr = VecPlaceArray(ml->y,ap);CHKERRQ(ierr);
  ierr = MatMult(Aloc,ml->x,ml->y);CHKERRQ(ierr);
  return 0;
}

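/* Added commentary: ML hands PetscML_comm() an array p[] whose first A->m entries
   hold the locally owned values; Aloc has Aloc->n = A->m + (number of ghost
   columns) columns, so before Aloc can be applied the tail p[A->m..Aloc->n-1]
   must be filled with the off-process values.  The routine below does this with
   the scatter context (a->Mvctx, a->lvec) that the MPIAIJ matrix already carries. */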
int PetscML_comm(double p[],void *ML_data)
{
  PetscErrorCode ierr;
  FineGridCtx    *ml=(FineGridCtx*)ML_data;
  Mat            A=ml->A;
  Mat_MPIAIJ     *a = (Mat_MPIAIJ*)A->data;
  PetscMPIInt    size;
  PetscInt       i,in_length=A->m,out_length=ml->Aloc->n;
  PetscScalar    *array;

  ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr);
  if (size == 1) return 0;

  ierr = VecPlaceArray(ml->y,p);CHKERRQ(ierr);
  ierr = VecScatterBegin(ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD,a->Mvctx);CHKERRQ(ierr);
  ierr = VecScatterEnd(ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD,a->Mvctx);CHKERRQ(ierr);
  ierr = VecGetArray(a->lvec,&array);CHKERRQ(ierr);
  for (i=in_length; i<out_length; i++){
    p[i] = array[i-in_length];
  }
  ierr = VecRestoreArray(a->lvec,&array);CHKERRQ(ierr); /* pair the VecGetArray() above */
  return 0;
}

#undef __FUNCT__
#define __FUNCT__ "MatMult_ML"
PetscErrorCode MatMult_ML(Mat A,Vec x,Vec y)
{
  PetscErrorCode   ierr;
  Mat_MLShell      *shell;
  PetscScalar      *xarray,*yarray;
  PetscInt         x_length,y_length;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr);
  ierr = VecGetArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecGetArray(y,&yarray);CHKERRQ(ierr);
  x_length = shell->mlmat->invec_leng;
  y_length = shell->mlmat->outvec_leng;

  ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray);

  ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecRestoreArray(y,&yarray);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* MatMultAdd_ML - Compute y = w + A*x */
#undef __FUNCT__
#define __FUNCT__ "MatMultAdd_ML"
PetscErrorCode MatMultAdd_ML(Mat A,Vec x,Vec w,Vec y)
{
  PetscErrorCode    ierr;
  Mat_MLShell       *shell;
  PetscScalar       *xarray,*yarray;
  const PetscScalar one=1.0;
  PetscInt          x_length,y_length;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr);
  ierr = VecGetArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecGetArray(y,&yarray);CHKERRQ(ierr);

  x_length = shell->mlmat->invec_leng;
  y_length = shell->mlmat->outvec_leng;

  ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray);

  ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecRestoreArray(y,&yarray);CHKERRQ(ierr);
  ierr = VecAXPY(&one,w,y);CHKERRQ(ierr);

  PetscFunctionReturn(0);
}

/* newtype is ignored because "ml" is not listed among the PETSc MatTypes yet */
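/* Added commentary: an MPIAIJ matrix stores a diagonal block Ad (locally owned
   columns) and an off-diagonal block Ao (ghost columns, compactly renumbered).
   The conversion below concatenates the two row by row into one SeqAIJ matrix
   Aloc = [Ad | Ao], shifting each Ao column index by an so the ghost columns
   land after the local ones; e.g. a row with local entries in columns {0,2} and
   a ghost entry in compact column 1 ends up with column indices {0,2,an+1}. */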
#undef __FUNCT__
#define __FUNCT__ "MatConvert_MPIAIJ_ML"
PetscErrorCode MatConvert_MPIAIJ_ML(Mat A,const MatType newtype,MatReuse scall,Mat *Aloc)
{
  PetscErrorCode  ierr;
  Mat_MPIAIJ      *mpimat=(Mat_MPIAIJ*)A->data;
  Mat_SeqAIJ      *mat,*a=(Mat_SeqAIJ*)(mpimat->A)->data,*b=(Mat_SeqAIJ*)(mpimat->B)->data;
  PetscInt        *ai=a->i,*aj=a->j,*bi=b->i,*bj=b->j;
  PetscScalar     *aa=a->a,*ba=b->a,*ca;
  PetscInt        am=A->m,an=A->n,i,j,k;
  PetscInt        *ci,*cj,ncols;

  PetscFunctionBegin;
  if (am != an) SETERRQ2(PETSC_ERR_ARG_WRONG,"A must have a square diagonal portion, am: %d != an: %d",am,an);

  if (scall == MAT_INITIAL_MATRIX){
    ierr = PetscMalloc((1+am)*sizeof(PetscInt),&ci);CHKERRQ(ierr);
    ci[0] = 0;
    for (i=0; i<am; i++){
      ci[i+1] = ci[i] + (ai[i+1] - ai[i]) + (bi[i+1] - bi[i]);
    }
    ierr = PetscMalloc((1+ci[am])*sizeof(PetscInt),&cj);CHKERRQ(ierr);
    ierr = PetscMalloc((1+ci[am])*sizeof(PetscScalar),&ca);CHKERRQ(ierr);

    k = 0;
    for (i=0; i<am; i++){
      /* diagonal portion of A */
      ncols = ai[i+1] - ai[i];
      for (j=0; j<ncols; j++) {
        cj[k]   = *aj++;
        ca[k++] = *aa++;
      }
      /* off-diagonal portion of A */
      ncols = bi[i+1] - bi[i];
      for (j=0; j<ncols; j++) {
        cj[k]   = an + (*bj); bj++;
        ca[k++] = *ba++;
      }
    }
    if (k != ci[am]) SETERRQ2(PETSC_ERR_ARG_WRONG,"k: %d != ci[am]: %d",k,ci[am]);

    /* put together the new matrix */
    an = mpimat->A->n+mpimat->B->n;
    ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,am,an,ci,cj,ca,Aloc);CHKERRQ(ierr);

    /* MatCreateSeqAIJWithArrays flags matrix so PETSc doesn't free the user's arrays. */
    /* Since these are PETSc arrays, change flags to free them as necessary. */
    mat = (Mat_SeqAIJ*)(*Aloc)->data;
    mat->freedata = PETSC_TRUE;
    mat->nonew    = 0;
  } else if (scall == MAT_REUSE_MATRIX){
    mat = (Mat_SeqAIJ*)(*Aloc)->data;
    ci = mat->i; cj = mat->j; ca = mat->a;
    for (i=0; i<am; i++) {
      /* diagonal portion of A */
      ncols = ai[i+1] - ai[i];
      for (j=0; j<ncols; j++) *ca++ = *aa++;
      /* off-diagonal portion of A */
      ncols = bi[i+1] - bi[i];
      for (j=0; j<ncols; j++) *ca++ = *ba++;
    }
  } else {
    SETERRQ1(PETSC_ERR_ARG_WRONG,"Invalid MatReuse %d",(int)scall);
  }
  PetscFunctionReturn(0);
}

extern PetscErrorCode MatDestroy_Shell(Mat);
#undef __FUNCT__
#define __FUNCT__ "MatDestroy_ML"
PetscErrorCode MatDestroy_ML(Mat A)
{
  PetscErrorCode ierr;
  Mat_MLShell    *shell;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void *)&shell);CHKERRQ(ierr);
  ierr = VecDestroy(shell->y);CHKERRQ(ierr);
  ierr = PetscFree(shell);CHKERRQ(ierr);
  ierr = MatDestroy_Shell(A);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatWrapML_SeqAIJ"
PetscErrorCode MatWrapML_SeqAIJ(ML_Operator *mlmat,Mat *newmat)
{
  struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data;
  PetscErrorCode  ierr;
  PetscInt        m=mlmat->outvec_leng,n=mlmat->invec_leng,nnz[m],nz_max;
  PetscInt        *ml_cols=matdata->columns,*aj,i,j,k;
  PetscScalar     *ml_vals=matdata->values,*aa;

  PetscFunctionBegin;
  if (mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL");
  if (m != n){ /* ML Pmat and Rmat are in CSR format. Pass array pointers into SeqAIJ matrix */
    ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,m,n,matdata->rowptr,ml_cols,ml_vals,newmat);CHKERRQ(ierr);
    PetscFunctionReturn(0);
  }

  /* ML Amat is in MSR format. Copy its data into SeqAIJ matrix */
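  /* Added commentary on the MSR layout assumed here: ml_vals[i] (i < m) holds the
     diagonal entry of row i, and ml_cols[i]..ml_cols[i+1]-1 index that row's
     off-diagonal entries in ml_cols[]/ml_vals[]; hence row i carries
     ml_cols[i+1]-ml_cols[i]+1 nonzeros once the diagonal is counted. */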
  ierr = MatCreate(PETSC_COMM_SELF,m,n,PETSC_DECIDE,PETSC_DECIDE,newmat);CHKERRQ(ierr);
  ierr = MatSetType(*newmat,MATSEQAIJ);CHKERRQ(ierr);

  nz_max = 0;
  for (i=0; i<m; i++) {
    nnz[i] = ml_cols[i+1] - ml_cols[i] + 1;
    if (nnz[i] > nz_max) nz_max = nnz[i];
  }
  ierr = MatSeqAIJSetPreallocation(*newmat,0,nnz);CHKERRQ(ierr);
  ierr = MatSetOption(*newmat,MAT_COLUMNS_SORTED);CHKERRQ(ierr); /* check! */

  nz_max++;
  ierr = PetscMalloc(nz_max*(sizeof(int)+sizeof(PetscScalar)),&aj);CHKERRQ(ierr);
  aa = (PetscScalar*)(aj + nz_max);

  for (i=0; i<m; i++){
    k = 0;
    /* diagonal entry */
    aj[k] = i; aa[k++] = ml_vals[i];
    /* off-diagonal entries */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      aj[k] = ml_cols[j]; aa[k++] = ml_vals[j];
    }
    /* sort aj and aa */
    ierr = PetscSortIntWithScalarArray(nnz[i],aj,aa);CHKERRQ(ierr);
    ierr = MatSetValues(*newmat,1,&i,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr);
  }
  ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  ierr = PetscFree(aj);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatWrapML_SHELL"
PetscErrorCode MatWrapML_SHELL(ML_Operator *mlmat,Mat *newmat)
{
  PetscErrorCode ierr;
  PetscInt       m,n;
  ML_Comm        *MLcomm;
  Mat_MLShell    *shellctx;

  PetscFunctionBegin;
  m = mlmat->outvec_leng;
  n = mlmat->invec_leng;
  if (!m || !n){
    *newmat = PETSC_NULL; /* assign through the pointer; the original only set the local variable */
  } else {
    MLcomm = mlmat->comm;
    ierr = PetscNew(Mat_MLShell,&shellctx);CHKERRQ(ierr);
    ierr = MatCreateShell(MLcomm->USR_comm,m,n,PETSC_DETERMINE,PETSC_DETERMINE,shellctx,newmat);CHKERRQ(ierr);
    ierr = MatShellSetOperation(*newmat,MATOP_MULT,(void *)MatMult_ML);CHKERRQ(ierr);
    ierr = MatShellSetOperation(*newmat,MATOP_MULT_ADD,(void *)MatMultAdd_ML);CHKERRQ(ierr);
    shellctx->A         = *newmat;
    shellctx->mlmat     = mlmat;
    ierr = VecCreate(PETSC_COMM_WORLD,&shellctx->y);CHKERRQ(ierr);
    ierr = VecSetSizes(shellctx->y,m,PETSC_DECIDE);CHKERRQ(ierr);
    ierr = VecSetFromOptions(shellctx->y);CHKERRQ(ierr);
    (*newmat)->ops->destroy = MatDestroy_ML;
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatWrapML_MPIAIJ"
PetscErrorCode MatWrapML_MPIAIJ(ML_Operator *mlmat,Mat *newmat)
{
  struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data;
  PetscInt        *ml_cols=matdata->columns,*aj;
  PetscScalar     *ml_vals=matdata->values,*aa;
  PetscErrorCode  ierr;
  PetscInt        i,j,k,*gordering;
  PetscInt        m=mlmat->outvec_leng,n,nnzA[m],nnzB[m],nnz[m],nz_max,row;
  Mat             A;

  PetscFunctionBegin;
  if (mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL");
  n = mlmat->invec_leng;
  if (m != n) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"m %d must equal n %d",m,n);

  ierr = MatCreate(mlmat->comm->USR_comm,m,n,PETSC_DECIDE,PETSC_DECIDE,&A);CHKERRQ(ierr);
  ierr = MatSetType(A,MATMPIAIJ);CHKERRQ(ierr);
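  /* Added commentary: each row's nonzeros are split into the diagonal block
     (nnzA, entries whose ML column index is < m, i.e. locally owned under ML's
     local numbering) and the off-diagonal block (nnzB), so that
     MatMPIAIJSetPreallocation() receives exact per-row counts; the +1 in nnz[i]
     accounts for the MSR diagonal entry stored separately. */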
  nz_max = 0;
  for (i=0; i<m; i++){
    nnz[i] = ml_cols[i+1] - ml_cols[i] + 1;
    if (nz_max < nnz[i]) nz_max = nnz[i];
    nnzA[i] = 1; /* diag */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      if (ml_cols[j] < m) nnzA[i]++;
    }
    nnzB[i] = nnz[i] - nnzA[i];
  }
  ierr = MatMPIAIJSetPreallocation(A,0,nnzA,0,nnzB);CHKERRQ(ierr);

  /* insert mat values -- remap row and column indices */
  nz_max++;
  ierr = PetscMalloc(nz_max*(sizeof(int)+sizeof(PetscScalar)),&aj);CHKERRQ(ierr);
  aa = (PetscScalar*)(aj + nz_max);
  ML_build_global_numbering(mlmat,mlmat->comm,&gordering);
  for (i=0; i<m; i++){
    row = gordering[i];
    k = 0;
    /* diagonal entry */
    aj[k] = row; aa[k++] = ml_vals[i];
    /* off-diagonal entries */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      aj[k] = gordering[ml_cols[j]]; aa[k++] = ml_vals[j];
    }
    ierr = MatSetValues(A,1,&row,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr);
  }
  ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  *newmat = A;

  ierr = PetscFree(aj);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}