#define PETSCKSP_DLL

/*
   Provides an interface to the ML smoothed aggregation preconditioner.
   Note: Something non-obvious breaks -pc_mg_type ADDITIVE for parallel runs.
                                    Jed Brown, see [PETSC #18321, #18449].
*/
#include "private/pcimpl.h"   /*I "petscpc.h" I*/
#include "../src/ksp/pc/impls/mg/mgimpl.h"                    /*I "petscmg.h" I*/
#include "../src/mat/impls/aij/seq/aij.h"
#include "../src/mat/impls/aij/mpi/mpiaij.h"

#include <math.h>
EXTERN_C_BEGIN
/* The HAVE_CONFIG_H flag is required by the ML include files */
#if !defined(HAVE_CONFIG_H)
#define HAVE_CONFIG_H
#endif
#include "ml_include.h"
EXTERN_C_END

/* The context (data structure) at each grid level */
typedef struct {
  Vec        x,b,r;           /* global vectors */
  Mat        A,P,R;
  KSP        ksp;
} GridCtx;

/* The context used to input a PETSc matrix into ML at the fine grid */
typedef struct {
  Mat          A;      /* PETSc matrix in AIJ format */
  Mat          Aloc;   /* local portion of A to be used by ML */
  Vec          x,y;
  ML_Operator  *mlmat;
  PetscScalar  *pwork; /* tmp array used by PetscML_comm() */
} FineGridCtx;

/* The context that associates an ML matrix with a PETSc shell matrix */
typedef struct {
  Mat          A;       /* PETSc shell matrix associated with mlmat */
  ML_Operator  *mlmat;  /* ML matrix associated with A */
  Vec          y;
} Mat_MLShell;

/* Private context for the ML preconditioner */
typedef struct {
  ML             *ml_object;
  ML_Aggregate   *agg_object;
  GridCtx        *gridctx;
  FineGridCtx    *PetscMLdata;
  PetscInt       Nlevels,MaxNlevels,MaxCoarseSize,CoarsenScheme;
  PetscReal      Threshold,DampingFactor;
  PetscTruth     SpectralNormScheme_Anorm;
  PetscMPIInt    size; /* size of communicator for pc->pmat */
} PC_ML;

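/* Getrow callback handed to ML for the fine-grid matrix (registered below via
   ML_Set_Amatrix_Getrow()). Following ML's getrow convention, it returns 0 when
   allocated_space is too small, so ML can retry with a larger buffer, and 1 on
   success. */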
#undef __FUNCT__
#define __FUNCT__ "PetscML_getrow"
static int PetscML_getrow(ML_Operator *ML_data, int N_requested_rows, int requested_rows[],int allocated_space, int columns[], double values[], int row_lengths[])
{
  PetscErrorCode ierr;
  PetscInt       m,i,j,k=0,row,*aj;
  PetscScalar    *aa;
  FineGridCtx    *ml=(FineGridCtx*)ML_Get_MyGetrowData(ML_data);
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)ml->Aloc->data;

  ierr = MatGetSize(ml->Aloc,&m,PETSC_NULL); if (ierr) return(0);
  for (i = 0; i<N_requested_rows; i++) {
    row   = requested_rows[i];
    row_lengths[i] = a->ilen[row];
    if (allocated_space < k+row_lengths[i]) return(0);
    if ( (row >= 0) && (row <= (m-1)) ) {
      aj = a->j + a->i[row];
      aa = a->a + a->i[row];
      for (j=0; j<row_lengths[i]; j++){
        columns[k]  = aj[j];
        values[k++] = aa[j];
      }
    }
  }
  return(1);
}

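/* Communication callback handed to ML. In parallel it gathers the ghost
   (off-process) entries of p through the matrix's VecScatter and appends them
   after the locally owned entries, which is the layout Aloc expects. */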
#undef __FUNCT__
#define __FUNCT__ "PetscML_comm"
static PetscErrorCode PetscML_comm(double p[],void *ML_data)
{
  PetscErrorCode ierr;
  FineGridCtx    *ml=(FineGridCtx*)ML_data;
  Mat            A=ml->A;
  Mat_MPIAIJ     *a = (Mat_MPIAIJ*)A->data;
  PetscMPIInt    size;
  PetscInt       i,in_length=A->rmap->n,out_length=ml->Aloc->cmap->n;
  PetscScalar    *array;

  PetscFunctionBegin;
  ierr = MPI_Comm_size(((PetscObject)A)->comm,&size);CHKERRQ(ierr);
  if (size == 1) PetscFunctionReturn(0);

  ierr = VecPlaceArray(ml->y,p);CHKERRQ(ierr);
  ierr = VecScatterBegin(a->Mvctx,ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
  ierr = VecScatterEnd(a->Mvctx,ml->y,a->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
  ierr = VecResetArray(ml->y);CHKERRQ(ierr);
  ierr = VecGetArray(a->lvec,&array);CHKERRQ(ierr);
  for (i=in_length; i<out_length; i++){
    p[i] = array[i-in_length];
  }
  ierr = VecRestoreArray(a->lvec,&array);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "PetscML_matvec"
static int PetscML_matvec(ML_Operator *ML_data,int in_length,double p[],int out_length,double ap[])
{
  PetscErrorCode ierr;
  FineGridCtx    *ml=(FineGridCtx*)ML_Get_MyMatvecData(ML_data);
  Mat            A=ml->A, Aloc=ml->Aloc;
  PetscMPIInt    size;
  PetscScalar    *pwork=ml->pwork;
  PetscInt       i;

  PetscFunctionBegin;
  ierr = MPI_Comm_size(((PetscObject)A)->comm,&size);CHKERRQ(ierr);
  if (size == 1){
    ierr = VecPlaceArray(ml->x,p);CHKERRQ(ierr);
  } else {
    for (i=0; i<in_length; i++) pwork[i] = p[i];
    ierr = PetscML_comm(pwork,ml);CHKERRQ(ierr);
    ierr = VecPlaceArray(ml->x,pwork);CHKERRQ(ierr);
  }
  ierr = VecPlaceArray(ml->y,ap);CHKERRQ(ierr);
  ierr = MatMult(Aloc,ml->x,ml->y);CHKERRQ(ierr);
  ierr = VecResetArray(ml->x);CHKERRQ(ierr);
  ierr = VecResetArray(ml->y);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatMult_ML"
static PetscErrorCode MatMult_ML(Mat A,Vec x,Vec y)
{
  PetscErrorCode   ierr;
  Mat_MLShell      *shell;
  PetscScalar      *xarray,*yarray;
  PetscInt         x_length,y_length;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void **)&shell);CHKERRQ(ierr);
  ierr = VecGetArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecGetArray(y,&yarray);CHKERRQ(ierr);
  x_length = shell->mlmat->invec_leng;
  y_length = shell->mlmat->outvec_leng;
  ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray);
  ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecRestoreArray(y,&yarray);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatMultAdd_ML"
static PetscErrorCode MatMultAdd_ML(Mat A,Vec x,Vec w,Vec y)
{
  PetscErrorCode    ierr;
  Mat_MLShell       *shell;
  PetscScalar       *xarray,*yarray;
  PetscInt          x_length,y_length;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void **)&shell);CHKERRQ(ierr);
  ierr = VecGetArray(x,&xarray);CHKERRQ(ierr);
  /* apply into the work vector shell->y so the common case w == y is handled correctly */
  ierr = VecGetArray(shell->y,&yarray);CHKERRQ(ierr);
  x_length = shell->mlmat->invec_leng;
  y_length = shell->mlmat->outvec_leng;
  ML_Operator_Apply(shell->mlmat,x_length,xarray,y_length,yarray);
  ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr);
  ierr = VecRestoreArray(shell->y,&yarray);CHKERRQ(ierr);
  if (w != y) {ierr = VecCopy(w,y);CHKERRQ(ierr);}
  ierr = VecAXPY(y,1.0,shell->y);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* newtype is ignored because "ml" is not a registered PETSc MatType */
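/* The result is a sequential matrix [A_d  A_o] holding the local rows of A:
   the diagonal block A_d keeps its local column numbering, while the columns
   of the off-diagonal block A_o are shifted to start at A->cmap->n, matching
   the ghosted ordering produced by PetscML_comm(). */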
#undef __FUNCT__
#define __FUNCT__ "MatConvert_MPIAIJ_ML"
static PetscErrorCode MatConvert_MPIAIJ_ML(Mat A,MatType newtype,MatReuse scall,Mat *Aloc)
{
  PetscErrorCode  ierr;
  Mat_MPIAIJ      *mpimat=(Mat_MPIAIJ*)A->data;
  Mat_SeqAIJ      *mat,*a=(Mat_SeqAIJ*)(mpimat->A)->data,*b=(Mat_SeqAIJ*)(mpimat->B)->data;
  PetscInt        *ai=a->i,*aj=a->j,*bi=b->i,*bj=b->j;
  PetscScalar     *aa=a->a,*ba=b->a,*ca;
  PetscInt        am=A->rmap->n,an=A->cmap->n,i,j,k;
  PetscInt        *ci,*cj,ncols;

  PetscFunctionBegin;
  if (am != an) SETERRQ2(PETSC_ERR_ARG_WRONG,"A must have a square diagonal portion, am: %d != an: %d",am,an);

  if (scall == MAT_INITIAL_MATRIX){
    ierr = PetscMalloc((1+am)*sizeof(PetscInt),&ci);CHKERRQ(ierr);
    ci[0] = 0;
    for (i=0; i<am; i++){
      ci[i+1] = ci[i] + (ai[i+1] - ai[i]) + (bi[i+1] - bi[i]);
    }
    ierr = PetscMalloc((1+ci[am])*sizeof(PetscInt),&cj);CHKERRQ(ierr);
    ierr = PetscMalloc((1+ci[am])*sizeof(PetscScalar),&ca);CHKERRQ(ierr);

    k = 0;
    for (i=0; i<am; i++){
      /* diagonal portion of A */
      ncols = ai[i+1] - ai[i];
      for (j=0; j<ncols; j++) {
        cj[k]   = *aj++;
        ca[k++] = *aa++;
      }
      /* off-diagonal portion of A */
      ncols = bi[i+1] - bi[i];
      for (j=0; j<ncols; j++) {
        cj[k]   = an + (*bj); bj++;
        ca[k++] = *ba++;
      }
    }
    if (k != ci[am]) SETERRQ2(PETSC_ERR_ARG_WRONG,"k: %d != ci[am]: %d",k,ci[am]);

    /* put together the new matrix */
    an = mpimat->A->cmap->n+mpimat->B->cmap->n;
    ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,am,an,ci,cj,ca,Aloc);CHKERRQ(ierr);

    /* MatCreateSeqAIJWithArrays flags the matrix so PETSc doesn't free the user's arrays. */
    /* Since these are PETSc arrays, change the flags so PETSc frees them as appropriate. */
    mat = (Mat_SeqAIJ*)(*Aloc)->data;
    mat->free_a       = PETSC_TRUE;
    mat->free_ij      = PETSC_TRUE;

    mat->nonew    = 0;
  } else if (scall == MAT_REUSE_MATRIX){
    mat=(Mat_SeqAIJ*)(*Aloc)->data;
    ci = mat->i; cj = mat->j; ca = mat->a;
    for (i=0; i<am; i++) {
      /* diagonal portion of A */
      ncols = ai[i+1] - ai[i];
      for (j=0; j<ncols; j++) *ca++ = *aa++;
      /* off-diagonal portion of A */
      ncols = bi[i+1] - bi[i];
      for (j=0; j<ncols; j++) *ca++ = *ba++;
    }
  } else {
    SETERRQ1(PETSC_ERR_ARG_WRONG,"Invalid MatReuse %d",(int)scall);
  }
  PetscFunctionReturn(0);
}

extern PetscErrorCode MatDestroy_Shell(Mat);
#undef __FUNCT__
#define __FUNCT__ "MatDestroy_ML"
static PetscErrorCode MatDestroy_ML(Mat A)
{
  PetscErrorCode ierr;
  Mat_MLShell    *shell;

  PetscFunctionBegin;
  ierr = MatShellGetContext(A,(void **)&shell);CHKERRQ(ierr);
  ierr = VecDestroy(shell->y);CHKERRQ(ierr);
  ierr = PetscFree(shell);CHKERRQ(ierr);
  ierr = MatDestroy_Shell(A);CHKERRQ(ierr);
  ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

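/* ML stores the prolongation/restriction operators (Pmat/Rmat) in CSR format
   with possibly unsorted column indices, so each row is sorted before the
   arrays are passed to MatCreateSeqAIJWithArrays(); the level matrices (Amat)
   are stored in MSR format and must be copied entry by entry. */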
#undef __FUNCT__
#define __FUNCT__ "MatWrapML_SeqAIJ"
static PetscErrorCode MatWrapML_SeqAIJ(ML_Operator *mlmat,MatReuse reuse,Mat *newmat)
{
  struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data;
  PetscErrorCode        ierr;
  PetscInt              m=mlmat->outvec_leng,n=mlmat->invec_leng,*nnz,nz_max;
  PetscInt              *ml_cols=matdata->columns,*ml_rowptr=matdata->rowptr,*aj,i,j,k;
  PetscScalar           *ml_vals=matdata->values,*aa;

  PetscFunctionBegin;
  if (mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL");
  if (m != n){ /* ML Pmat and Rmat are in CSR format. Pass array pointers into SeqAIJ matrix */
    if (reuse){
      Mat_SeqAIJ  *aij= (Mat_SeqAIJ*)(*newmat)->data;
      aij->i = ml_rowptr;
      aij->j = ml_cols;
      aij->a = ml_vals;
    } else {
      /* sort ml_cols and ml_vals */
      ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
      for (i=0; i<m; i++) {
        nnz[i] = ml_rowptr[i+1] - ml_rowptr[i];
      }
      aj = ml_cols; aa = ml_vals;
      for (i=0; i<m; i++){
        ierr = PetscSortIntWithScalarArray(nnz[i],aj,aa);CHKERRQ(ierr);
        aj += nnz[i]; aa += nnz[i];
      }
      ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,m,n,ml_rowptr,ml_cols,ml_vals,newmat);CHKERRQ(ierr);
      ierr = PetscFree(nnz);CHKERRQ(ierr);
    }
    PetscFunctionReturn(0);
  }

  /* ML Amat is in MSR format. Copy its data into SeqAIJ matrix */
  ierr = MatCreate(PETSC_COMM_SELF,newmat);CHKERRQ(ierr);
  ierr = MatSetSizes(*newmat,m,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
  ierr = MatSetType(*newmat,MATSEQAIJ);CHKERRQ(ierr);

  ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
  nz_max = 1;
  for (i=0; i<m; i++) {
    nnz[i] = ml_cols[i+1] - ml_cols[i] + 1;
    if (nnz[i] > nz_max) nz_max = nnz[i];
  }

  ierr = MatSeqAIJSetPreallocation(*newmat,0,nnz);CHKERRQ(ierr);
  ierr = PetscMalloc2(nz_max,PetscScalar,&aa,nz_max,PetscInt,&aj);CHKERRQ(ierr);
  for (i=0; i<m; i++){
    k = 0;
    /* diagonal entry */
    aj[k] = i; aa[k++] = ml_vals[i];
    /* off-diagonal entries */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      aj[k] = ml_cols[j]; aa[k++] = ml_vals[j];
    }
    /* sort aj and aa */
    ierr = PetscSortIntWithScalarArray(nnz[i],aj,aa);CHKERRQ(ierr);
    ierr = MatSetValues(*newmat,1,&i,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr);
  }
  ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);

  ierr = PetscFree2(aa,aj);CHKERRQ(ierr);
  ierr = PetscFree(nnz);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "MatWrapML_SHELL"
static PetscErrorCode MatWrapML_SHELL(ML_Operator *mlmat,MatReuse reuse,Mat *newmat)
{
  PetscErrorCode ierr;
  PetscInt       m,n;
  ML_Comm        *MLcomm;
  Mat_MLShell    *shellctx;

  PetscFunctionBegin;
  m = mlmat->outvec_leng;
  n = mlmat->invec_leng;
  if (!m || !n){
    *newmat = PETSC_NULL;
    PetscFunctionReturn(0);
  }

  if (reuse){
    ierr = MatShellGetContext(*newmat,(void **)&shellctx);CHKERRQ(ierr);
    shellctx->mlmat = mlmat;
    PetscFunctionReturn(0);
  }

  MLcomm = mlmat->comm;
  ierr = PetscNew(Mat_MLShell,&shellctx);CHKERRQ(ierr);
  ierr = MatCreateShell(MLcomm->USR_comm,m,n,PETSC_DETERMINE,PETSC_DETERMINE,shellctx,newmat);CHKERRQ(ierr);
  ierr = MatShellSetOperation(*newmat,MATOP_MULT,(void(*)(void))MatMult_ML);CHKERRQ(ierr);
  ierr = MatShellSetOperation(*newmat,MATOP_MULT_ADD,(void(*)(void))MatMultAdd_ML);CHKERRQ(ierr);
  shellctx->A         = *newmat;
  shellctx->mlmat     = mlmat;
  /* work vector on the same communicator as the shell matrix */
  ierr = VecCreate(MLcomm->USR_comm,&shellctx->y);CHKERRQ(ierr);
  ierr = VecSetSizes(shellctx->y,m,PETSC_DECIDE);CHKERRQ(ierr);
  ierr = VecSetFromOptions(shellctx->y);CHKERRQ(ierr);
  (*newmat)->ops->destroy = MatDestroy_ML;
  PetscFunctionReturn(0);
}

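/* Reminder of the MSR (modified sparse row) layout used by ML's Amat:
   values[0..m-1] holds the diagonal, and for row i the off-diagonal entries
   are values[cols[i]..cols[i+1]-1] with column indices cols[cols[i]..cols[i+1]-1]. */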
#undef __FUNCT__
#define __FUNCT__ "MatWrapML_MPIAIJ"
static PetscErrorCode MatWrapML_MPIAIJ(ML_Operator *mlmat,Mat *newmat)
{
  struct ML_CSR_MSRdata *matdata = (struct ML_CSR_MSRdata *)mlmat->data;
  PetscInt              *ml_cols=matdata->columns,*aj;
  PetscScalar           *ml_vals=matdata->values,*aa;
  PetscErrorCode        ierr;
  PetscInt              i,j,k,*gordering;
  PetscInt              m=mlmat->outvec_leng,n,*nnzA,*nnzB,*nnz,nz_max,row;
  Mat                   A;

  PetscFunctionBegin;
  if (mlmat->getrow == NULL) SETERRQ(PETSC_ERR_ARG_NULL,"mlmat->getrow = NULL");
  n = mlmat->invec_leng;
  if (m != n) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"m %d must equal n %d",m,n);

  ierr = MatCreate(mlmat->comm->USR_comm,&A);CHKERRQ(ierr);
  ierr = MatSetSizes(A,m,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
  ierr = MatSetType(A,MATMPIAIJ);CHKERRQ(ierr);
  ierr = PetscMalloc3(m,PetscInt,&nnzA,m,PetscInt,&nnzB,m,PetscInt,&nnz);CHKERRQ(ierr);

  nz_max = 0;
  for (i=0; i<m; i++){
    nnz[i] = ml_cols[i+1] - ml_cols[i] + 1;
    if (nz_max < nnz[i]) nz_max = nnz[i];
    nnzA[i] = 1; /* diag */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      if (ml_cols[j] < m) nnzA[i]++;
    }
    nnzB[i] = nnz[i] - nnzA[i];
  }
  ierr = MatMPIAIJSetPreallocation(A,0,nnzA,0,nnzB);CHKERRQ(ierr);

  /* insert mat values -- remap row and column indices */
  nz_max++;
  ierr = PetscMalloc2(nz_max,PetscScalar,&aa,nz_max,PetscInt,&aj);CHKERRQ(ierr);
  /* create global row numbering for a ML_Operator */
  ML_build_global_numbering(mlmat,&gordering,"rows");
  for (i=0; i<m; i++){
    row = gordering[i];
    k = 0;
    /* diagonal entry */
    aj[k] = row; aa[k++] = ml_vals[i];
    /* off-diagonal entries */
    for (j=ml_cols[i]; j<ml_cols[i+1]; j++){
      aj[k] = gordering[ml_cols[j]]; aa[k++] = ml_vals[j];
    }
    ierr = MatSetValues(A,1,&row,nnz[i],aj,aa,INSERT_VALUES);CHKERRQ(ierr);
  }
  ML_free(gordering); /* the global numbering was allocated by ML */
  ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  *newmat = A;

  ierr = PetscFree3(nnzA,nnzB,nnz);CHKERRQ(ierr);
  ierr = PetscFree2(aa,aj);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* -----------------------------------------------------------------------------*/
#undef __FUNCT__
#define __FUNCT__ "PCDestroy_ML_Private"
PetscErrorCode PCDestroy_ML_Private(void *ptr)
{
  PetscErrorCode  ierr;
  PC_ML           *pc_ml = (PC_ML*)ptr;
  PetscInt        level,fine_level=pc_ml->Nlevels-1;

  PetscFunctionBegin;
  ML_Aggregate_Destroy(&pc_ml->agg_object);
  ML_Destroy(&pc_ml->ml_object);

  if (pc_ml->PetscMLdata) {
    ierr = PetscFree(pc_ml->PetscMLdata->pwork);CHKERRQ(ierr);
    if (pc_ml->size > 1)      {ierr = MatDestroy(pc_ml->PetscMLdata->Aloc);CHKERRQ(ierr);}
    if (pc_ml->PetscMLdata->x){ierr = VecDestroy(pc_ml->PetscMLdata->x);CHKERRQ(ierr);}
    if (pc_ml->PetscMLdata->y){ierr = VecDestroy(pc_ml->PetscMLdata->y);CHKERRQ(ierr);}
  }
  ierr = PetscFree(pc_ml->PetscMLdata);CHKERRQ(ierr);

  for (level=0; level<fine_level; level++){
    if (pc_ml->gridctx[level].A){ierr = MatDestroy(pc_ml->gridctx[level].A);CHKERRQ(ierr);}
    if (pc_ml->gridctx[level].P){ierr = MatDestroy(pc_ml->gridctx[level].P);CHKERRQ(ierr);}
    if (pc_ml->gridctx[level].R){ierr = MatDestroy(pc_ml->gridctx[level].R);CHKERRQ(ierr);}
    if (pc_ml->gridctx[level].x){ierr = VecDestroy(pc_ml->gridctx[level].x);CHKERRQ(ierr);}
    if (pc_ml->gridctx[level].b){ierr = VecDestroy(pc_ml->gridctx[level].b);CHKERRQ(ierr);}
    if (pc_ml->gridctx[level+1].r){ierr = VecDestroy(pc_ml->gridctx[level+1].r);CHKERRQ(ierr);}
  }
  ierr = PetscFree(pc_ml->gridctx);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
/* -------------------------------------------------------------------------- */
/*
   PCSetUp_ML - Prepares for the use of the ML preconditioner
                    by setting data structures and options.

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCSetUp()

   Notes:
   The interface routine PCSetUp() is not usually called directly by
   the user, but instead is called by PCApply() if necessary.
*/
extern PetscErrorCode PCSetFromOptions_MG(PC);
extern PetscErrorCode PCDestroy_MG_Private(PC);

#undef __FUNCT__
#define __FUNCT__ "PCSetUp_ML"
PetscErrorCode PCSetUp_ML(PC pc)
{
  PetscErrorCode  ierr;
  PetscMPIInt     size;
  FineGridCtx     *PetscMLdata;
  ML              *ml_object;
  ML_Aggregate    *agg_object;
  ML_Operator     *mlmat;
  PetscInt        nlocal_allcols,Nlevels,mllevel,level,level1,m,fine_level,bs;
  Mat             A,Aloc;
  GridCtx         *gridctx;
  PC_MG           *mg = (PC_MG*)pc->data;
  PC_ML           *pc_ml = (PC_ML*)mg->innerctx;
  PetscTruth      isSeq, isMPI;
  KSP             smoother;
  PC              subpc;

  PetscFunctionBegin;
  if (pc->setupcalled){
    /* since ML can change the size of vectors/matrices at any level we must destroy everything */
    ierr = PCDestroy_ML_Private(pc_ml);CHKERRQ(ierr);
    ierr = PCDestroy_MG_Private(pc);CHKERRQ(ierr);
  }

  /* setup special features of PCML */
  /*--------------------------------*/
  /* convert A to Aloc to be used by ML at the fine grid */
  A = pc->pmat;
  ierr = MPI_Comm_size(((PetscObject)A)->comm,&size);CHKERRQ(ierr);
  pc_ml->size = size;
  ierr = PetscTypeCompare((PetscObject) A, MATSEQAIJ, &isSeq);CHKERRQ(ierr);
  ierr = PetscTypeCompare((PetscObject) A, MATMPIAIJ, &isMPI);CHKERRQ(ierr);
  if (isMPI){
    ierr = MatConvert_MPIAIJ_ML(A,PETSC_NULL,MAT_INITIAL_MATRIX,&Aloc);CHKERRQ(ierr);
  } else if (isSeq) {
    Aloc = A;
  } else {
    SETERRQ(PETSC_ERR_ARG_WRONG, "Invalid matrix type for ML. ML can only handle AIJ matrices.");
  }

  /* create and initialize struct 'PetscMLdata' */
  ierr = PetscNewLog(pc,FineGridCtx,&PetscMLdata);CHKERRQ(ierr);
  pc_ml->PetscMLdata = PetscMLdata;
  ierr = PetscMalloc((Aloc->cmap->n+1)*sizeof(PetscScalar),&PetscMLdata->pwork);CHKERRQ(ierr);

  ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->x);CHKERRQ(ierr);
  ierr = VecSetSizes(PetscMLdata->x,Aloc->cmap->n,Aloc->cmap->n);CHKERRQ(ierr);
  ierr = VecSetType(PetscMLdata->x,VECSEQ);CHKERRQ(ierr);

  ierr = VecCreate(PETSC_COMM_SELF,&PetscMLdata->y);CHKERRQ(ierr);
  ierr = VecSetSizes(PetscMLdata->y,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
  ierr = VecSetType(PetscMLdata->y,VECSEQ);CHKERRQ(ierr);
  PetscMLdata->A    = A;
  PetscMLdata->Aloc = Aloc;

  /* create ML discretization matrix at fine grid */
  /* ML requires input of fine-grid matrix. It determines nlevels. */
  ierr = MatGetSize(Aloc,&m,&nlocal_allcols);CHKERRQ(ierr);
  ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr);
  ML_Create(&ml_object,pc_ml->MaxNlevels);
  pc_ml->ml_object = ml_object;
  ML_Init_Amatrix(ml_object,0,m,m,PetscMLdata);
  ML_Set_Amatrix_Getrow(ml_object,0,PetscML_getrow,PetscML_comm,nlocal_allcols);
  ML_Set_Amatrix_Matvec(ml_object,0,PetscML_matvec);

  /* aggregation */
  ML_Aggregate_Create(&agg_object);
  pc_ml->agg_object = agg_object;

  ML_Aggregate_Set_NullSpace(agg_object,bs,bs,0,0);
  ML_Aggregate_Set_MaxCoarseSize(agg_object,pc_ml->MaxCoarseSize);
  /* set options */
  switch (pc_ml->CoarsenScheme) {
  case 1:
    ML_Aggregate_Set_CoarsenScheme_Coupled(agg_object);break;
  case 2:
    ML_Aggregate_Set_CoarsenScheme_MIS(agg_object);break;
  case 3:
    ML_Aggregate_Set_CoarsenScheme_METIS(agg_object);break;
  }
  ML_Aggregate_Set_Threshold(agg_object,pc_ml->Threshold);
  ML_Aggregate_Set_DampingFactor(agg_object,pc_ml->DampingFactor);
  if (pc_ml->SpectralNormScheme_Anorm){
    ML_Set_SpectralNormScheme_Anorm(ml_object);
  }

  Nlevels = ML_Gen_MGHierarchy_UsingAggregation(ml_object,0,ML_INCREASING,agg_object);
  if (Nlevels<=0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Nlevels %d must be > 0",Nlevels);
  pc_ml->Nlevels = Nlevels;
  fine_level = Nlevels - 1;

  ierr = PCMGSetLevels(pc,Nlevels,PETSC_NULL);CHKERRQ(ierr);
  /* set default smoothers: Richardson with SOR on every level but the coarsest */
  for (level=1; level<=fine_level; level++){
    ierr = PCMGGetSmoother(pc,level,&smoother);CHKERRQ(ierr);
    ierr = KSPSetType(smoother,KSPRICHARDSON);CHKERRQ(ierr);
    ierr = KSPGetPC(smoother,&subpc);CHKERRQ(ierr);
    ierr = PCSetType(subpc,PCSOR);CHKERRQ(ierr);
  }
  ierr = PCSetFromOptions_MG(pc);CHKERRQ(ierr); /* should be called in PCSetFromOptions_ML(), but cannot be called prior to PCMGSetLevels() */

  ierr = PetscMalloc(Nlevels*sizeof(GridCtx),&gridctx);CHKERRQ(ierr);
  pc_ml->gridctx = gridctx;

  /* wrap ML matrices by PETSc shell matrices at coarsened grids.
     Level 0 is the finest grid for ML, but coarsest for PETSc! */
  gridctx[fine_level].A = A;

  level = fine_level - 1;
  if (size == 1){ /* convert ML P, R and A into seqaij format */
    for (mllevel=1; mllevel<Nlevels; mllevel++){
      mlmat = &(ml_object->Pmat[mllevel]);
      ierr  = MatWrapML_SeqAIJ(mlmat,MAT_INITIAL_MATRIX,&gridctx[level].P);CHKERRQ(ierr);
      mlmat = &(ml_object->Rmat[mllevel-1]);
      ierr  = MatWrapML_SeqAIJ(mlmat,MAT_INITIAL_MATRIX,&gridctx[level].R);CHKERRQ(ierr);

      mlmat = &(ml_object->Amat[mllevel]);
      ierr  = MatWrapML_SeqAIJ(mlmat,MAT_INITIAL_MATRIX,&gridctx[level].A);CHKERRQ(ierr);
      level--;
    }
  } else { /* convert ML P and R into shell format, ML A into mpiaij format */
    for (mllevel=1; mllevel<Nlevels; mllevel++){
      mlmat = &(ml_object->Pmat[mllevel]);
      ierr  = MatWrapML_SHELL(mlmat,MAT_INITIAL_MATRIX,&gridctx[level].P);CHKERRQ(ierr);
      mlmat = &(ml_object->Rmat[mllevel-1]);
      ierr  = MatWrapML_SHELL(mlmat,MAT_INITIAL_MATRIX,&gridctx[level].R);CHKERRQ(ierr);

      mlmat = &(ml_object->Amat[mllevel]);
      ierr  = MatWrapML_MPIAIJ(mlmat,&gridctx[level].A);CHKERRQ(ierr);
      level--;
    }
  }

  /* create vectors and ksp at all levels */
  for (level=0; level<fine_level; level++){
    level1 = level + 1;
    ierr = VecCreate(((PetscObject)gridctx[level].A)->comm,&gridctx[level].x);CHKERRQ(ierr);
    ierr = VecSetSizes(gridctx[level].x,gridctx[level].A->cmap->n,PETSC_DECIDE);CHKERRQ(ierr);
    ierr = VecSetType(gridctx[level].x,VECMPI);CHKERRQ(ierr);
    ierr = PCMGSetX(pc,level,gridctx[level].x);CHKERRQ(ierr);

    ierr = VecCreate(((PetscObject)gridctx[level].A)->comm,&gridctx[level].b);CHKERRQ(ierr);
    ierr = VecSetSizes(gridctx[level].b,gridctx[level].A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
    ierr = VecSetType(gridctx[level].b,VECMPI);CHKERRQ(ierr);
    ierr = PCMGSetRhs(pc,level,gridctx[level].b);CHKERRQ(ierr);

    ierr = VecCreate(((PetscObject)gridctx[level1].A)->comm,&gridctx[level1].r);CHKERRQ(ierr);
    ierr = VecSetSizes(gridctx[level1].r,gridctx[level1].A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
    ierr = VecSetType(gridctx[level1].r,VECMPI);CHKERRQ(ierr);
    ierr = PCMGSetR(pc,level1,gridctx[level1].r);CHKERRQ(ierr);

    if (level == 0){
      ierr = PCMGGetCoarseSolve(pc,&gridctx[level].ksp);CHKERRQ(ierr);
    } else {
      ierr = PCMGGetSmoother(pc,level,&gridctx[level].ksp);CHKERRQ(ierr);
    }
  }
  ierr = PCMGGetSmoother(pc,fine_level,&gridctx[fine_level].ksp);CHKERRQ(ierr);

  /* create coarse level and the interpolation between the levels */
  for (level=0; level<fine_level; level++){
    level1 = level + 1;
    ierr = PCMGSetInterpolation(pc,level1,gridctx[level].P);CHKERRQ(ierr);
    ierr = PCMGSetRestriction(pc,level1,gridctx[level].R);CHKERRQ(ierr);
    if (level > 0){
      ierr = PCMGSetResidual(pc,level,PCMGDefaultResidual,gridctx[level].A);CHKERRQ(ierr);
    }
    ierr = KSPSetOperators(gridctx[level].ksp,gridctx[level].A,gridctx[level].A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
  }
  ierr = PCMGSetResidual(pc,fine_level,PCMGDefaultResidual,gridctx[fine_level].A);CHKERRQ(ierr);
  ierr = KSPSetOperators(gridctx[fine_level].ksp,gridctx[fine_level].A,gridctx[fine_level].A,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);

  /* setupcalled is set to 0 so that MG is setup from scratch */
  pc->setupcalled = 0;
  ierr = PCSetUp_MG(pc);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* -------------------------------------------------------------------------- */
/*
   PCDestroy_ML - Destroys the private context for the ML preconditioner
   that was created with PCCreate_ML().

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCDestroy()
*/
#undef __FUNCT__
#define __FUNCT__ "PCDestroy_ML"
PetscErrorCode PCDestroy_ML(PC pc)
{
  PetscErrorCode  ierr;
  PC_MG           *mg = (PC_MG*)pc->data;
  PC_ML           *pc_ml= (PC_ML*)mg->innerctx;

  PetscFunctionBegin;
  ierr = PCDestroy_ML_Private(pc_ml);CHKERRQ(ierr);
  ierr = PetscFree(pc_ml);CHKERRQ(ierr);
  ierr = PCDestroy_MG(pc);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "PCSetFromOptions_ML"
PetscErrorCode PCSetFromOptions_ML(PC pc)
{
  PetscErrorCode  ierr;
  PetscInt        indx,PrintLevel;
  const char      *scheme[] = {"Uncoupled","Coupled","MIS","METIS"};
  PC_MG           *mg = (PC_MG*)pc->data;
  PC_ML           *pc_ml = (PC_ML*)mg->innerctx;

  PetscFunctionBegin;
  ierr = PetscOptionsHead("ML options");CHKERRQ(ierr);
  PrintLevel    = 0;
  indx          = 0;
  ierr = PetscOptionsInt("-pc_ml_PrintLevel","Print level","ML_Set_PrintLevel",PrintLevel,&PrintLevel,PETSC_NULL);CHKERRQ(ierr);
  ML_Set_PrintLevel(PrintLevel);
  ierr = PetscOptionsInt("-pc_ml_maxNlevels","Maximum number of levels","None",pc_ml->MaxNlevels,&pc_ml->MaxNlevels,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsInt("-pc_ml_maxCoarseSize","Maximum coarsest mesh size","ML_Aggregate_Set_MaxCoarseSize",pc_ml->MaxCoarseSize,&pc_ml->MaxCoarseSize,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsEList("-pc_ml_CoarsenScheme","Aggregate Coarsen Scheme","ML_Aggregate_Set_CoarsenScheme_*",scheme,4,scheme[0],&indx,PETSC_NULL);CHKERRQ(ierr);
  pc_ml->CoarsenScheme = indx;
  ierr = PetscOptionsReal("-pc_ml_DampingFactor","P damping factor","ML_Aggregate_Set_DampingFactor",pc_ml->DampingFactor,&pc_ml->DampingFactor,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsReal("-pc_ml_Threshold","Smoother drop tol","ML_Aggregate_Set_Threshold",pc_ml->Threshold,&pc_ml->Threshold,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsTruth("-pc_ml_SpectralNormScheme_Anorm","Method used for estimating spectral radius","ML_Set_SpectralNormScheme_Anorm",pc_ml->SpectralNormScheme_Anorm,&pc_ml->SpectralNormScheme_Anorm,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsTail();CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* -------------------------------------------------------------------------- */
/*
   PCCreate_ML - Creates an ML preconditioner context, PC_ML,
   and sets this as the private data within the generic preconditioning
   context, PC, that was created within PCCreate().

   Input Parameter:
.  pc - the preconditioner context

   Application Interface Routine: PCCreate()
*/

/*MC
     PCML - Use algebraic multigrid preconditioning. This preconditioner requires that you provide
       the fine grid discretization matrix. The coarser grid matrices and restriction/interpolation
       operators are computed by ML, with the matrices converted to PETSc matrices in AIJ format
       and the restriction/interpolation operators wrapped as PETSc shell matrices.

   Options Database Keys:
   Multigrid options (inherited)
+  -pc_mg_cycles <1>: 1 for V cycle, 2 for W-cycle (PCMGSetCycles)
.  -pc_mg_smoothup <1>: Number of post-smoothing steps (PCMGSetNumberSmoothUp)
.  -pc_mg_smoothdown <1>: Number of pre-smoothing steps (PCMGSetNumberSmoothDown)
-  -pc_mg_type <multiplicative>: (one of) additive multiplicative full cascade kascade

   ML options:
+  -pc_ml_PrintLevel <0>: Print level (ML_Set_PrintLevel)
.  -pc_ml_maxNlevels <10>: Maximum number of levels (None)
.  -pc_ml_maxCoarseSize <1>: Maximum coarsest mesh size (ML_Aggregate_Set_MaxCoarseSize)
.  -pc_ml_CoarsenScheme <Uncoupled>: (one of) Uncoupled Coupled MIS METIS
.  -pc_ml_DampingFactor <1.33333>: P damping factor (ML_Aggregate_Set_DampingFactor)
.  -pc_ml_Threshold <0>: Smoother drop tol (ML_Aggregate_Set_Threshold)
-  -pc_ml_SpectralNormScheme_Anorm <false>: Method used for estimating spectral radius (ML_Set_SpectralNormScheme_Anorm)

   Level: intermediate

  Concepts: multigrid

.seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC, PCMGType,
           PCMGSetLevels(), PCMGGetLevels(), PCMGSetType(), PCMGSetCycles(), PCMGSetNumberSmoothDown(),
           PCMGSetNumberSmoothUp(), PCMGGetCoarseSolve(), PCMGSetResidual(), PCMGSetInterpolation(),
           PCMGSetRestriction(), PCMGGetSmoother(), PCMGGetSmootherUp(), PCMGGetSmootherDown(),
           PCMGSetCyclesOnLevel(), PCMGSetRhs(), PCMGSetX(), PCMGSetR()
M*/
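/* A minimal usage sketch (assumes an assembled AIJ matrix A and vectors b and x;
   error checking omitted):

      KSP ksp;
      PC  pc;
      KSPCreate(PETSC_COMM_WORLD,&ksp);
      KSPSetOperators(ksp,A,A,DIFFERENT_NONZERO_PATTERN);
      KSPGetPC(ksp,&pc);
      PCSetType(pc,PCML);
      KSPSetFromOptions(ksp);    (picks up the -pc_ml_* and -pc_mg_* options above)
      KSPSolve(ksp,b,x);
      KSPDestroy(ksp);

   Equivalently, run an existing code with -pc_type ml. */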

EXTERN_C_BEGIN
#undef __FUNCT__
#define __FUNCT__ "PCCreate_ML"
PetscErrorCode PETSCKSP_DLLEXPORT PCCreate_ML(PC pc)
{
  PetscErrorCode  ierr;
  PC_ML           *pc_ml;
  PC_MG           *mg;

  PetscFunctionBegin;
  /* PCML is an inherited class of PCMG. Initialize pc as PCMG */
  ierr = PetscObjectChangeTypeName((PetscObject)pc,PCML);CHKERRQ(ierr);
  ierr = PCSetType(pc,PCMG);CHKERRQ(ierr); /* calls PCCreate_MG() and MGCreate_Private() */

  /* create a supporting struct and attach it to pc */
  ierr = PetscNewLog(pc,PC_ML,&pc_ml);CHKERRQ(ierr);
  mg = (PC_MG*)pc->data;
  mg->innerctx = pc_ml;

  pc_ml->ml_object     = 0;
  pc_ml->agg_object    = 0;
  pc_ml->gridctx       = 0;
  pc_ml->PetscMLdata   = 0;
  pc_ml->Nlevels       = -1;
  pc_ml->MaxNlevels    = 10;
  pc_ml->MaxCoarseSize = 1;
  pc_ml->CoarsenScheme = 1;
  pc_ml->Threshold     = 0.0;
  pc_ml->DampingFactor = 4.0/3.0;
  pc_ml->SpectralNormScheme_Anorm = PETSC_FALSE;
  pc_ml->size          = 0;

  /* overwrite the pointers of PCMG by the functions of PCML */
  pc->ops->setfromoptions = PCSetFromOptions_ML;
  pc->ops->setup          = PCSetUp_ML;
  pc->ops->destroy        = PCDestroy_ML;
  PetscFunctionReturn(0);
}
EXTERN_C_END
807