/* Defines projective product routines where A is a SeqAIJ matrix C = P^T * A * P */ #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ #include <../src/mat/utils/freespace.h> #include #include #if defined(PETSC_HAVE_HYPRE) PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat,Mat,PetscReal,Mat*); #endif PETSC_INTERN PetscErrorCode MatPtAP_SeqAIJ_SeqAIJ(Mat A,Mat P,MatReuse scall,PetscReal fill,Mat *C) { PetscErrorCode ierr; #if !defined(PETSC_HAVE_HYPRE) const char *algTypes[2] = {"scalable","rap"}; PetscInt nalg = 2; #else const char *algTypes[3] = {"scalable","rap","hypre"}; PetscInt nalg = 3; #endif PetscInt alg = 1; /* set default algorithm */ Mat Pt; Mat_MatTransMatMult *atb; Mat_SeqAIJ *c; PetscFunctionBegin; if (scall == MAT_INITIAL_MATRIX) { /* Alg 'scalable' determines which implementations to be used: "rap": Pt = P^T and C = Pt*A*P "scalable": do outer product and two sparse axpy in MatPtAPNumeric() - might slow, does not store structure of A*P. "hypre": use boomerAMGBuildCoarseOperator. */ ierr = PetscObjectOptionsBegin((PetscObject)A);CHKERRQ(ierr); PetscOptionsObject->alreadyprinted = PETSC_FALSE; /* a hack to ensure the option shows in '-help' */ ierr = PetscOptionsEList("-matptap_via","Algorithmic approach","MatPtAP",algTypes,nalg,algTypes[0],&alg,NULL);CHKERRQ(ierr); ierr = PetscOptionsEnd();CHKERRQ(ierr); switch (alg) { case 1: ierr = PetscNew(&atb);CHKERRQ(ierr); ierr = MatTranspose_SeqAIJ(P,MAT_INITIAL_MATRIX,&Pt);CHKERRQ(ierr); ierr = MatMatMatMult(Pt,A,P,MAT_INITIAL_MATRIX,fill,C);CHKERRQ(ierr); c = (Mat_SeqAIJ*)(*C)->data; c->atb = atb; atb->At = Pt; atb->destroy = (*C)->ops->destroy; (*C)->ops->destroy = MatDestroy_SeqAIJ_MatTransMatMult; (*C)->ops->ptapnumeric = MatPtAPNumeric_SeqAIJ_SeqAIJ; PetscFunctionReturn(0); break; #if defined(PETSC_HAVE_HYPRE) case 2: ierr = MatPtAPSymbolic_AIJ_AIJ_wHYPRE(A,P,fill,C);CHKERRQ(ierr); break; #endif default: ierr = MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy(A,P,fill,C);CHKERRQ(ierr); break; } } ierr = (*(*C)->ops->ptapnumeric)(A,P,*C);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatDestroy_SeqAIJ_PtAP(Mat A) { PetscErrorCode ierr; Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; Mat_PtAP *ptap = a->ptap; PetscFunctionBegin; ierr = PetscFree(ptap->apa);CHKERRQ(ierr); ierr = PetscFree(ptap->api);CHKERRQ(ierr); ierr = PetscFree(ptap->apj);CHKERRQ(ierr); ierr = (ptap->destroy)(A);CHKERRQ(ierr); ierr = PetscFree(ptap);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy(Mat A,Mat P,PetscReal fill,Mat *C) { PetscErrorCode ierr; PetscFreeSpaceList free_space=NULL,current_space=NULL; Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*p = (Mat_SeqAIJ*)P->data,*c; PetscInt *pti,*ptj,*ptJ,*ai=a->i,*aj=a->j,*ajj,*pi=p->i,*pj=p->j,*pjj; PetscInt *ci,*cj,*ptadenserow,*ptasparserow,*ptaj,nspacedouble=0; PetscInt an=A->cmap->N,am=A->rmap->N,pn=P->cmap->N,pm=P->rmap->N; PetscInt i,j,k,ptnzi,arow,anzj,ptanzi,prow,pnzj,cnzi,nlnk,*lnk; MatScalar *ca; PetscBT lnkbt; PetscReal afill; PetscFunctionBegin; /* Get ij structure of P^T */ ierr = MatGetSymbolicTranspose_SeqAIJ(P,&pti,&ptj);CHKERRQ(ierr); ptJ = ptj; /* Allocate ci array, arrays for fill computation and */ /* free space for accumulating nonzero column info */ ierr = PetscMalloc1(pn+1,&ci);CHKERRQ(ierr); ci[0] = 0; ierr = PetscCalloc1(2*an+1,&ptadenserow);CHKERRQ(ierr); ptasparserow = ptadenserow + an; /* create and initialize a linked list */ nlnk = pn+1; ierr = PetscLLCreate(pn,pn,nlnk,lnk,lnkbt);CHKERRQ(ierr); /* Set initial free space to be fill*(nnz(A)+ nnz(P)) */ ierr = PetscFreeSpaceGet(PetscRealIntMultTruncate(fill,PetscIntSumTruncate(ai[am],pi[pm])),&free_space);CHKERRQ(ierr); current_space = free_space; /* Determine symbolic info for each row of C: */ for (i=0; ilocal_remainingtotal_array_size),¤t_space);CHKERRQ(ierr); nspacedouble++; } /* Copy data into free space, and zero out denserows */ ierr = PetscLLClean(pn,pn,cnzi,lnk,current_space->array,lnkbt);CHKERRQ(ierr); current_space->array += cnzi; current_space->local_used += cnzi; current_space->local_remaining -= cnzi; for (j=0; jcmap->bs),PetscAbs(P->cmap->bs));CHKERRQ(ierr); /* MatCreateSeqAIJWithArrays flags matrix so PETSc doesn't free the user's arrays. */ /* Since these are PETSc arrays, change flags to free them as necessary. */ c = (Mat_SeqAIJ*)((*C)->data); c->free_a = PETSC_TRUE; c->free_ij = PETSC_TRUE; c->nonew = 0; (*C)->ops->ptapnumeric = MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy; /* set MatInfo */ afill = (PetscReal)ci[pn]/(ai[am]+pi[pm] + 1.e-5); if (afill < 1.0) afill = 1.0; c->maxnz = ci[pn]; c->nz = ci[pn]; (*C)->info.mallocs = nspacedouble; (*C)->info.fill_ratio_given = fill; (*C)->info.fill_ratio_needed = afill; /* Clean up. */ ierr = MatRestoreSymbolicTranspose_SeqAIJ(P,&pti,&ptj);CHKERRQ(ierr); #if defined(PETSC_USE_INFO) if (ci[pn] != 0) { ierr = PetscInfo3((*C),"Reallocs %D; Fill ratio: given %g needed %g.\n",nspacedouble,(double)fill,(double)afill);CHKERRQ(ierr); ierr = PetscInfo1((*C),"Use MatPtAP(A,P,MatReuse,%g,&C) for best performance.\n",(double)afill);CHKERRQ(ierr); } else { ierr = PetscInfo((*C),"Empty matrix product\n");CHKERRQ(ierr); } #endif PetscFunctionReturn(0); } PetscErrorCode MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy(Mat A,Mat P,Mat C) { PetscErrorCode ierr; Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; Mat_SeqAIJ *p = (Mat_SeqAIJ*) P->data; Mat_SeqAIJ *c = (Mat_SeqAIJ*) C->data; PetscInt *ai=a->i,*aj=a->j,*apj,*apjdense,*pi=p->i,*pj=p->j,*pJ=p->j,*pjj; PetscInt *ci=c->i,*cj=c->j,*cjj; PetscInt am =A->rmap->N,cn=C->cmap->N,cm=C->rmap->N; PetscInt i,j,k,anzi,pnzi,apnzj,nextap,pnzj,prow,crow; MatScalar *aa=a->a,*apa,*pa=p->a,*pA=p->a,*paj,*ca=c->a,*caj; PetscFunctionBegin; /* Allocate temporary array for storage of one row of A*P (cn: non-scalable) */ ierr = PetscMalloc3(cn,&apa,cn,&apjdense,cn,&apj);CHKERRQ(ierr); ierr = PetscMemzero(apa,cn*sizeof(MatScalar));CHKERRQ(ierr); ierr = PetscMemzero(apjdense,cn*sizeof(PetscInt));CHKERRQ(ierr); /* Clear old values in C */ ierr = PetscMemzero(ca,ci[cm]*sizeof(MatScalar));CHKERRQ(ierr); for (i=0; i= ci[crow+1] - ci[crow]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"k too large k %d, crow %d",k,crow); #endif if (cjj[k]==apj[nextap]) { caj[k] += (*pA)*apa[apj[nextap++]]; } } ierr = PetscLogFlops(2.0*apnzj);CHKERRQ(ierr); pA++; } /* Zero the current row info for A*P */ for (j=0; jdata; Mat_MatTransMatMult *atb = c->atb; Mat Pt = atb->At; PetscFunctionBegin; ierr = MatTranspose_SeqAIJ(P,MAT_REUSE_MATRIX,&Pt);CHKERRQ(ierr); ierr = (C->ops->matmatmultnumeric)(Pt,A,P,C);CHKERRQ(ierr); PetscFunctionReturn(0); }