/* Defines projective product routines where A is a SeqAIJ matrix C = P^T * A * P */ #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ #include <../src/mat/utils/freespace.h> #include #include #if defined(PETSC_HAVE_HYPRE) PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat,Mat,PetscReal,Mat); #endif PetscErrorCode MatProductSymbolic_PtAP_SeqAIJ_SeqAIJ(Mat C) { PetscErrorCode ierr; Mat_Product *product = C->product; Mat A=product->A,P=product->B; MatProductAlgorithm alg=product->alg; PetscReal fill=product->fill; PetscBool flg; Mat Pt; PetscFunctionBegin; /* "scalable" */ ierr = PetscStrcmp(alg,"scalable",&flg);CHKERRQ(ierr); if (flg) { ierr = MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy(A,P,fill,C);CHKERRQ(ierr); C->ops->productnumeric = MatProductNumeric_PtAP; PetscFunctionReturn(0); } /* "rap" */ ierr = PetscStrcmp(alg,"rap",&flg);CHKERRQ(ierr); if (flg) { Mat_MatTransMatMult *atb; ierr = PetscNew(&atb);CHKERRQ(ierr); ierr = MatTranspose_SeqAIJ(P,MAT_INITIAL_MATRIX,&Pt);CHKERRQ(ierr); ierr = MatMatMatMultSymbolic_SeqAIJ_SeqAIJ_SeqAIJ(Pt,A,P,fill,C);CHKERRQ(ierr); atb->At = Pt; atb->data = C->product->data; atb->destroy = C->product->destroy; C->product->data = atb; C->product->destroy = MatDestroy_SeqAIJ_MatTransMatMult; C->ops->ptapnumeric = MatPtAPNumeric_SeqAIJ_SeqAIJ; C->ops->productnumeric = MatProductNumeric_PtAP; PetscFunctionReturn(0); } /* hypre */ #if defined(PETSC_HAVE_HYPRE) ierr = PetscStrcmp(alg,"hypre",&flg);CHKERRQ(ierr); if (flg) { ierr = MatPtAPSymbolic_AIJ_AIJ_wHYPRE(A,P,fill,C);CHKERRQ(ierr); PetscFunctionReturn(0); } #endif SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatProductType is not supported"); PetscFunctionReturn(0); } PetscErrorCode MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy(Mat A,Mat P,PetscReal fill,Mat C) { PetscErrorCode ierr; PetscFreeSpaceList free_space=NULL,current_space=NULL; Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*p = (Mat_SeqAIJ*)P->data,*c; PetscInt *pti,*ptj,*ptJ,*ai=a->i,*aj=a->j,*ajj,*pi=p->i,*pj=p->j,*pjj; PetscInt *ci,*cj,*ptadenserow,*ptasparserow,*ptaj,nspacedouble=0; PetscInt an=A->cmap->N,am=A->rmap->N,pn=P->cmap->N,pm=P->rmap->N; PetscInt i,j,k,ptnzi,arow,anzj,ptanzi,prow,pnzj,cnzi,nlnk,*lnk; MatScalar *ca; PetscBT lnkbt; PetscReal afill; PetscFunctionBegin; /* Get ij structure of P^T */ ierr = MatGetSymbolicTranspose_SeqAIJ(P,&pti,&ptj);CHKERRQ(ierr); ptJ = ptj; /* Allocate ci array, arrays for fill computation and */ /* free space for accumulating nonzero column info */ ierr = PetscMalloc1(pn+1,&ci);CHKERRQ(ierr); ci[0] = 0; ierr = PetscCalloc1(2*an+1,&ptadenserow);CHKERRQ(ierr); ptasparserow = ptadenserow + an; /* create and initialize a linked list */ nlnk = pn+1; ierr = PetscLLCreate(pn,pn,nlnk,lnk,lnkbt);CHKERRQ(ierr); /* Set initial free space to be fill*(nnz(A)+ nnz(P)) */ ierr = PetscFreeSpaceGet(PetscRealIntMultTruncate(fill,PetscIntSumTruncate(ai[am],pi[pm])),&free_space);CHKERRQ(ierr); current_space = free_space; /* Determine symbolic info for each row of C: */ for (i=0; ilocal_remainingtotal_array_size),¤t_space);CHKERRQ(ierr); nspacedouble++; } /* Copy data into free space, and zero out denserows */ ierr = PetscLLClean(pn,pn,cnzi,lnk,current_space->array,lnkbt);CHKERRQ(ierr); current_space->array += cnzi; current_space->local_used += cnzi; current_space->local_remaining -= cnzi; for (j=0; jtype_name,C);CHKERRQ(ierr); ierr = MatSetBlockSizes(C,PetscAbs(P->cmap->bs),PetscAbs(P->cmap->bs));CHKERRQ(ierr); /* MatCreateSeqAIJWithArrays flags matrix so PETSc doesn't free the user's arrays. */ /* Since these are PETSc arrays, change flags to free them as necessary. */ c = (Mat_SeqAIJ*)((C)->data); c->free_a = PETSC_TRUE; c->free_ij = PETSC_TRUE; c->nonew = 0; C->ops->ptapnumeric = MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy; /* set MatInfo */ afill = (PetscReal)ci[pn]/(ai[am]+pi[pm] + 1.e-5); if (afill < 1.0) afill = 1.0; c->maxnz = ci[pn]; c->nz = ci[pn]; C->info.mallocs = nspacedouble; C->info.fill_ratio_given = fill; C->info.fill_ratio_needed = afill; /* Clean up. */ ierr = MatRestoreSymbolicTranspose_SeqAIJ(P,&pti,&ptj);CHKERRQ(ierr); #if defined(PETSC_USE_INFO) if (ci[pn] != 0) { ierr = PetscInfo3(C,"Reallocs %D; Fill ratio: given %g needed %g.\n",nspacedouble,(double)fill,(double)afill);CHKERRQ(ierr); ierr = PetscInfo1(C,"Use MatPtAP(A,P,MatReuse,%g,&C) for best performance.\n",(double)afill);CHKERRQ(ierr); } else { ierr = PetscInfo(C,"Empty matrix product\n");CHKERRQ(ierr); } #endif PetscFunctionReturn(0); } PetscErrorCode MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy(Mat A,Mat P,Mat C) { PetscErrorCode ierr; Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; Mat_SeqAIJ *p = (Mat_SeqAIJ*) P->data; Mat_SeqAIJ *c = (Mat_SeqAIJ*) C->data; PetscInt *ai=a->i,*aj=a->j,*apj,*apjdense,*pi=p->i,*pj=p->j,*pJ=p->j,*pjj; PetscInt *ci=c->i,*cj=c->j,*cjj; PetscInt am =A->rmap->N,cn=C->cmap->N,cm=C->rmap->N; PetscInt i,j,k,anzi,pnzi,apnzj,nextap,pnzj,prow,crow; MatScalar *aa=a->a,*apa,*pa=p->a,*pA=p->a,*paj,*ca=c->a,*caj; PetscFunctionBegin; /* Allocate temporary array for storage of one row of A*P (cn: non-scalable) */ ierr = PetscCalloc2(cn,&apa,cn,&apjdense);CHKERRQ(ierr); ierr = PetscMalloc1(cn,&apj);CHKERRQ(ierr); /* Clear old values in C */ ierr = PetscArrayzero(ca,ci[cm]);CHKERRQ(ierr); for (i=0; i= ci[crow+1] - ci[crow])) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"k too large k %d, crow %d",k,crow); if (cjj[k]==apj[nextap]) { caj[k] += (*pA)*apa[apj[nextap++]]; } } ierr = PetscLogFlops(2.0*apnzj);CHKERRQ(ierr); pA++; } /* Zero the current row info for A*P */ for (j=0; jproduct->data; if (!atb) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Missing data structure"); ierr = MatTranspose_SeqAIJ(P,MAT_REUSE_MATRIX,&atb->At);CHKERRQ(ierr); if (!C->ops->matmultnumeric) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Missing numeric operation"); /* when using rap, MatMatMatMultSymbolic used a different data */ if (atb->data) C->product->data = atb->data; ierr = (*C->ops->matmatmultnumeric)(atb->At,A,P,C);CHKERRQ(ierr); C->product->data = atb; PetscFunctionReturn(0); }