#include #include #include #include /*I "petscksp.h" I*/ #include #include #include "../src/ksp/pc/impls/telescope/telescope.h" static PetscBool cited = PETSC_FALSE; static const char citation[] = "@inproceedings{MaySananRuppKnepleySmith2016,\n" " title = {Extreme-Scale Multigrid Components within PETSc},\n" " author = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n" " booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n" " series = {PASC '16},\n" " isbn = {978-1-4503-4126-4},\n" " location = {Lausanne, Switzerland},\n" " pages = {5:1--5:12},\n" " articleno = {5},\n" " numpages = {12},\n" " url = {https://doi.acm.org/10.1145/2929908.2929913},\n" " doi = {10.1145/2929908.2929913},\n" " acmid = {2929913},\n" " publisher = {ACM},\n" " address = {New York, NY, USA},\n" " keywords = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n" " year = {2016}\n" "}\n"; static PetscErrorCode _DMDADetermineRankFromGlobalIJK(PetscInt dim,PetscInt i,PetscInt j,PetscInt k, PetscInt Mp,PetscInt Np,PetscInt Pp, PetscInt start_i[],PetscInt start_j[],PetscInt start_k[], PetscInt span_i[],PetscInt span_j[],PetscInt span_k[], PetscMPIInt *_pi,PetscMPIInt *_pj,PetscMPIInt *_pk,PetscMPIInt *rank_re) { PetscInt pi,pj,pk,n; PetscFunctionBegin; *rank_re = -1; if (_pi) *_pi = -1; if (_pj) *_pj = -1; if (_pk) *_pk = -1; pi = pj = pk = -1; if (_pi) { for (n=0; n= start_i[n]) && (i < start_i[n]+span_i[n])) { pi = n; break; } } if (pi == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pi cannot be determined : range %D, val %D",Mp,i); *_pi = pi; } if (_pj) { for (n=0; n= start_j[n]) && (j < start_j[n]+span_j[n])) { pj = n; break; } } if (pj == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pj cannot be determined : range %D, val %D",Np,j); *_pj = pj; } if (_pk) { for (n=0; n= start_k[n]) && (k < start_k[n]+span_k[n])) { pk = n; break; } } if (pk == -1) 
SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pk cannot be determined : range %D, val %D",Pp,k); *_pk = pk; } switch (dim) { case 1: *rank_re = pi; break; case 2: *rank_re = pi + pj * Mp; break; case 3: *rank_re = pi + pj * Mp + pk * (Mp*Np); break; } PetscFunctionReturn(0); } static PetscErrorCode _DMDADetermineGlobalS0(PetscInt dim,PetscMPIInt rank_re,PetscInt Mp_re,PetscInt Np_re,PetscInt Pp_re, PetscInt range_i_re[],PetscInt range_j_re[],PetscInt range_k_re[],PetscInt *s0) { PetscInt i,j,k,start_IJK = 0; PetscInt rank_ijk; PetscFunctionBegin; switch (dim) { case 1: for (i=0; ipsubcomm; comm = PetscSubcommParent(psubcomm); subdm = ctx->dmrepart; ierr = PetscInfo(pc,"PCTelescope: setting up the coordinates (DMDA)\n");CHKERRQ(ierr); ierr = DMDAGetInfo(dm,&dim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); switch (dim) { case 1: SETERRQ(comm,PETSC_ERR_SUP,"Telescope: DMDA (1D) repartitioning not provided"); case 2: ierr = PCTelescopeSetUp_dmda_repart_coors2d(sred,dm,subdm);CHKERRQ(ierr); break; case 3: ierr = PCTelescopeSetUp_dmda_repart_coors3d(sred,dm,subdm);CHKERRQ(ierr); break; } PetscFunctionReturn(0); } /* setup repartitioned dm */ PetscErrorCode PCTelescopeSetUp_dmda_repart(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) { PetscErrorCode ierr; DM dm; PetscInt dim,nx,ny,nz,ndof,nsw,sum,k; DMBoundaryType bx,by,bz; DMDAStencilType stencil; const PetscInt *_range_i_re; const PetscInt *_range_j_re; const PetscInt *_range_k_re; DMDAInterpolationType itype; PetscInt refine_x,refine_y,refine_z; MPI_Comm comm,subcomm; const char *prefix; PetscFunctionBegin; comm = PetscSubcommParent(sred->psubcomm); subcomm = PetscSubcommChild(sred->psubcomm); ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,&dim,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,&nsw,&bx,&by,&bz,&stencil);CHKERRQ(ierr); ierr = DMDAGetInterpolationType(dm,&itype);CHKERRQ(ierr); ierr = DMDAGetRefinementFactor(dm,&refine_x,&refine_y,&refine_z);CHKERRQ(ierr); ctx->dmrepart 
= NULL; _range_i_re = _range_j_re = _range_k_re = NULL; /* Create DMDA on the child communicator */ if (PCTelescope_isActiveRank(sred)) { switch (dim) { case 1: ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (1D)\n");CHKERRQ(ierr); /*ierr = DMDACreate1d(subcomm,bx,nx,ndof,nsw,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ ny = nz = 1; by = bz = DM_BOUNDARY_NONE; break; case 2: ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (2D)\n");CHKERRQ(ierr); /*ierr = DMDACreate2d(subcomm,bx,by,stencil,nx,ny, PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ nz = 1; bz = DM_BOUNDARY_NONE; break; case 3: ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (3D)\n");CHKERRQ(ierr); /*ierr = DMDACreate3d(subcomm,bx,by,bz,stencil,nx,ny,nz, PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ break; } /* The API DMDACreate1d(), DMDACreate2d(), DMDACreate3d() does not allow us to set/append a unique option prefix for the DM, thus I prefer to expose the contents of these API's here. This allows users to control the partitioning of the subDM. 
*/ ierr = DMDACreate(subcomm,&ctx->dmrepart);CHKERRQ(ierr); /* Set unique option prefix name */ ierr = KSPGetOptionsPrefix(sred->ksp,&prefix);CHKERRQ(ierr); ierr = DMSetOptionsPrefix(ctx->dmrepart,prefix);CHKERRQ(ierr); ierr = DMAppendOptionsPrefix(ctx->dmrepart,"repart_");CHKERRQ(ierr); /* standard setup from DMDACreate{1,2,3}d() */ ierr = DMSetDimension(ctx->dmrepart,dim);CHKERRQ(ierr); ierr = DMDASetSizes(ctx->dmrepart,nx,ny,nz);CHKERRQ(ierr); ierr = DMDASetNumProcs(ctx->dmrepart,PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); ierr = DMDASetBoundaryType(ctx->dmrepart,bx,by,bz);CHKERRQ(ierr); ierr = DMDASetDof(ctx->dmrepart,ndof);CHKERRQ(ierr); ierr = DMDASetStencilType(ctx->dmrepart,stencil);CHKERRQ(ierr); ierr = DMDASetStencilWidth(ctx->dmrepart,nsw);CHKERRQ(ierr); ierr = DMDASetOwnershipRanges(ctx->dmrepart,NULL,NULL,NULL);CHKERRQ(ierr); ierr = DMSetFromOptions(ctx->dmrepart);CHKERRQ(ierr); ierr = DMSetUp(ctx->dmrepart);CHKERRQ(ierr); /* Set refinement factors and interpolation type from the partent */ ierr = DMDASetRefinementFactor(ctx->dmrepart,refine_x,refine_y,refine_z);CHKERRQ(ierr); ierr = DMDASetInterpolationType(ctx->dmrepart,itype);CHKERRQ(ierr); ierr = DMDAGetInfo(ctx->dmrepart,NULL,NULL,NULL,NULL,&ctx->Mp_re,&ctx->Np_re,&ctx->Pp_re,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); ierr = DMDAGetOwnershipRanges(ctx->dmrepart,&_range_i_re,&_range_j_re,&_range_k_re);CHKERRQ(ierr); ctx->dmrepart->ops->creatematrix = dm->ops->creatematrix; ctx->dmrepart->ops->createdomaindecomposition = dm->ops->createdomaindecomposition; } /* generate ranges for repartitioned dm */ /* note - assume rank 0 always participates */ /* TODO: use a single MPI call */ ierr = MPI_Bcast(&ctx->Mp_re,1,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = MPI_Bcast(&ctx->Np_re,1,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = MPI_Bcast(&ctx->Pp_re,1,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = 
PetscCalloc3(ctx->Mp_re,&ctx->range_i_re,ctx->Np_re,&ctx->range_j_re,ctx->Pp_re,&ctx->range_k_re);CHKERRQ(ierr); if (_range_i_re) {ierr = PetscArraycpy(ctx->range_i_re,_range_i_re,ctx->Mp_re);CHKERRQ(ierr);} if (_range_j_re) {ierr = PetscArraycpy(ctx->range_j_re,_range_j_re,ctx->Np_re);CHKERRQ(ierr);} if (_range_k_re) {ierr = PetscArraycpy(ctx->range_k_re,_range_k_re,ctx->Pp_re);CHKERRQ(ierr);} /* TODO: use a single MPI call */ ierr = MPI_Bcast(ctx->range_i_re,ctx->Mp_re,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = MPI_Bcast(ctx->range_j_re,ctx->Np_re,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = MPI_Bcast(ctx->range_k_re,ctx->Pp_re,MPIU_INT,0,comm);CHKERRMPI(ierr); ierr = PetscMalloc3(ctx->Mp_re,&ctx->start_i_re,ctx->Np_re,&ctx->start_j_re,ctx->Pp_re,&ctx->start_k_re);CHKERRQ(ierr); sum = 0; for (k=0; kMp_re; k++) { ctx->start_i_re[k] = sum; sum += ctx->range_i_re[k]; } sum = 0; for (k=0; kNp_re; k++) { ctx->start_j_re[k] = sum; sum += ctx->range_j_re[k]; } sum = 0; for (k=0; kPp_re; k++) { ctx->start_k_re[k] = sum; sum += ctx->range_k_re[k]; } /* attach repartitioned dm to child ksp */ { PetscErrorCode (*dmksp_func)(KSP,Mat,Mat,void*); void *dmksp_ctx; ierr = DMKSPGetComputeOperators(dm,&dmksp_func,&dmksp_ctx);CHKERRQ(ierr); /* attach dm to ksp on sub communicator */ if (PCTelescope_isActiveRank(sred)) { ierr = KSPSetDM(sred->ksp,ctx->dmrepart);CHKERRQ(ierr); if (!dmksp_func || sred->ignore_kspcomputeoperators) { ierr = KSPSetDMActive(sred->ksp,PETSC_FALSE);CHKERRQ(ierr); } else { /* sub ksp inherits dmksp_func and context provided by user */ ierr = KSPSetComputeOperators(sred->ksp,dmksp_func,dmksp_ctx);CHKERRQ(ierr); ierr = KSPSetDMActive(sred->ksp,PETSC_TRUE);CHKERRQ(ierr); } } } PetscFunctionReturn(0); } PetscErrorCode PCTelescopeSetUp_dmda_permutation_3d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) { PetscErrorCode ierr; DM dm; MPI_Comm comm; Mat Pscalar,P; PetscInt ndof; PetscInt i,j,k,location,startI[3],endI[3],lenI[3],nx,ny,nz; PetscInt sr,er,Mr; Vec V; 
PetscFunctionBegin; ierr = PetscInfo(pc,"PCTelescope: setting up the permutation matrix (DMDA-3D)\n");CHKERRQ(ierr); ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,NULL,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); ierr = DMGetGlobalVector(dm,&V);CHKERRQ(ierr); ierr = VecGetSize(V,&Mr);CHKERRQ(ierr); ierr = VecGetOwnershipRange(V,&sr,&er);CHKERRQ(ierr); ierr = DMRestoreGlobalVector(dm,&V);CHKERRQ(ierr); sr = sr / ndof; er = er / ndof; Mr = Mr / ndof; ierr = MatCreate(comm,&Pscalar);CHKERRQ(ierr); ierr = MatSetSizes(Pscalar,(er-sr),(er-sr),Mr,Mr);CHKERRQ(ierr); ierr = MatSetType(Pscalar,MATAIJ);CHKERRQ(ierr); ierr = MatSeqAIJSetPreallocation(Pscalar,1,NULL);CHKERRQ(ierr); ierr = MatMPIAIJSetPreallocation(Pscalar,1,NULL,1,NULL);CHKERRQ(ierr); ierr = DMDAGetCorners(dm,NULL,NULL,NULL,&lenI[0],&lenI[1],&lenI[2]);CHKERRQ(ierr); ierr = DMDAGetCorners(dm,&startI[0],&startI[1],&startI[2],&endI[0],&endI[1],&endI[2]);CHKERRQ(ierr); endI[0] += startI[0]; endI[1] += startI[1]; endI[2] += startI[2]; for (k=startI[2]; kMp_re,ctx->Np_re,ctx->Pp_re, ctx->start_i_re,ctx->start_j_re,ctx->start_k_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, &rank_reI[0],&rank_reI[1],&rank_reI[2],&rank_ijk_re);CHKERRQ(ierr); ierr = _DMDADetermineGlobalS0(3,rank_ijk_re, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, &s0_re);CHKERRQ(ierr); ii = i - ctx->start_i_re[ rank_reI[0] ]; if (ii < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error ii"); jj = j - ctx->start_j_re[ rank_reI[1] ]; if (jj < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error jj"); kk = k - ctx->start_k_re[ rank_reI[2] ]; if (kk < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error kk"); lenI_re[0] = ctx->range_i_re[ rank_reI[0] ]; lenI_re[1] = ctx->range_j_re[ rank_reI[1] ]; lenI_re[2] = ctx->range_k_re[ rank_reI[2] ]; 
local_ijk_re = ii + jj * lenI_re[0] + kk * lenI_re[0] * lenI_re[1]; mapped_ijk = s0_re + local_ijk_re; ierr = MatSetValue(Pscalar,sr+location,mapped_ijk,1.0,INSERT_VALUES);CHKERRQ(ierr); } } } ierr = MatAssemblyBegin(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); ierr = MatAssemblyEnd(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); ierr = MatCreateMAIJ(Pscalar,ndof,&P);CHKERRQ(ierr); ierr = MatDestroy(&Pscalar);CHKERRQ(ierr); ctx->permutation = P; PetscFunctionReturn(0); } PetscErrorCode PCTelescopeSetUp_dmda_permutation_2d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) { PetscErrorCode ierr; DM dm; MPI_Comm comm; Mat Pscalar,P; PetscInt ndof; PetscInt i,j,location,startI[2],endI[2],lenI[2],nx,ny,nz; PetscInt sr,er,Mr; Vec V; PetscFunctionBegin; ierr = PetscInfo(pc,"PCTelescope: setting up the permutation matrix (DMDA-2D)\n");CHKERRQ(ierr); ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,NULL,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); ierr = DMGetGlobalVector(dm,&V);CHKERRQ(ierr); ierr = VecGetSize(V,&Mr);CHKERRQ(ierr); ierr = VecGetOwnershipRange(V,&sr,&er);CHKERRQ(ierr); ierr = DMRestoreGlobalVector(dm,&V);CHKERRQ(ierr); sr = sr / ndof; er = er / ndof; Mr = Mr / ndof; ierr = MatCreate(comm,&Pscalar);CHKERRQ(ierr); ierr = MatSetSizes(Pscalar,(er-sr),(er-sr),Mr,Mr);CHKERRQ(ierr); ierr = MatSetType(Pscalar,MATAIJ);CHKERRQ(ierr); ierr = MatSeqAIJSetPreallocation(Pscalar,1,NULL);CHKERRQ(ierr); ierr = MatMPIAIJSetPreallocation(Pscalar,1,NULL,1,NULL);CHKERRQ(ierr); ierr = DMDAGetCorners(dm,NULL,NULL,NULL,&lenI[0],&lenI[1],NULL);CHKERRQ(ierr); ierr = DMDAGetCorners(dm,&startI[0],&startI[1],NULL,&endI[0],&endI[1],NULL);CHKERRQ(ierr); endI[0] += startI[0]; endI[1] += startI[1]; for (j=startI[1]; jMp_re,ctx->Np_re,ctx->Pp_re, ctx->start_i_re,ctx->start_j_re,ctx->start_k_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, 
&rank_reI[0],&rank_reI[1],NULL,&rank_ijk_re);CHKERRQ(ierr); ierr = _DMDADetermineGlobalS0(2,rank_ijk_re, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, &s0_re);CHKERRQ(ierr); ii = i - ctx->start_i_re[ rank_reI[0] ]; if (ii < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm2d] index error ii"); jj = j - ctx->start_j_re[ rank_reI[1] ]; if (jj < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm2d] index error jj"); lenI_re[0] = ctx->range_i_re[ rank_reI[0] ]; lenI_re[1] = ctx->range_j_re[ rank_reI[1] ]; local_ijk_re = ii + jj * lenI_re[0]; mapped_ijk = s0_re + local_ijk_re; ierr = MatSetValue(Pscalar,sr+location,mapped_ijk,1.0,INSERT_VALUES);CHKERRQ(ierr); } } ierr = MatAssemblyBegin(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); ierr = MatAssemblyEnd(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); ierr = MatCreateMAIJ(Pscalar,ndof,&P);CHKERRQ(ierr); ierr = MatDestroy(&Pscalar);CHKERRQ(ierr); ctx->permutation = P; PetscFunctionReturn(0); } PetscErrorCode PCTelescopeSetUp_dmda_scatters(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) { PetscErrorCode ierr; Vec xred,yred,xtmp,x,xp; VecScatter scatter; IS isin; Mat B; PetscInt m,bs,st,ed; MPI_Comm comm; PetscFunctionBegin; ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); ierr = MatCreateVecs(B,&x,NULL);CHKERRQ(ierr); ierr = MatGetBlockSize(B,&bs);CHKERRQ(ierr); ierr = VecDuplicate(x,&xp);CHKERRQ(ierr); m = 0; xred = NULL; yred = NULL; if (PCTelescope_isActiveRank(sred)) { ierr = DMCreateGlobalVector(ctx->dmrepart,&xred);CHKERRQ(ierr); ierr = VecDuplicate(xred,&yred);CHKERRQ(ierr); ierr = VecGetOwnershipRange(xred,&st,&ed);CHKERRQ(ierr); ierr = ISCreateStride(comm,ed-st,st,1,&isin);CHKERRQ(ierr); ierr = VecGetLocalSize(xred,&m);CHKERRQ(ierr); } else { ierr = VecGetOwnershipRange(x,&st,&ed);CHKERRQ(ierr); ierr = ISCreateStride(comm,0,st,1,&isin);CHKERRQ(ierr); } ierr = ISSetBlockSize(isin,bs);CHKERRQ(ierr); 
ierr = VecCreate(comm,&xtmp);CHKERRQ(ierr); ierr = VecSetSizes(xtmp,m,PETSC_DECIDE);CHKERRQ(ierr); ierr = VecSetBlockSize(xtmp,bs);CHKERRQ(ierr); ierr = VecSetType(xtmp,((PetscObject)x)->type_name);CHKERRQ(ierr); ierr = VecScatterCreate(x,isin,xtmp,NULL,&scatter);CHKERRQ(ierr); sred->xred = xred; sred->yred = yred; sred->isin = isin; sred->scatter = scatter; sred->xtmp = xtmp; ctx->xp = xp; ierr = VecDestroy(&x);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode PCTelescopeSetUp_dmda(PC pc,PC_Telescope sred) { PC_Telescope_DMDACtx *ctx; PetscInt dim; DM dm; MPI_Comm comm; PetscErrorCode ierr; PetscFunctionBegin; ierr = PetscInfo(pc,"PCTelescope: setup (DMDA)\n");CHKERRQ(ierr); ierr = PetscNew(&ctx);CHKERRQ(ierr); sred->dm_ctx = (void*)ctx; ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,&dim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); PCTelescopeSetUp_dmda_repart(pc,sred,ctx); PCTelescopeSetUp_dmda_repart_coors(pc,sred,ctx); switch (dim) { case 1: SETERRQ(comm,PETSC_ERR_SUP,"Telescope: DMDA (1D) repartitioning not provided"); case 2: ierr = PCTelescopeSetUp_dmda_permutation_2d(pc,sred,ctx);CHKERRQ(ierr); break; case 3: ierr = PCTelescopeSetUp_dmda_permutation_3d(pc,sred,ctx);CHKERRQ(ierr); break; } ierr = PCTelescopeSetUp_dmda_scatters(pc,sred,ctx);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode PCTelescopeMatCreate_dmda_dmactivefalse(PC pc,PC_Telescope sred,MatReuse reuse,Mat *A) { PetscErrorCode ierr; PC_Telescope_DMDACtx *ctx; MPI_Comm comm,subcomm; Mat Bperm,Bred,B,P; PetscInt nr,nc; IS isrow,iscol; Mat Blocal,*_Blocal; PetscFunctionBegin; ierr = PetscInfo(pc,"PCTelescope: updating the redundant preconditioned operator (DMDA)\n");CHKERRQ(ierr); ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); subcomm = PetscSubcommChild(sred->psubcomm); ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); 
ierr = MatGetSize(B,&nr,&nc);CHKERRQ(ierr); P = ctx->permutation; ierr = MatPtAP(B,P,MAT_INITIAL_MATRIX,1.1,&Bperm);CHKERRQ(ierr); /* Get submatrices */ isrow = sred->isin; ierr = ISCreateStride(comm,nc,0,1,&iscol);CHKERRQ(ierr); ierr = MatCreateSubMatrices(Bperm,1,&isrow,&iscol,MAT_INITIAL_MATRIX,&_Blocal);CHKERRQ(ierr); Blocal = *_Blocal; Bred = NULL; if (PCTelescope_isActiveRank(sred)) { PetscInt mm; if (reuse != MAT_INITIAL_MATRIX) {Bred = *A;} ierr = MatGetSize(Blocal,&mm,NULL);CHKERRQ(ierr); /* ierr = MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,PETSC_DECIDE,reuse,&Bred);CHKERRQ(ierr); */ ierr = MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,mm,reuse,&Bred);CHKERRQ(ierr); } *A = Bred; ierr = ISDestroy(&iscol);CHKERRQ(ierr); ierr = MatDestroy(&Bperm);CHKERRQ(ierr); ierr = MatDestroyMatrices(1,&_Blocal);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode PCTelescopeMatCreate_dmda(PC pc,PC_Telescope sred,MatReuse reuse,Mat *A) { PetscErrorCode ierr; DM dm; PetscErrorCode (*dmksp_func)(KSP,Mat,Mat,void*); void *dmksp_ctx; PetscFunctionBegin; ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); ierr = DMKSPGetComputeOperators(dm,&dmksp_func,&dmksp_ctx);CHKERRQ(ierr); /* We assume that dmksp_func = NULL, is equivalent to dmActive = PETSC_FALSE */ if (dmksp_func && !sred->ignore_kspcomputeoperators) { DM dmrepart; Mat Ak; *A = NULL; if (PCTelescope_isActiveRank(sred)) { ierr = KSPGetDM(sred->ksp,&dmrepart);CHKERRQ(ierr); if (reuse == MAT_INITIAL_MATRIX) { ierr = DMCreateMatrix(dmrepart,&Ak);CHKERRQ(ierr); *A = Ak; } else if (reuse == MAT_REUSE_MATRIX) { Ak = *A; } /* There is no need to explicitly assemble the operator now, the sub-KSP will call the method provided to KSPSetComputeOperators() during KSPSetUp() */ } } else { ierr = PCTelescopeMatCreate_dmda_dmactivefalse(pc,sred,reuse,A);CHKERRQ(ierr); } PetscFunctionReturn(0); } PetscErrorCode PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc,PC_Telescope sred,MatNullSpace nullspace,MatNullSpace *sub_nullspace) { 
PetscErrorCode ierr; PetscBool has_const; PetscInt i,k,n = 0; const Vec *vecs; Vec *sub_vecs = NULL; MPI_Comm subcomm; PC_Telescope_DMDACtx *ctx; PetscFunctionBegin; ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; subcomm = PetscSubcommChild(sred->psubcomm); ierr = MatNullSpaceGetVecs(nullspace,&has_const,&n,&vecs);CHKERRQ(ierr); if (PCTelescope_isActiveRank(sred)) { /* create new vectors */ if (n) { ierr = VecDuplicateVecs(sred->xred,n,&sub_vecs);CHKERRQ(ierr); } } /* copy entries */ for (k=0; kpermutation,vecs[k],ctx->xp);CHKERRQ(ierr); /* pull in vector x->xtmp */ ierr = VecScatterBegin(sred->scatter,ctx->xp,sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); ierr = VecScatterEnd(sred->scatter,ctx->xp,sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); /* copy vector entries into xred */ ierr = VecGetArrayRead(sred->xtmp,&x_array);CHKERRQ(ierr); if (sub_vecs) { if (sub_vecs[k]) { ierr = VecGetOwnershipRange(sub_vecs[k],&st,&ed);CHKERRQ(ierr); ierr = VecGetArray(sub_vecs[k],&LA_sub_vec);CHKERRQ(ierr); for (i=0; ixtmp,&x_array);CHKERRQ(ierr); } if (PCTelescope_isActiveRank(sred)) { /* create new (near) nullspace for redundant object */ ierr = MatNullSpaceCreate(subcomm,has_const,n,sub_vecs,sub_nullspace);CHKERRQ(ierr); ierr = VecDestroyVecs(n,&sub_vecs);CHKERRQ(ierr); if (nullspace->remove) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope"); if (nullspace->rmctx) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope"); } PetscFunctionReturn(0); } PetscErrorCode PCTelescopeMatNullSpaceCreate_dmda(PC pc,PC_Telescope sred,Mat sub_mat) { PetscErrorCode ierr; Mat B; PetscFunctionBegin; ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); { MatNullSpace nullspace,sub_nullspace; ierr = MatGetNullSpace(B,&nullspace);CHKERRQ(ierr); if (nullspace) { 
ierr = PetscInfo(pc,"PCTelescope: generating nullspace (DMDA)\n");CHKERRQ(ierr); ierr = PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc,sred,nullspace,&sub_nullspace);CHKERRQ(ierr); if (PCTelescope_isActiveRank(sred)) { ierr = MatSetNullSpace(sub_mat,sub_nullspace);CHKERRQ(ierr); ierr = MatNullSpaceDestroy(&sub_nullspace);CHKERRQ(ierr); } } } { MatNullSpace nearnullspace,sub_nearnullspace; ierr = MatGetNearNullSpace(B,&nearnullspace);CHKERRQ(ierr); if (nearnullspace) { ierr = PetscInfo(pc,"PCTelescope: generating near nullspace (DMDA)\n");CHKERRQ(ierr); ierr = PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc,sred,nearnullspace,&sub_nearnullspace);CHKERRQ(ierr); if (PCTelescope_isActiveRank(sred)) { ierr = MatSetNearNullSpace(sub_mat,sub_nearnullspace);CHKERRQ(ierr); ierr = MatNullSpaceDestroy(&sub_nearnullspace);CHKERRQ(ierr); } } } PetscFunctionReturn(0); } PetscErrorCode PCApply_Telescope_dmda(PC pc,Vec x,Vec y) { PC_Telescope sred = (PC_Telescope)pc->data; PetscErrorCode ierr; Mat perm; Vec xtmp,xp,xred,yred; PetscInt i,st,ed; VecScatter scatter; PetscScalar *array; const PetscScalar *x_array; PC_Telescope_DMDACtx *ctx; ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; xtmp = sred->xtmp; scatter = sred->scatter; xred = sred->xred; yred = sred->yred; perm = ctx->permutation; xp = ctx->xp; PetscFunctionBegin; ierr = PetscCitationsRegister(citation,&cited);CHKERRQ(ierr); /* permute vector into ordering associated with re-partitioned dmda */ ierr = MatMultTranspose(perm,x,xp);CHKERRQ(ierr); /* pull in vector x->xtmp */ ierr = VecScatterBegin(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); ierr = VecScatterEnd(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); /* copy vector entries into xred */ ierr = VecGetArrayRead(xtmp,&x_array);CHKERRQ(ierr); if (xred) { PetscScalar *LA_xred; ierr = VecGetOwnershipRange(xred,&st,&ed);CHKERRQ(ierr); ierr = VecGetArray(xred,&LA_xred);CHKERRQ(ierr); for (i=0; iksp,xred,yred);CHKERRQ(ierr); ierr = 
KSPCheckSolve(sred->ksp,pc,yred);CHKERRQ(ierr); } /* return vector */ ierr = VecGetArray(xtmp,&array);CHKERRQ(ierr); if (yred) { const PetscScalar *LA_yred; ierr = VecGetOwnershipRange(yred,&st,&ed);CHKERRQ(ierr); ierr = VecGetArrayRead(yred,&LA_yred);CHKERRQ(ierr); for (i=0; idata; PetscErrorCode ierr; Mat perm; Vec xtmp,xp,yred; PetscInt i,st,ed; VecScatter scatter; const PetscScalar *x_array; PetscBool default_init_guess_value = PETSC_FALSE; PC_Telescope_DMDACtx *ctx; PetscFunctionBegin; ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; xtmp = sred->xtmp; scatter = sred->scatter; yred = sred->yred; perm = ctx->permutation; xp = ctx->xp; if (its > 1) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"PCApplyRichardson_Telescope_dmda only supports max_it = 1"); *reason = (PCRichardsonConvergedReason)0; if (!zeroguess) { ierr = PetscInfo(pc,"PCTelescopeDMDA: Scattering y for non-zero-initial guess\n");CHKERRQ(ierr); /* permute vector into ordering associated with re-partitioned dmda */ ierr = MatMultTranspose(perm,y,xp);CHKERRQ(ierr); /* pull in vector x->xtmp */ ierr = VecScatterBegin(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); ierr = VecScatterEnd(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); /* copy vector entries into xred */ ierr = VecGetArrayRead(xtmp,&x_array);CHKERRQ(ierr); if (yred) { PetscScalar *LA_yred; ierr = VecGetOwnershipRange(yred,&st,&ed);CHKERRQ(ierr); ierr = VecGetArray(yred,&LA_yred);CHKERRQ(ierr); for (i=0; iksp,&default_init_guess_value);CHKERRQ(ierr); if (!zeroguess) {ierr = KSPSetInitialGuessNonzero(sred->ksp,PETSC_TRUE);CHKERRQ(ierr);} } ierr = PCApply_Telescope_dmda(pc,x,y);CHKERRQ(ierr); if (PCTelescope_isActiveRank(sred)) { ierr = KSPSetInitialGuessNonzero(sred->ksp,default_init_guess_value);CHKERRQ(ierr); } if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS; *outits = 1; PetscFunctionReturn(0); } PetscErrorCode PCReset_Telescope_dmda(PC pc) { PetscErrorCode ierr; PC_Telescope sred = 
(PC_Telescope)pc->data; PC_Telescope_DMDACtx *ctx; PetscFunctionBegin; ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; ierr = VecDestroy(&ctx->xp);CHKERRQ(ierr); ierr = MatDestroy(&ctx->permutation);CHKERRQ(ierr); ierr = DMDestroy(&ctx->dmrepart);CHKERRQ(ierr); ierr = PetscFree3(ctx->range_i_re,ctx->range_j_re,ctx->range_k_re);CHKERRQ(ierr); ierr = PetscFree3(ctx->start_i_re,ctx->start_j_re,ctx->start_k_re);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode DMView_DA_Short_3d(DM dm,PetscViewer v) { PetscInt M,N,P,m,n,p,ndof,nsw; MPI_Comm comm; PetscMPIInt size; const char* prefix; PetscErrorCode ierr; PetscFunctionBegin; ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr); ierr = MPI_Comm_size(comm,&size);CHKERRMPI(ierr); ierr = DMGetOptionsPrefix(dm,&prefix);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,NULL,&M,&N,&P,&m,&n,&p,&ndof,&nsw,NULL,NULL,NULL,NULL);CHKERRQ(ierr); if (prefix) {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: (%s) %d MPI processes\n",prefix,size);CHKERRQ(ierr);} else {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: %d MPI processes\n",size);CHKERRQ(ierr);} ierr = PetscViewerASCIIPrintf(v," M %D N %D P %D m %D n %D p %D dof %D overlap %D\n",M,N,P,m,n,p,ndof,nsw);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode DMView_DA_Short_2d(DM dm,PetscViewer v) { PetscInt M,N,m,n,ndof,nsw; MPI_Comm comm; PetscMPIInt size; const char* prefix; PetscErrorCode ierr; PetscFunctionBegin; ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr); ierr = MPI_Comm_size(comm,&size);CHKERRMPI(ierr); ierr = DMGetOptionsPrefix(dm,&prefix);CHKERRQ(ierr); ierr = DMDAGetInfo(dm,NULL,&M,&N,NULL,&m,&n,NULL,&ndof,&nsw,NULL,NULL,NULL,NULL);CHKERRQ(ierr); if (prefix) {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: (%s) %d MPI processes\n",prefix,size);CHKERRQ(ierr);} else {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: %d MPI processes\n",size);CHKERRQ(ierr);} ierr = PetscViewerASCIIPrintf(v," M %D N %D m %D n %D dof %D overlap %D\n",M,N,m,n,ndof,nsw);CHKERRQ(ierr); 
PetscFunctionReturn(0);
}

/*
  DMView_DA_Short - Prints the short DMDA summary by dispatching on the DM's
  dimension: 2 -> DMView_DA_Short_2d(), 3 -> DMView_DA_Short_3d().
  Any other dimension prints nothing and returns success.
*/
PetscErrorCode DMView_DA_Short(DM dm,PetscViewer v)
{
  PetscInt       ndim;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = DMDAGetInfo(dm,&ndim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr);
  if (ndim == 2) {
    ierr = DMView_DA_Short_2d(dm,v);CHKERRQ(ierr);
  } else if (ndim == 3) {
    ierr = DMView_DA_Short_3d(dm,v);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}