147c6ae99SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h> /*I "petscdmda.h" I*/ 307475bc1SBarry Smith #include <petscmat.h> 447c6ae99SBarry Smith 5e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*); 6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*); 7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*); 8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*); 947c6ae99SBarry Smith 1047c6ae99SBarry Smith /* 1147c6ae99SBarry Smith For ghost i that may be negative or greater than the upper bound this 1247c6ae99SBarry Smith maps it into the 0:m-1 range using periodicity 1347c6ae99SBarry Smith */ 1447c6ae99SBarry Smith #define SetInRange(i,m) ((i < 0) ? m+i : ((i >= m) ? i-m : i)) 1547c6ae99SBarry Smith 1647c6ae99SBarry Smith #undef __FUNCT__ 17aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills_Private" 18ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill) 1947c6ae99SBarry Smith { 2047c6ae99SBarry Smith PetscErrorCode ierr; 2147c6ae99SBarry Smith PetscInt i,j,nz,*fill; 2247c6ae99SBarry Smith 2347c6ae99SBarry Smith PetscFunctionBegin; 2447c6ae99SBarry Smith if (!dfill) PetscFunctionReturn(0); 2547c6ae99SBarry Smith 2647c6ae99SBarry Smith /* count number nonzeros */ 2747c6ae99SBarry Smith nz = 0; 2847c6ae99SBarry Smith for (i=0; i<w; i++) { 2947c6ae99SBarry Smith for (j=0; j<w; j++) { 3047c6ae99SBarry Smith if (dfill[w*i+j]) nz++; 3147c6ae99SBarry Smith } 3247c6ae99SBarry Smith } 33854ce69bSBarry Smith ierr = PetscMalloc1(nz + w + 1,&fill);CHKERRQ(ierr); 3447c6ae99SBarry Smith /* construct modified CSR storage of nonzero structure */ 35ce308e1dSBarry Smith /* fill[0 -- w] marks starts of each row of column indices (and end of last row) 36ce308e1dSBarry Smith so fill[1] - 
fill[0] gives number of nonzeros in first row etc */ 3747c6ae99SBarry Smith nz = w + 1; 3847c6ae99SBarry Smith for (i=0; i<w; i++) { 3947c6ae99SBarry Smith fill[i] = nz; 4047c6ae99SBarry Smith for (j=0; j<w; j++) { 4147c6ae99SBarry Smith if (dfill[w*i+j]) { 4247c6ae99SBarry Smith fill[nz] = j; 4347c6ae99SBarry Smith nz++; 4447c6ae99SBarry Smith } 4547c6ae99SBarry Smith } 4647c6ae99SBarry Smith } 4747c6ae99SBarry Smith fill[w] = nz; 4847c6ae99SBarry Smith 4947c6ae99SBarry Smith *rfill = fill; 5047c6ae99SBarry Smith PetscFunctionReturn(0); 5147c6ae99SBarry Smith } 5247c6ae99SBarry Smith 5347c6ae99SBarry Smith #undef __FUNCT__ 54aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills" 5547c6ae99SBarry Smith /*@ 56aa219208SBarry Smith DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem 57950540a4SJed Brown of the matrix returned by DMCreateMatrix(). 5847c6ae99SBarry Smith 59aa219208SBarry Smith Logically Collective on DMDA 6047c6ae99SBarry Smith 6147c6ae99SBarry Smith Input Parameter: 6247c6ae99SBarry Smith + da - the distributed array 630298fd71SBarry Smith . dfill - the fill pattern in the diagonal block (may be NULL, means use dense block) 6447c6ae99SBarry Smith - ofill - the fill pattern in the off-diagonal blocks 6547c6ae99SBarry Smith 6647c6ae99SBarry Smith 6747c6ae99SBarry Smith Level: developer 6847c6ae99SBarry Smith 6947c6ae99SBarry Smith Notes: This only makes sense when you are doing multicomponent problems but using the 7047c6ae99SBarry Smith MPIAIJ matrix format 7147c6ae99SBarry Smith 7247c6ae99SBarry Smith The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries 7347c6ae99SBarry Smith representing coupling and 0 entries for missing coupling. 
For example 7447c6ae99SBarry Smith $ dfill[9] = {1, 0, 0, 7547c6ae99SBarry Smith $ 1, 1, 0, 7647c6ae99SBarry Smith $ 0, 1, 1} 7747c6ae99SBarry Smith means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with 7847c6ae99SBarry Smith itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the 7947c6ae99SBarry Smith diagonal block). 8047c6ae99SBarry Smith 81aa219208SBarry Smith DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then 8247c6ae99SBarry Smith can be represented in the dfill, ofill format 8347c6ae99SBarry Smith 8447c6ae99SBarry Smith Contributed by Glenn Hammond 8547c6ae99SBarry Smith 868ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly() 8747c6ae99SBarry Smith 8847c6ae99SBarry Smith @*/ 89ce308e1dSBarry Smith PetscErrorCode DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill) 9047c6ae99SBarry Smith { 9147c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 9247c6ae99SBarry Smith PetscErrorCode ierr; 93ae4f298aSBarry Smith PetscInt i,k,cnt = 1; 9447c6ae99SBarry Smith 9547c6ae99SBarry Smith PetscFunctionBegin; 96aa219208SBarry Smith ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr); 97aa219208SBarry Smith ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr); 98ae4f298aSBarry Smith 99ae4f298aSBarry Smith /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of 100ae4f298aSBarry Smith columns to the left with any nonzeros in them plus 1 */ 1011795a4d1SJed Brown ierr = PetscCalloc1(dd->w,&dd->ofillcols);CHKERRQ(ierr); 102ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 103ae4f298aSBarry Smith for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1; 104ae4f298aSBarry Smith } 105ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 106ae4f298aSBarry Smith if (dd->ofillcols[i]) { 
107ae4f298aSBarry Smith dd->ofillcols[i] = cnt++; 108ae4f298aSBarry Smith } 109ae4f298aSBarry Smith } 11047c6ae99SBarry Smith PetscFunctionReturn(0); 11147c6ae99SBarry Smith } 11247c6ae99SBarry Smith 11347c6ae99SBarry Smith 11447c6ae99SBarry Smith #undef __FUNCT__ 115e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA" 116b412c318SBarry Smith PetscErrorCode DMCreateColoring_DA(DM da,ISColoringType ctype,ISColoring *coloring) 11747c6ae99SBarry Smith { 11847c6ae99SBarry Smith PetscErrorCode ierr; 11947c6ae99SBarry Smith PetscInt dim,m,n,p,nc; 120bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 12147c6ae99SBarry Smith MPI_Comm comm; 12247c6ae99SBarry Smith PetscMPIInt size; 12347c6ae99SBarry Smith PetscBool isBAIJ; 12447c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 12547c6ae99SBarry Smith 12647c6ae99SBarry Smith PetscFunctionBegin; 12747c6ae99SBarry Smith /* 12847c6ae99SBarry Smith m 12947c6ae99SBarry Smith ------------------------------------------------------ 13047c6ae99SBarry Smith | | 13147c6ae99SBarry Smith | | 13247c6ae99SBarry Smith | ---------------------- | 13347c6ae99SBarry Smith | | | | 13447c6ae99SBarry Smith n | yn | | | 13547c6ae99SBarry Smith | | | | 13647c6ae99SBarry Smith | .--------------------- | 13747c6ae99SBarry Smith | (xs,ys) xn | 13847c6ae99SBarry Smith | . 
| 13947c6ae99SBarry Smith | (gxs,gys) | 14047c6ae99SBarry Smith | | 14147c6ae99SBarry Smith ----------------------------------------------------- 14247c6ae99SBarry Smith */ 14347c6ae99SBarry Smith 14447c6ae99SBarry Smith /* 14547c6ae99SBarry Smith nc - number of components per grid point 14647c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 14747c6ae99SBarry Smith 14847c6ae99SBarry Smith */ 1491321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr); 15047c6ae99SBarry Smith 15147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 15247c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1535bdb020cSBarry Smith if (ctype == IS_COLORING_LOCAL) { 15447c6ae99SBarry Smith if (size == 1) { 15547c6ae99SBarry Smith ctype = IS_COLORING_GLOBAL; 15647c6ae99SBarry Smith } else if (dim > 1) { 157bff4a2f0SMatthew G. Knepley if ((m==1 && bx == DM_BOUNDARY_PERIODIC) || (n==1 && by == DM_BOUNDARY_PERIODIC) || (p==1 && bz == DM_BOUNDARY_PERIODIC)) { 1585bdb020cSBarry Smith SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_LOCAL cannot be used for periodic boundary condition having both ends of the domain on the same process"); 15947c6ae99SBarry Smith } 16047c6ae99SBarry Smith } 16147c6ae99SBarry Smith } 16247c6ae99SBarry Smith 163aa219208SBarry Smith /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ 16447c6ae99SBarry Smith matrices is for the blocks, not the individual matrix elements */ 165b412c318SBarry Smith ierr = PetscStrcmp(da->mattype,MATBAIJ,&isBAIJ);CHKERRQ(ierr); 166b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);} 167b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);} 16847c6ae99SBarry Smith if (isBAIJ) { 16947c6ae99SBarry Smith dd->w = 1; 17047c6ae99SBarry Smith dd->xs = dd->xs/nc; 
17147c6ae99SBarry Smith dd->xe = dd->xe/nc; 17247c6ae99SBarry Smith dd->Xs = dd->Xs/nc; 17347c6ae99SBarry Smith dd->Xe = dd->Xe/nc; 17447c6ae99SBarry Smith } 17547c6ae99SBarry Smith 17647c6ae99SBarry Smith /* 177aa219208SBarry Smith We do not provide a getcoloring function in the DMDA operations because 178aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 17947c6ae99SBarry Smith more low-level then matrices. 18047c6ae99SBarry Smith */ 18147c6ae99SBarry Smith if (dim == 1) { 182e727c939SJed Brown ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 18347c6ae99SBarry Smith } else if (dim == 2) { 184e727c939SJed Brown ierr = DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 18547c6ae99SBarry Smith } else if (dim == 3) { 186e727c939SJed Brown ierr = DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 187ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim); 18847c6ae99SBarry Smith if (isBAIJ) { 18947c6ae99SBarry Smith dd->w = nc; 19047c6ae99SBarry Smith dd->xs = dd->xs*nc; 19147c6ae99SBarry Smith dd->xe = dd->xe*nc; 19247c6ae99SBarry Smith dd->Xs = dd->Xs*nc; 19347c6ae99SBarry Smith dd->Xe = dd->Xe*nc; 19447c6ae99SBarry Smith } 19547c6ae99SBarry Smith PetscFunctionReturn(0); 19647c6ae99SBarry Smith } 19747c6ae99SBarry Smith 19847c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 19947c6ae99SBarry Smith 20047c6ae99SBarry Smith #undef __FUNCT__ 201e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_2d_MPIAIJ" 202e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 20347c6ae99SBarry Smith { 20447c6ae99SBarry Smith PetscErrorCode ierr; 20547c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col; 20647c6ae99SBarry Smith 
PetscInt ncolors; 20747c6ae99SBarry Smith MPI_Comm comm; 208bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by; 209aa219208SBarry Smith DMDAStencilType st; 21047c6ae99SBarry Smith ISColoringValue *colors; 21147c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 21247c6ae99SBarry Smith 21347c6ae99SBarry Smith PetscFunctionBegin; 21447c6ae99SBarry Smith /* 21547c6ae99SBarry Smith nc - number of components per grid point 21647c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 21747c6ae99SBarry Smith 21847c6ae99SBarry Smith */ 2191321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 22047c6ae99SBarry Smith col = 2*s + 1; 221aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 222aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 22347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 22447c6ae99SBarry Smith 22547c6ae99SBarry Smith /* special case as taught to us by Paul Hovland */ 226aa219208SBarry Smith if (st == DMDA_STENCIL_STAR && s == 1) { 227e727c939SJed Brown ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 22847c6ae99SBarry Smith } else { 22947c6ae99SBarry Smith 230bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\ 23147c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", m, col); 232bff4a2f0SMatthew G. 
Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\ 23347c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", n, col); 23447c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 23547c6ae99SBarry Smith if (!dd->localcoloring) { 236785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 23747c6ae99SBarry Smith ii = 0; 23847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 23947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 24047c6ae99SBarry Smith for (k=0; k<nc; k++) { 24147c6ae99SBarry Smith colors[ii++] = k + nc*((i % col) + col*(j % col)); 24247c6ae99SBarry Smith } 24347c6ae99SBarry Smith } 24447c6ae99SBarry Smith } 24547c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)); 246aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 24747c6ae99SBarry Smith } 24847c6ae99SBarry Smith *coloring = dd->localcoloring; 2495bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 25047c6ae99SBarry Smith if (!dd->ghostedcoloring) { 251785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 25247c6ae99SBarry Smith ii = 0; 25347c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 25447c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 25547c6ae99SBarry Smith for (k=0; k<nc; k++) { 25647c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 25747c6ae99SBarry Smith colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col)); 25847c6ae99SBarry Smith } 25947c6ae99SBarry Smith } 26047c6ae99SBarry Smith } 26147c6ae99SBarry Smith ncolors = nc + nc*(col - 1 + col*(col-1)); 262aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 26347c6ae99SBarry Smith /* PetscIntView(ncolors,(PetscInt*)colors,0); */ 26447c6ae99SBarry Smith 2655bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 26647c6ae99SBarry Smith } 26747c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 268ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 26947c6ae99SBarry Smith } 27047c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 27147c6ae99SBarry Smith PetscFunctionReturn(0); 27247c6ae99SBarry Smith } 27347c6ae99SBarry Smith 27447c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 27547c6ae99SBarry Smith 27647c6ae99SBarry Smith #undef __FUNCT__ 277e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_3d_MPIAIJ" 278e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 27947c6ae99SBarry Smith { 28047c6ae99SBarry Smith PetscErrorCode ierr; 28147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P; 28247c6ae99SBarry Smith PetscInt ncolors; 28347c6ae99SBarry Smith MPI_Comm comm; 284bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 285aa219208SBarry Smith DMDAStencilType st; 28647c6ae99SBarry Smith ISColoringValue *colors; 28747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 28847c6ae99SBarry Smith 28947c6ae99SBarry Smith PetscFunctionBegin; 29047c6ae99SBarry Smith /* 29147c6ae99SBarry Smith nc - number of components per grid point 29247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 29347c6ae99SBarry Smith 29447c6ae99SBarry Smith */ 2951321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 29647c6ae99SBarry Smith col = 2*s + 1; 297bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 29847c6ae99SBarry Smith by 2*stencil_width + 1\n"); 299bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 30047c6ae99SBarry Smith by 2*stencil_width + 1\n"); 301bff4a2f0SMatthew G. 
Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 30247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 30347c6ae99SBarry Smith 304aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 305aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 30647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 30747c6ae99SBarry Smith 30847c6ae99SBarry Smith /* create the coloring */ 30947c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 31047c6ae99SBarry Smith if (!dd->localcoloring) { 311785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny*nz,&colors);CHKERRQ(ierr); 31247c6ae99SBarry Smith ii = 0; 31347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 31447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 31547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 31647c6ae99SBarry Smith for (l=0; l<nc; l++) { 31747c6ae99SBarry Smith colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col)); 31847c6ae99SBarry Smith } 31947c6ae99SBarry Smith } 32047c6ae99SBarry Smith } 32147c6ae99SBarry Smith } 32247c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 323aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 32447c6ae99SBarry Smith } 32547c6ae99SBarry Smith *coloring = dd->localcoloring; 3265bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 32747c6ae99SBarry Smith if (!dd->ghostedcoloring) { 328785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny*gnz,&colors);CHKERRQ(ierr); 32947c6ae99SBarry Smith ii = 0; 33047c6ae99SBarry Smith for (k=gzs; k<gzs+gnz; k++) { 33147c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 33247c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 33347c6ae99SBarry Smith for (l=0; l<nc; l++) { 33447c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 33547c6ae99SBarry Smith colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col)); 33647c6ae99SBarry Smith } 33747c6ae99SBarry Smith } 33847c6ae99SBarry Smith } 33947c6ae99SBarry Smith } 34047c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 341aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 3425bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 34347c6ae99SBarry Smith } 34447c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 345ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 34647c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 34747c6ae99SBarry Smith PetscFunctionReturn(0); 34847c6ae99SBarry Smith } 34947c6ae99SBarry Smith 35047c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 35147c6ae99SBarry Smith 35247c6ae99SBarry Smith #undef __FUNCT__ 353e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_1d_MPIAIJ" 354e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 35547c6ae99SBarry Smith { 35647c6ae99SBarry Smith PetscErrorCode ierr; 35747c6ae99SBarry Smith PetscInt xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col; 35847c6ae99SBarry Smith PetscInt ncolors; 35947c6ae99SBarry Smith MPI_Comm comm; 360bff4a2f0SMatthew G. Knepley DMBoundaryType bx; 36147c6ae99SBarry Smith ISColoringValue *colors; 36247c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 36347c6ae99SBarry Smith 36447c6ae99SBarry Smith PetscFunctionBegin; 36547c6ae99SBarry Smith /* 36647c6ae99SBarry Smith nc - number of components per grid point 36747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 36847c6ae99SBarry Smith 36947c6ae99SBarry Smith */ 3701321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 37147c6ae99SBarry Smith col = 2*s + 1; 37247c6ae99SBarry Smith 373bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\ 37431e6f798SBarry Smith by 2*stencil_width + 1 %d\n",(int)m,(int)col); 37547c6ae99SBarry Smith 376aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 377aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 37847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 37947c6ae99SBarry Smith 38047c6ae99SBarry Smith /* create the coloring */ 38147c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 38247c6ae99SBarry Smith if (!dd->localcoloring) { 383785e854fSJed Brown ierr = PetscMalloc1(nc*nx,&colors);CHKERRQ(ierr); 384ae4f298aSBarry Smith if (dd->ofillcols) { 385ae4f298aSBarry Smith PetscInt tc = 0; 386ae4f298aSBarry Smith for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0); 387ae4f298aSBarry Smith i1 = 0; 388ae4f298aSBarry Smith for (i=xs; i<xs+nx; i++) { 389ae4f298aSBarry Smith for (l=0; l<nc; l++) { 390ae4f298aSBarry Smith if (dd->ofillcols[l] && (i % col)) { 391ae4f298aSBarry Smith colors[i1++] = nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l]; 392ae4f298aSBarry Smith } else { 393ae4f298aSBarry Smith colors[i1++] = l; 394ae4f298aSBarry Smith } 395ae4f298aSBarry Smith } 396ae4f298aSBarry Smith } 397ae4f298aSBarry Smith ncolors = nc + 2*s*tc; 398ae4f298aSBarry Smith } else { 39947c6ae99SBarry Smith i1 = 0; 40047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 40147c6ae99SBarry Smith for (l=0; l<nc; l++) { 40247c6ae99SBarry Smith colors[i1++] = l + nc*(i % col); 40347c6ae99SBarry Smith } 40447c6ae99SBarry Smith } 40547c6ae99SBarry Smith ncolors = nc + nc*(col-1); 406ae4f298aSBarry Smith } 407aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 40847c6ae99SBarry Smith } 40947c6ae99SBarry Smith *coloring = dd->localcoloring; 4105bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 41147c6ae99SBarry Smith if (!dd->ghostedcoloring) { 412785e854fSJed Brown ierr = PetscMalloc1(nc*gnx,&colors);CHKERRQ(ierr); 41347c6ae99SBarry Smith i1 = 0; 41447c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 41547c6ae99SBarry Smith for (l=0; l<nc; l++) { 41647c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 41747c6ae99SBarry Smith colors[i1++] = l + nc*(SetInRange(i,m) % col); 41847c6ae99SBarry Smith } 41947c6ae99SBarry Smith } 42047c6ae99SBarry Smith ncolors = nc + nc*(col-1); 421aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4225bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 42347c6ae99SBarry Smith } 42447c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 425ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 42647c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 42747c6ae99SBarry Smith PetscFunctionReturn(0); 42847c6ae99SBarry Smith } 42947c6ae99SBarry Smith 43047c6ae99SBarry Smith #undef __FUNCT__ 431e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_2d_5pt_MPIAIJ" 432e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 43347c6ae99SBarry Smith { 43447c6ae99SBarry Smith PetscErrorCode ierr; 43547c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc; 43647c6ae99SBarry Smith PetscInt ncolors; 43747c6ae99SBarry Smith MPI_Comm comm; 438bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 43947c6ae99SBarry Smith ISColoringValue *colors; 44047c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 44147c6ae99SBarry Smith 44247c6ae99SBarry Smith PetscFunctionBegin; 44347c6ae99SBarry Smith /* 44447c6ae99SBarry Smith nc - number of components per grid point 44547c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 44647c6ae99SBarry Smith 44747c6ae99SBarry Smith */ 4481321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr); 449aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 450aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 45147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 45247c6ae99SBarry Smith 453bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n"); 454bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n"); 45547c6ae99SBarry Smith 45647c6ae99SBarry Smith /* create the coloring */ 45747c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 45847c6ae99SBarry Smith if (!dd->localcoloring) { 459785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 46047c6ae99SBarry Smith ii = 0; 46147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 46247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 46347c6ae99SBarry Smith for (k=0; k<nc; k++) { 46447c6ae99SBarry Smith colors[ii++] = k + nc*((3*j+i) % 5); 46547c6ae99SBarry Smith } 46647c6ae99SBarry Smith } 46747c6ae99SBarry Smith } 46847c6ae99SBarry Smith ncolors = 5*nc; 469aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 47047c6ae99SBarry Smith } 47147c6ae99SBarry Smith *coloring = dd->localcoloring; 4725bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 47347c6ae99SBarry Smith if (!dd->ghostedcoloring) { 474785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 47547c6ae99SBarry Smith ii = 0; 47647c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 47747c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 47847c6ae99SBarry Smith for (k=0; k<nc; k++) { 47947c6ae99SBarry Smith colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5); 48047c6ae99SBarry Smith } 48147c6ae99SBarry Smith } 48247c6ae99SBarry Smith } 48347c6ae99SBarry Smith ncolors = 5*nc; 484aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4855bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 48647c6ae99SBarry Smith } 48747c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 488ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 48947c6ae99SBarry Smith PetscFunctionReturn(0); 49047c6ae99SBarry Smith } 49147c6ae99SBarry Smith 49247c6ae99SBarry Smith /* =========================================================================== */ 493950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat); 494ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat); 495950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat); 496950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat); 497950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat); 498950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat); 499950540a4SJed Brown extern PetscErrorCode 
DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat); 500950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat); 501950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat); 502950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat); 50347c6ae99SBarry Smith 50447c6ae99SBarry Smith #undef __FUNCT__ 505c688c046SMatthew G Knepley #define __FUNCT__ "MatSetupDM" 5068bbdbebaSMatthew G Knepley /*@C 507c688c046SMatthew G Knepley MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix 50847c6ae99SBarry Smith 50947c6ae99SBarry Smith Logically Collective on Mat 51047c6ae99SBarry Smith 51147c6ae99SBarry Smith Input Parameters: 51247c6ae99SBarry Smith + mat - the matrix 51347c6ae99SBarry Smith - da - the da 51447c6ae99SBarry Smith 51547c6ae99SBarry Smith Level: intermediate 51647c6ae99SBarry Smith 51747c6ae99SBarry Smith @*/ 518c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da) 51947c6ae99SBarry Smith { 52047c6ae99SBarry Smith PetscErrorCode ierr; 52147c6ae99SBarry Smith 52247c6ae99SBarry Smith PetscFunctionBegin; 52347c6ae99SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 52447c6ae99SBarry Smith PetscValidHeaderSpecific(da,DM_CLASSID,1); 525c688c046SMatthew G Knepley ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr); 52647c6ae99SBarry Smith PetscFunctionReturn(0); 52747c6ae99SBarry Smith } 52847c6ae99SBarry Smith 52947c6ae99SBarry Smith #undef __FUNCT__ 53047c6ae99SBarry Smith #define __FUNCT__ "MatView_MPI_DA" 5317087cfbeSBarry Smith PetscErrorCode MatView_MPI_DA(Mat A,PetscViewer viewer) 53247c6ae99SBarry Smith { 5339a42bb27SBarry Smith DM da; 53447c6ae99SBarry Smith PetscErrorCode ierr; 53547c6ae99SBarry Smith const char *prefix; 53647c6ae99SBarry Smith Mat Anatural; 53747c6ae99SBarry Smith AO ao; 53847c6ae99SBarry Smith PetscInt rstart,rend,*petsc,i; 53947c6ae99SBarry Smith IS is; 54047c6ae99SBarry Smith MPI_Comm comm; 54174388724SJed Brown 
PetscViewerFormat format; 54247c6ae99SBarry Smith 54347c6ae99SBarry Smith PetscFunctionBegin; 54474388724SJed Brown /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */ 54574388724SJed Brown ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 54674388724SJed Brown if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 54774388724SJed Brown 54847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 549c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 550ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 55147c6ae99SBarry Smith 552aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 55347c6ae99SBarry Smith ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 554854ce69bSBarry Smith ierr = PetscMalloc1(rend-rstart,&petsc);CHKERRQ(ierr); 55547c6ae99SBarry Smith for (i=rstart; i<rend; i++) petsc[i-rstart] = i; 55647c6ae99SBarry Smith ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr); 55747c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 55847c6ae99SBarry Smith 55947c6ae99SBarry Smith /* call viewer on natural ordering */ 56047c6ae99SBarry Smith ierr = MatGetSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr); 561fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 56247c6ae99SBarry Smith ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr); 56347c6ae99SBarry Smith ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr); 56447c6ae99SBarry Smith ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr); 565539c167fSBarry Smith ierr = MatView(Anatural,viewer);CHKERRQ(ierr); 566fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 56747c6ae99SBarry Smith 
PetscFunctionReturn(0); 56847c6ae99SBarry Smith } 56947c6ae99SBarry Smith 57047c6ae99SBarry Smith #undef __FUNCT__ 57147c6ae99SBarry Smith #define __FUNCT__ "MatLoad_MPI_DA" 5727087cfbeSBarry Smith PetscErrorCode MatLoad_MPI_DA(Mat A,PetscViewer viewer) 57347c6ae99SBarry Smith { 5749a42bb27SBarry Smith DM da; 57547c6ae99SBarry Smith PetscErrorCode ierr; 57647c6ae99SBarry Smith Mat Anatural,Aapp; 57747c6ae99SBarry Smith AO ao; 578539c167fSBarry Smith PetscInt rstart,rend,*app,i,m,n,M,N; 57947c6ae99SBarry Smith IS is; 58047c6ae99SBarry Smith MPI_Comm comm; 58147c6ae99SBarry Smith 58247c6ae99SBarry Smith PetscFunctionBegin; 58347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 584c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 585ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 58647c6ae99SBarry Smith 58747c6ae99SBarry Smith /* Load the matrix in natural ordering */ 588ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr); 58947c6ae99SBarry Smith ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr); 590539c167fSBarry Smith ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr); 591539c167fSBarry Smith ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr); 592539c167fSBarry Smith ierr = MatSetSizes(Anatural,m,n,M,N);CHKERRQ(ierr); 59347c6ae99SBarry Smith ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr); 59447c6ae99SBarry Smith 59547c6ae99SBarry Smith /* Map natural ordering to application ordering and create IS */ 596aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 59747c6ae99SBarry Smith ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr); 598854ce69bSBarry Smith ierr = PetscMalloc1(rend-rstart,&app);CHKERRQ(ierr); 59947c6ae99SBarry Smith for (i=rstart; i<rend; i++) app[i-rstart] = i; 60047c6ae99SBarry Smith ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr); 
60147c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 60247c6ae99SBarry Smith 60347c6ae99SBarry Smith /* Do permutation and replace header */ 60447c6ae99SBarry Smith ierr = MatGetSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr); 60528be2f97SBarry Smith ierr = MatHeaderReplace(A,&Aapp);CHKERRQ(ierr); 606fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 607fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 60847c6ae99SBarry Smith PetscFunctionReturn(0); 60947c6ae99SBarry Smith } 61047c6ae99SBarry Smith 61147c6ae99SBarry Smith #undef __FUNCT__ 612950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA" 613b412c318SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, Mat *J) 61447c6ae99SBarry Smith { 61547c6ae99SBarry Smith PetscErrorCode ierr; 61647c6ae99SBarry Smith PetscInt dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P; 61747c6ae99SBarry Smith Mat A; 61847c6ae99SBarry Smith MPI_Comm comm; 61919fd82e9SBarry Smith MatType Atype; 62037d0c07bSMatthew G Knepley PetscSection section, sectionGlobal; 6210298fd71SBarry Smith void (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL; 622b412c318SBarry Smith MatType mtype; 62347c6ae99SBarry Smith PetscMPIInt size; 62447c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 62547c6ae99SBarry Smith 62647c6ae99SBarry Smith PetscFunctionBegin; 627607a6623SBarry Smith ierr = MatInitializePackage();CHKERRQ(ierr); 628b412c318SBarry Smith mtype = da->mattype; 62947c6ae99SBarry Smith 63037d0c07bSMatthew G Knepley ierr = DMGetDefaultSection(da, §ion);CHKERRQ(ierr); 63137d0c07bSMatthew G Knepley if (section) { 63237d0c07bSMatthew G Knepley PetscInt bs = -1; 63337d0c07bSMatthew G Knepley PetscInt localSize; 63437d0c07bSMatthew G Knepley PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, isSymMPIBlock, isSymmetric; 63537d0c07bSMatthew G Knepley 63637d0c07bSMatthew G Knepley ierr = DMGetDefaultGlobalSection(da, 
§ionGlobal);CHKERRQ(ierr); 63737d0c07bSMatthew G Knepley ierr = PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr); 63882f516ccSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)da), J);CHKERRQ(ierr); 63937d0c07bSMatthew G Knepley ierr = MatSetSizes(*J, localSize, localSize, PETSC_DETERMINE, PETSC_DETERMINE);CHKERRQ(ierr); 64037d0c07bSMatthew G Knepley ierr = MatSetType(*J, mtype);CHKERRQ(ierr); 64137d0c07bSMatthew G Knepley ierr = MatSetFromOptions(*J);CHKERRQ(ierr); 64237d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSHELL, &isShell);CHKERRQ(ierr); 64337d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATBAIJ, &isBlock);CHKERRQ(ierr); 64437d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSEQBAIJ, &isSeqBlock);CHKERRQ(ierr); 64537d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATMPIBAIJ, &isMPIBlock);CHKERRQ(ierr); 64637d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSBAIJ, &isSymBlock);CHKERRQ(ierr); 64737d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSEQSBAIJ, &isSymSeqBlock);CHKERRQ(ierr); 64837d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATMPISBAIJ, &isSymMPIBlock);CHKERRQ(ierr); 64937d0c07bSMatthew G Knepley /* Check for symmetric storage */ 65037d0c07bSMatthew G Knepley isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock); 65137d0c07bSMatthew G Knepley if (isSymmetric) { 65237d0c07bSMatthew G Knepley ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr); 65337d0c07bSMatthew G Knepley } 65437d0c07bSMatthew G Knepley if (!isShell) { 65537d0c07bSMatthew G Knepley PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal; 65637d0c07bSMatthew G Knepley 65737d0c07bSMatthew G Knepley if (bs < 0) { 65837d0c07bSMatthew G Knepley if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) { 65937d0c07bSMatthew G Knepley PetscInt pStart, pEnd, p, dof; 66037d0c07bSMatthew G Knepley 66137d0c07bSMatthew G Knepley ierr = 
PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr); 66237d0c07bSMatthew G Knepley for (p = pStart; p < pEnd; ++p) { 66337d0c07bSMatthew G Knepley ierr = PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr); 66437d0c07bSMatthew G Knepley if (dof) { 66537d0c07bSMatthew G Knepley bs = dof; 66637d0c07bSMatthew G Knepley break; 66737d0c07bSMatthew G Knepley } 66837d0c07bSMatthew G Knepley } 66937d0c07bSMatthew G Knepley } else { 67037d0c07bSMatthew G Knepley bs = 1; 67137d0c07bSMatthew G Knepley } 67237d0c07bSMatthew G Knepley /* Must have same blocksize on all procs (some might have no points) */ 67337d0c07bSMatthew G Knepley bsLocal = bs; 674b2566f29SBarry Smith ierr = MPIU_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr); 67537d0c07bSMatthew G Knepley } 6761795a4d1SJed Brown ierr = PetscCalloc4(localSize/bs, &dnz, localSize/bs, &onz, localSize/bs, &dnzu, localSize/bs, &onzu);CHKERRQ(ierr); 677552f7358SJed Brown /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */ 67837d0c07bSMatthew G Knepley ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr); 67937d0c07bSMatthew G Knepley } 68037d0c07bSMatthew G Knepley } 68147c6ae99SBarry Smith /* 68247c6ae99SBarry Smith m 68347c6ae99SBarry Smith ------------------------------------------------------ 68447c6ae99SBarry Smith | | 68547c6ae99SBarry Smith | | 68647c6ae99SBarry Smith | ---------------------- | 68747c6ae99SBarry Smith | | | | 68847c6ae99SBarry Smith n | ny | | | 68947c6ae99SBarry Smith | | | | 69047c6ae99SBarry Smith | .--------------------- | 69147c6ae99SBarry Smith | (xs,ys) nx | 69247c6ae99SBarry Smith | . 
| 69347c6ae99SBarry Smith | (gxs,gys) | 69447c6ae99SBarry Smith | | 69547c6ae99SBarry Smith ----------------------------------------------------- 69647c6ae99SBarry Smith */ 69747c6ae99SBarry Smith 69847c6ae99SBarry Smith /* 69947c6ae99SBarry Smith nc - number of components per grid point 70047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 70147c6ae99SBarry Smith 70247c6ae99SBarry Smith */ 703e30e807fSPeter Brune M = dd->M; 704e30e807fSPeter Brune N = dd->N; 705e30e807fSPeter Brune P = dd->P; 706c73cfb54SMatthew G. Knepley dim = da->dim; 707e30e807fSPeter Brune dof = dd->w; 708e30e807fSPeter Brune /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */ 709aa219208SBarry Smith ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr); 71047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 71147c6ae99SBarry Smith ierr = MatCreate(comm,&A);CHKERRQ(ierr); 71247c6ae99SBarry Smith ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr); 713b412c318SBarry Smith ierr = MatSetType(A,mtype);CHKERRQ(ierr); 71495ee5b0eSBarry Smith ierr = MatSetDM(A,da);CHKERRQ(ierr); 71547c6ae99SBarry Smith ierr = MatSetFromOptions(A);CHKERRQ(ierr); 71647c6ae99SBarry Smith ierr = MatGetType(A,&Atype);CHKERRQ(ierr); 71747c6ae99SBarry Smith /* 718aa219208SBarry Smith We do not provide a getmatrix function in the DMDA operations because 719aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 72047c6ae99SBarry Smith more low-level than matrices. This is kind of cheating but, cause sometimes 721aa219208SBarry Smith we think of DMDA has higher level than matrices. 
72247c6ae99SBarry Smith 72347c6ae99SBarry Smith We could switch based on Atype (or mtype), but we do not since the 72447c6ae99SBarry Smith specialized setting routines depend only the particular preallocation 72547c6ae99SBarry Smith details of the matrix, not the type itself. 72647c6ae99SBarry Smith */ 72747c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 72847c6ae99SBarry Smith if (!aij) { 72947c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 73047c6ae99SBarry Smith } 73147c6ae99SBarry Smith if (!aij) { 73247c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 73347c6ae99SBarry Smith if (!baij) { 73447c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 73547c6ae99SBarry Smith } 73647c6ae99SBarry Smith if (!baij) { 73747c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 73847c6ae99SBarry Smith if (!sbaij) { 73947c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 74047c6ae99SBarry Smith } 74147c6ae99SBarry Smith } 74247c6ae99SBarry Smith } 74347c6ae99SBarry Smith if (aij) { 74447c6ae99SBarry Smith if (dim == 1) { 745ce308e1dSBarry Smith if (dd->ofill) { 746ce308e1dSBarry Smith ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 747ce308e1dSBarry Smith } else { 748950540a4SJed Brown ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr); 749ce308e1dSBarry Smith } 75047c6ae99SBarry Smith } else if (dim == 2) { 75147c6ae99SBarry Smith if (dd->ofill) { 752950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 75347c6ae99SBarry Smith } else { 754950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr); 75547c6ae99SBarry 
Smith } 75647c6ae99SBarry Smith } else if (dim == 3) { 75747c6ae99SBarry Smith if (dd->ofill) { 758950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 75947c6ae99SBarry Smith } else { 760950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr); 76147c6ae99SBarry Smith } 76247c6ae99SBarry Smith } 76347c6ae99SBarry Smith } else if (baij) { 76447c6ae99SBarry Smith if (dim == 2) { 765950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr); 76647c6ae99SBarry Smith } else if (dim == 3) { 767950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr); 768ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 76947c6ae99SBarry Smith } else if (sbaij) { 77047c6ae99SBarry Smith if (dim == 2) { 771950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr); 77247c6ae99SBarry Smith } else if (dim == 3) { 773950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr); 774ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! 
Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 775869776cdSLisandro Dalcin } else { 77645b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 777869776cdSLisandro Dalcin ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 7782949035bSJed Brown ierr = MatSetUp(A);CHKERRQ(ierr); 779869776cdSLisandro Dalcin ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr); 78047c6ae99SBarry Smith } 781aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr); 78247c6ae99SBarry Smith ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr); 783c688c046SMatthew G Knepley ierr = MatSetDM(A,da);CHKERRQ(ierr); 78447c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 78547c6ae99SBarry Smith if (size > 1) { 78647c6ae99SBarry Smith /* change viewer to display matrix in natural ordering */ 78747c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr); 78847c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr); 78947c6ae99SBarry Smith } 79047c6ae99SBarry Smith *J = A; 79147c6ae99SBarry Smith PetscFunctionReturn(0); 79247c6ae99SBarry Smith } 79347c6ae99SBarry Smith 79447c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 79547c6ae99SBarry Smith #undef __FUNCT__ 796950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIAIJ" 797950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J) 79847c6ae99SBarry Smith { 79947c6ae99SBarry Smith PetscErrorCode ierr; 800*c1154cd5SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,M,N; 80147c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 80247c6ae99SBarry Smith MPI_Comm comm; 80347c6ae99SBarry Smith PetscScalar *values; 804bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 80545b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 806aa219208SBarry Smith DMDAStencilType st; 807*c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 80847c6ae99SBarry Smith 80947c6ae99SBarry Smith PetscFunctionBegin; 81047c6ae99SBarry Smith /* 81147c6ae99SBarry Smith nc - number of components per grid point 81247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 81347c6ae99SBarry Smith 81447c6ae99SBarry Smith */ 815*c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 81647c6ae99SBarry Smith col = 2*s + 1; 817*c1154cd5SBarry Smith /* 818*c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 819*c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 820*c1154cd5SBarry Smith */ 821*c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 822*c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 823aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 824aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 82547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 82647c6ae99SBarry Smith 827dcca6d9dSJed Brown ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr); 8281411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 82947c6ae99SBarry Smith 83006ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 83147c6ae99SBarry Smith /* determine the matrix preallocation information */ 83247c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 83347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 83447c6ae99SBarry Smith 835bff4a2f0SMatthew G. Knepley pstart = (bx == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-i)); 836bff4a2f0SMatthew G. Knepley pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 83747c6ae99SBarry Smith 83847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 83947c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 84047c6ae99SBarry Smith 841bff4a2f0SMatthew G. Knepley lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 842bff4a2f0SMatthew G. Knepley lend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 84347c6ae99SBarry Smith 84447c6ae99SBarry Smith cnt = 0; 84547c6ae99SBarry Smith for (k=0; k<nc; k++) { 84647c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 84747c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 848aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 84947c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 85047c6ae99SBarry Smith } 85147c6ae99SBarry Smith } 85247c6ae99SBarry Smith } 85347c6ae99SBarry Smith rows[k] = k + nc*(slot); 85447c6ae99SBarry Smith } 855*c1154cd5SBarry Smith if (removedups) { 856*c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 857*c1154cd5SBarry Smith } else { 858784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 85947c6ae99SBarry Smith } 86047c6ae99SBarry Smith } 861*c1154cd5SBarry Smith } 862f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 86347c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 86447c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 86547c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 86647c6ae99SBarry Smith 867784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 86847c6ae99SBarry Smith 86947c6ae99SBarry Smith /* 87047c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 87147c6ae99SBarry Smith that 
includes the ghost points) then MatSetValuesLocal() maps those indices to the global 87247c6ae99SBarry Smith PETSc ordering. 87347c6ae99SBarry Smith */ 874fcfd50ebSBarry Smith if (!da->prealloc_only) { 8751795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 87647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 87747c6ae99SBarry Smith 878bff4a2f0SMatthew G. Knepley pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 879bff4a2f0SMatthew G. Knepley pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 88047c6ae99SBarry Smith 88147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 88247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 88347c6ae99SBarry Smith 884bff4a2f0SMatthew G. Knepley lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 885bff4a2f0SMatthew G. Knepley lend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 88647c6ae99SBarry Smith 88747c6ae99SBarry Smith cnt = 0; 88847c6ae99SBarry Smith for (k=0; k<nc; k++) { 88947c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 89047c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 891aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 89247c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 89347c6ae99SBarry Smith } 89447c6ae99SBarry Smith } 89547c6ae99SBarry Smith } 89647c6ae99SBarry Smith rows[k] = k + nc*(slot); 89747c6ae99SBarry Smith } 89847c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 89947c6ae99SBarry Smith } 90047c6ae99SBarry Smith } 90147c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 90247c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 90347c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 904189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 90547c6ae99SBarry Smith } 90647c6ae99SBarry Smith ierr = 
PetscFree2(rows,cols);CHKERRQ(ierr); 90747c6ae99SBarry Smith PetscFunctionReturn(0); 90847c6ae99SBarry Smith } 90947c6ae99SBarry Smith 91047c6ae99SBarry Smith #undef __FUNCT__ 911950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIAIJ_Fill" 912950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J) 91347c6ae99SBarry Smith { 91447c6ae99SBarry Smith PetscErrorCode ierr; 91547c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 916*c1154cd5SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt,maxcnt = 0,l,p,M,N; 91747c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 91847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 91947c6ae99SBarry Smith PetscInt ifill_col,*ofill = dd->ofill, *dfill = dd->dfill; 92047c6ae99SBarry Smith MPI_Comm comm; 92147c6ae99SBarry Smith PetscScalar *values; 922bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by; 92345b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 924aa219208SBarry Smith DMDAStencilType st; 925*c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 92647c6ae99SBarry Smith 92747c6ae99SBarry Smith PetscFunctionBegin; 92847c6ae99SBarry Smith /* 92947c6ae99SBarry Smith nc - number of components per grid point 93047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 93147c6ae99SBarry Smith 93247c6ae99SBarry Smith */ 933*c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 93447c6ae99SBarry Smith col = 2*s + 1; 935*c1154cd5SBarry Smith /* 936*c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 937*c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 
938*c1154cd5SBarry Smith */ 939*c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 940*c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 941aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 942aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 94347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 94447c6ae99SBarry Smith 9454b26d1cfSBarry Smith ierr = PetscMalloc1(col*col*nc,&cols);CHKERRQ(ierr); 9461411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 94747c6ae99SBarry Smith 94806ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 94947c6ae99SBarry Smith /* determine the matrix preallocation information */ 95047c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 95147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 95247c6ae99SBarry Smith 953bff4a2f0SMatthew G. Knepley pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 954bff4a2f0SMatthew G. Knepley pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 95547c6ae99SBarry Smith 95647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 95747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 95847c6ae99SBarry Smith 959bff4a2f0SMatthew G. Knepley lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 960bff4a2f0SMatthew G. Knepley lend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 96147c6ae99SBarry Smith 96247c6ae99SBarry Smith for (k=0; k<nc; k++) { 96347c6ae99SBarry Smith cnt = 0; 96447c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 96547c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 96647c6ae99SBarry Smith if (l || p) { 967aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 9688865f1eaSKarl Rupp for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 96947c6ae99SBarry Smith } 97047c6ae99SBarry Smith } else { 97147c6ae99SBarry Smith if (dfill) { 9728865f1eaSKarl Rupp for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 97347c6ae99SBarry Smith } else { 9748865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 97547c6ae99SBarry Smith } 97647c6ae99SBarry Smith } 97747c6ae99SBarry Smith } 97847c6ae99SBarry Smith } 97947c6ae99SBarry Smith row = k + nc*(slot); 980c0ab637bSBarry Smith maxcnt = PetscMax(maxcnt,cnt); 981*c1154cd5SBarry Smith if (removedups) { 982*c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 983*c1154cd5SBarry Smith } else { 984784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 98547c6ae99SBarry Smith } 98647c6ae99SBarry Smith } 98747c6ae99SBarry Smith } 988*c1154cd5SBarry Smith } 98947c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 99047c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 99147c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 992784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 99347c6ae99SBarry Smith 99447c6ae99SBarry Smith /* 99547c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 
99647c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 99747c6ae99SBarry Smith PETSc ordering. 99847c6ae99SBarry Smith */ 999fcfd50ebSBarry Smith if (!da->prealloc_only) { 1000c0ab637bSBarry Smith ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr); 100147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 100247c6ae99SBarry Smith 1003bff4a2f0SMatthew G. Knepley pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1004bff4a2f0SMatthew G. Knepley pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 100547c6ae99SBarry Smith 100647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 100747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 100847c6ae99SBarry Smith 1009bff4a2f0SMatthew G. Knepley lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1010bff4a2f0SMatthew G. Knepley lend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 101147c6ae99SBarry Smith 101247c6ae99SBarry Smith for (k=0; k<nc; k++) { 101347c6ae99SBarry Smith cnt = 0; 101447c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 101547c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 101647c6ae99SBarry Smith if (l || p) { 1017aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 10188865f1eaSKarl Rupp for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 101947c6ae99SBarry Smith } 102047c6ae99SBarry Smith } else { 102147c6ae99SBarry Smith if (dfill) { 10228865f1eaSKarl Rupp for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 102347c6ae99SBarry Smith } else { 10248865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 102547c6ae99SBarry Smith } 102647c6ae99SBarry Smith } 102747c6ae99SBarry Smith } 102847c6ae99SBarry Smith } 102947c6ae99SBarry Smith row = k + nc*(slot); 103047c6ae99SBarry Smith ierr = 
MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 103147c6ae99SBarry Smith } 103247c6ae99SBarry Smith } 103347c6ae99SBarry Smith } 103447c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 103547c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 103647c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1037189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 103847c6ae99SBarry Smith } 103947c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 104047c6ae99SBarry Smith PetscFunctionReturn(0); 104147c6ae99SBarry Smith } 104247c6ae99SBarry Smith 104347c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 104447c6ae99SBarry Smith 104547c6ae99SBarry Smith #undef __FUNCT__ 1046950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIAIJ" 1047950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J) 104847c6ae99SBarry Smith { 104947c6ae99SBarry Smith PetscErrorCode ierr; 105047c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 10510298fd71SBarry Smith PetscInt m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL; 1052*c1154cd5SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 105347c6ae99SBarry Smith MPI_Comm comm; 105447c6ae99SBarry Smith PetscScalar *values; 1055bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 105645b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 1057aa219208SBarry Smith DMDAStencilType st; 1058*c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 105947c6ae99SBarry Smith 106047c6ae99SBarry Smith PetscFunctionBegin; 106147c6ae99SBarry Smith /* 106247c6ae99SBarry Smith nc - number of components per grid point 106347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 106447c6ae99SBarry Smith 106547c6ae99SBarry Smith */ 1066*c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 106747c6ae99SBarry Smith col = 2*s + 1; 106847c6ae99SBarry Smith 1069*c1154cd5SBarry Smith /* 1070*c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 1071*c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 1072*c1154cd5SBarry Smith */ 1073*c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 1074*c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 1075*c1154cd5SBarry Smith if (P == 1 && 2*s >= p) removedups = PETSC_TRUE; 1076*c1154cd5SBarry Smith 1077aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1078aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 107947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 108047c6ae99SBarry Smith 1081dcca6d9dSJed Brown ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr); 10821411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 108347c6ae99SBarry Smith 108406ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 108547c6ae99SBarry Smith /* determine the matrix preallocation information */ 108647c6ae99SBarry Smith ierr = 
MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 108747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1088bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1089bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 109047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1091bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1092bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 109347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1094bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1095bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 109647c6ae99SBarry Smith 109747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 109847c6ae99SBarry Smith 109947c6ae99SBarry Smith cnt = 0; 110047c6ae99SBarry Smith for (l=0; l<nc; l++) { 110147c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 110247c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 110347c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1104aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 110547c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 110647c6ae99SBarry Smith } 110747c6ae99SBarry Smith } 110847c6ae99SBarry Smith } 110947c6ae99SBarry Smith } 111047c6ae99SBarry Smith rows[l] = l + nc*(slot); 111147c6ae99SBarry Smith } 1112*c1154cd5SBarry Smith if (removedups) { 1113*c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 1114*c1154cd5SBarry Smith } else { 1115784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 111647c6ae99SBarry Smith } 111747c6ae99SBarry Smith } 111847c6ae99SBarry Smith } 1119*c1154cd5SBarry Smith } 
1120f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 112147c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 112247c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 112347c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1124784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 112547c6ae99SBarry Smith 112647c6ae99SBarry Smith /* 112747c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 112847c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 112947c6ae99SBarry Smith PETSc ordering. 113047c6ae99SBarry Smith */ 1131fcfd50ebSBarry Smith if (!da->prealloc_only) { 11321795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr); 113347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1134bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1135bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 113647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1137bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1138bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 113947c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1140bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1141bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 114247c6ae99SBarry Smith 114347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 114447c6ae99SBarry Smith 114547c6ae99SBarry Smith cnt = 0; 114647c6ae99SBarry Smith for (l=0; l<nc; l++) { 114747c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 114847c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 114947c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1150aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 115147c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 115247c6ae99SBarry Smith } 115347c6ae99SBarry Smith } 115447c6ae99SBarry Smith } 115547c6ae99SBarry Smith } 115647c6ae99SBarry Smith rows[l] = l + nc*(slot); 115747c6ae99SBarry Smith } 115847c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 115947c6ae99SBarry Smith } 116047c6ae99SBarry Smith } 116147c6ae99SBarry Smith } 116247c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 116347c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 116447c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1165189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 116647c6ae99SBarry Smith } 116747c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 116847c6ae99SBarry Smith PetscFunctionReturn(0); 116947c6ae99SBarry Smith }

/* ---------------------------------------------------------------------------------*/

#undef __FUNCT__
#define __FUNCT__ "DMCreateMatrix_DA_1d_MPIAIJ_Fill"
/*
   DMCreateMatrix_DA_1d_MPIAIJ_Fill - Preallocates the AIJ matrix J of a 1d DMDA from the block fill
   patterns stored in the DMDA and, unless da->prealloc_only is set, inserts explicit zeros at every
   stencil location and assembles J.

   Input Parameters:
+  da - the 1d DMDA; its ofill array is read unconditionally, its dfill array may be NULL
        (NULL means the diagonal block is dense, i.e. nc entries per row)
-  J  - the matrix to preallocate and (optionally) fill

   Notes:
   Both fill arrays use the modified CSR layout built by DMDASetBlockFills_Private():
   fill[j+1] - fill[j] is the number of components coupled to component j and
   fill[fill[j]] ... fill[fill[j+1]-1] are the indices of those components.

   Returns PETSC_ERR_SUP for periodic boundaries, for fewer than two locally owned grid points,
   and for fewer than 2*s locally owned grid points (s is the stencil width); the per-row counting
   below assumes the left and right boundary layers of a process do not overlap.
*/
PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J)
{
  PetscErrorCode         ierr;
  DM_DA                  *dd = (DM_DA*)da->data;
  PetscInt               xs,nx,i,j,row,k,l,idx;
  PetscInt               m,dim,s,*cols = NULL,nc,cnt,maxcnt = 0,*ocols;
  PetscInt               nd,no;
  PetscInt               *ofill = dd->ofill,*dfill = dd->dfill;
  PetscScalar            *values;
  ISLocalToGlobalMapping ltog;
  PetscMPIInt            rank,size;

  PetscFunctionBegin;
  if (dd->bx == DM_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions");
  ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)da),&rank);CHKERRQ(ierr);
  ierr = MPI_Comm_size(PetscObjectComm((PetscObject)da),&size);CHKERRQ(ierr);

  /*
         nc - number of components per grid point
         m  - global number of grid points
         s  - stencil width
  */
  ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,0,0,0,0);CHKERRQ(ierr);
  ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);

  /* Validate the local size before allocating anything so the error returns cannot leak */
  if (nx < 2) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Need at least two grid points per process");
  /* The three counting loops below write 2*s*nc entries when nx < 2*s, overrunning the nx*nc arrays */
  if (nx < 2*s) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Need at least 2*stencil_width grid points per process");

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = PetscCalloc2(nx*nc,&cols,nx*nc,&ocols);CHKERRQ(ierr);

  /*
     Count, for every locally owned row, the nonzeros in the diagonal (cols) and off-diagonal
     (ocols) portions of the parallel matrix.  nd is the number of couplings inside the grid
     point itself, no the number of couplings to each neighbouring grid point.
  */
  cnt = 0;
  /* coupling with process to the left */
  for (i=0; i<s; i++) {
    for (j=0; j<nc; j++) {
      no         = ofill[j+1] - ofill[j];
      nd         = dfill ? dfill[j+1] - dfill[j] : nc;
      ocols[cnt] = (!rank) ? 0 : (s - i)*no;
      cols[cnt]  = nd + (s + i)*no;
      maxcnt     = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
      cnt++;
    }
  }
  /* interior points: all 2*s neighbours are local, ocols keeps the zero written by PetscCalloc2() */
  for (i=s; i<nx-s; i++) {
    for (j=0; j<nc; j++) {
      no        = ofill[j+1] - ofill[j];
      nd        = dfill ? dfill[j+1] - dfill[j] : nc;
      cols[cnt] = nd + 2*s*no;
      maxcnt    = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
      cnt++;
    }
  }
  /* coupling with process to the right */
  for (i=nx-s; i<nx; i++) {
    for (j=0; j<nc; j++) {
      no         = ofill[j+1] - ofill[j];
      nd         = dfill ? dfill[j+1] - dfill[j] : nc;
      ocols[cnt] = (rank == (size-1)) ? 0 : (i - nx + s + 1)*no;
      cols[cnt]  = nd + (s + nx - i - 1)*no;
      maxcnt     = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
      cnt++;
    }
  }

  ierr = MatSeqAIJSetPreallocation(J,0,cols);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,cols,0,ocols);CHKERRQ(ierr);
  ierr = PetscFree2(cols,ocols);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    Insert an explicit zero at every stencil location.  Rows and columns are given in the global
    numbering (grid index times nc plus component), hence MatSetValues() and not MatSetValuesLocal().
  */
  if (!da->prealloc_only) {
    ierr = PetscCalloc2(maxcnt,&values,maxcnt,&cols);CHKERRQ(ierr);

    row = xs*nc;
    for (i=xs; i<xs+nx; i++) {
      for (j=0; j<nc; j++) {
        cnt = 0;
        /*
           Neighbours to the left, i-s ... i-1.  Only grid points inside [0,m) exist because the
           boundary is not periodic; testing the index rather than the rank keeps the in-domain
           neighbours of the first s points, which the counts above already include.
        */
        for (l=0; l<s; l++) {
          idx = i - s + l;
          if (idx < 0) continue;
          for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = idx*nc + ofill[k];
        }
        /* couplings inside the grid point itself */
        if (dfill) {
          for (k=dfill[j]; k<dfill[j+1]; k++) {
            cols[cnt++] = i*nc + dfill[k];
          }
        } else {
          for (k=0; k<nc; k++) {
            cols[cnt++] = i*nc + k;
          }
        }
        /* neighbours to the right, visited as i+s ... i+1 */
        for (l=0; l<s; l++) {
          idx = i + s - l;
          if (idx >= m) continue;
          for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = idx*nc + ofill[k];
        }
        ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        row++;
      }
    }
    ierr = PetscFree2(values,cols);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    /* from now on inserting outside the pattern created above is an error */
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

/* ---------------------------------------------------------------------------------*/

#undef __FUNCT__
#define __FUNCT__ "DMCreateMatrix_DA_1d_MPIAIJ"
/*
   DMCreateMatrix_DA_1d_MPIAIJ - Preallocates the AIJ matrix J of a 1d DMDA with (2*s+1)*nc nonzeros
   per row in both the diagonal and the off-diagonal portion and, unless da->prealloc_only is set,
   inserts explicit zeros at every stencil location and assembles J.

   Input Parameters:
+  da - the 1d DMDA
-  J  - the matrix to preallocate and (optionally) fill
*/
PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,nx,i,i1,slot,gxs,gnx;
  PetscInt               m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l;
  PetscInt               istart,iend;
  PetscScalar            *values;
  DMBoundaryType         bx;
  ISLocalToGlobalMapping ltog;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem
  */
  ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
  col  = 2*s + 1;

  ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    ierr = PetscMalloc2(nc,&rows,col*nc*nc,&cols);CHKERRQ(ierr);
    ierr = PetscCalloc1(col*nc*nc,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {
      /* clip the stencil to the ghosted range [gxs, gxs+gnx) */
      istart = PetscMax(-s,gxs - i);
      iend   = PetscMin(s,gxs + gnx - i - 1);
      slot   = i - gxs;

      cnt = 0;
      for (l=0; l<nc; l++) {
        for (i1=istart; i1<=iend; i1++) {
          cols[cnt++] = l + nc*(slot + i1);
        }
        rows[l] = l + nc*(slot);
      }
      ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
    ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "DMCreateMatrix_DA_2d_MPIBAIJ"
PetscErrorCode
DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J) 139847c6ae99SBarry Smith { 139947c6ae99SBarry Smith PetscErrorCode ierr; 140047c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 140147c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 140247c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 140347c6ae99SBarry Smith MPI_Comm comm; 140447c6ae99SBarry Smith PetscScalar *values; 1405bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by; 1406aa219208SBarry Smith DMDAStencilType st; 140745b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 140847c6ae99SBarry Smith 140947c6ae99SBarry Smith PetscFunctionBegin; 141047c6ae99SBarry Smith /* 141147c6ae99SBarry Smith nc - number of components per grid point 141247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 141347c6ae99SBarry Smith */ 14141321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 141547c6ae99SBarry Smith col = 2*s + 1; 141647c6ae99SBarry Smith 1417aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1418aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 141947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 142047c6ae99SBarry Smith 1421785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 142247c6ae99SBarry Smith 14231411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 142447c6ae99SBarry Smith 142547c6ae99SBarry Smith /* determine the matrix preallocation information */ 142647c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 142747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1428bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1429bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,m-i-1)); 143047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1431bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1432bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 143347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 143447c6ae99SBarry Smith 143547c6ae99SBarry Smith /* Find block columns in block row */ 143647c6ae99SBarry Smith cnt = 0; 143747c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 143847c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1439aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 144047c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 144147c6ae99SBarry Smith } 144247c6ae99SBarry Smith } 144347c6ae99SBarry Smith } 1444d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 144547c6ae99SBarry Smith } 144647c6ae99SBarry Smith } 144747c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 144847c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 144947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 145047c6ae99SBarry Smith 1451784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 145247c6ae99SBarry Smith 145347c6ae99SBarry Smith /* 145447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 145547c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 145647c6ae99SBarry Smith PETSc ordering. 145747c6ae99SBarry Smith */ 1458fcfd50ebSBarry Smith if (!da->prealloc_only) { 14591795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 146047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1461bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1462bff4a2f0SMatthew G. 
Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 146347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1464bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1465bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 146647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 146747c6ae99SBarry Smith cnt = 0; 146847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 146947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1470aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 147147c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 147247c6ae99SBarry Smith } 147347c6ae99SBarry Smith } 147447c6ae99SBarry Smith } 147547c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 147647c6ae99SBarry Smith } 147747c6ae99SBarry Smith } 147847c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 147947c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 148047c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1481189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 148247c6ae99SBarry Smith } 148347c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 148447c6ae99SBarry Smith PetscFunctionReturn(0); 148547c6ae99SBarry Smith } 148647c6ae99SBarry Smith 148747c6ae99SBarry Smith #undef __FUNCT__ 1488950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIBAIJ" 1489950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J) 149047c6ae99SBarry Smith { 149147c6ae99SBarry Smith PetscErrorCode ierr; 149247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 149347c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 149447c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 149547c6ae99SBarry Smith MPI_Comm 
comm; 149647c6ae99SBarry Smith PetscScalar *values; 1497bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 1498aa219208SBarry Smith DMDAStencilType st; 149945b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 150047c6ae99SBarry Smith 150147c6ae99SBarry Smith PetscFunctionBegin; 150247c6ae99SBarry Smith /* 150347c6ae99SBarry Smith nc - number of components per grid point 150447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 150547c6ae99SBarry Smith 150647c6ae99SBarry Smith */ 15071321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 150847c6ae99SBarry Smith col = 2*s + 1; 150947c6ae99SBarry Smith 1510aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1511aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 151247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 151347c6ae99SBarry Smith 1514785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 151547c6ae99SBarry Smith 15161411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 151747c6ae99SBarry Smith 151847c6ae99SBarry Smith /* determine the matrix preallocation information */ 151947c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 152047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1521bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1522bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 152347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1524bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1525bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 152647c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1527bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-k)); 1528bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 152947c6ae99SBarry Smith 153047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 153147c6ae99SBarry Smith 153247c6ae99SBarry Smith /* Find block columns in block row */ 153347c6ae99SBarry Smith cnt = 0; 153447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 153547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 153647c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1537aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 153847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 153947c6ae99SBarry Smith } 154047c6ae99SBarry Smith } 154147c6ae99SBarry Smith } 154247c6ae99SBarry Smith } 1543d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 154447c6ae99SBarry Smith } 154547c6ae99SBarry Smith } 154647c6ae99SBarry Smith } 154747c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 154847c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 154947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 155047c6ae99SBarry Smith 1551784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 155247c6ae99SBarry Smith 155347c6ae99SBarry Smith /* 155447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 155547c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 155647c6ae99SBarry Smith PETSc ordering. 155747c6ae99SBarry Smith */ 1558fcfd50ebSBarry Smith if (!da->prealloc_only) { 15591795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 156047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1561bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-i)); 1562bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 156347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1564bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1565bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 156647c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1567bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1568bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 156947c6ae99SBarry Smith 157047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 157147c6ae99SBarry Smith 157247c6ae99SBarry Smith cnt = 0; 157347c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 157447c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 157547c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1576aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 157747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 157847c6ae99SBarry Smith } 157947c6ae99SBarry Smith } 158047c6ae99SBarry Smith } 158147c6ae99SBarry Smith } 158247c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 158347c6ae99SBarry Smith } 158447c6ae99SBarry Smith } 158547c6ae99SBarry Smith } 158647c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 158747c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 158847c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1589189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 159047c6ae99SBarry Smith } 159147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 159247c6ae99SBarry Smith PetscFunctionReturn(0); 159347c6ae99SBarry Smith } 159447c6ae99SBarry Smith 159547c6ae99SBarry 
Smith #undef __FUNCT__ 159647c6ae99SBarry Smith #define __FUNCT__ "L2GFilterUpperTriangular" 159747c6ae99SBarry Smith /* 159847c6ae99SBarry Smith This helper is for of SBAIJ preallocation, to discard the lower-triangular values which are difficult to 159947c6ae99SBarry Smith identify in the local ordering with periodic domain. 160047c6ae99SBarry Smith */ 160147c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[]) 160247c6ae99SBarry Smith { 160347c6ae99SBarry Smith PetscErrorCode ierr; 160447c6ae99SBarry Smith PetscInt i,n; 160547c6ae99SBarry Smith 160647c6ae99SBarry Smith PetscFunctionBegin; 1607d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,1,row,row);CHKERRQ(ierr); 1608d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,*cnt,col,col);CHKERRQ(ierr); 160947c6ae99SBarry Smith for (i=0,n=0; i<*cnt; i++) { 161047c6ae99SBarry Smith if (col[i] >= *row) col[n++] = col[i]; 161147c6ae99SBarry Smith } 161247c6ae99SBarry Smith *cnt = n; 161347c6ae99SBarry Smith PetscFunctionReturn(0); 161447c6ae99SBarry Smith } 161547c6ae99SBarry Smith 161647c6ae99SBarry Smith #undef __FUNCT__ 1617950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPISBAIJ" 1618950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J) 161947c6ae99SBarry Smith { 162047c6ae99SBarry Smith PetscErrorCode ierr; 162147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 162247c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 162347c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 162447c6ae99SBarry Smith MPI_Comm comm; 162547c6ae99SBarry Smith PetscScalar *values; 1626bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 1627aa219208SBarry Smith DMDAStencilType st; 162845b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 162947c6ae99SBarry Smith 163047c6ae99SBarry Smith PetscFunctionBegin; 163147c6ae99SBarry Smith /* 163247c6ae99SBarry Smith nc - number of components per grid point 163347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 163447c6ae99SBarry Smith */ 16351321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 163647c6ae99SBarry Smith col = 2*s + 1; 163747c6ae99SBarry Smith 1638aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1639aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 164047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 164147c6ae99SBarry Smith 1642785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 164347c6ae99SBarry Smith 16441411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 164547c6ae99SBarry Smith 164647c6ae99SBarry Smith /* determine the matrix preallocation information */ 1647eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 164847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1649bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1650bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 165147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1652bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1653bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 165447c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 165547c6ae99SBarry Smith 165647c6ae99SBarry Smith /* Find block columns in block row */ 165747c6ae99SBarry Smith cnt = 0; 165847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 165947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1660aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 166147c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 166247c6ae99SBarry Smith } 166347c6ae99SBarry Smith } 166447c6ae99SBarry Smith } 166545b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 1666d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 166747c6ae99SBarry Smith } 166847c6ae99SBarry Smith } 166947c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 167047c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 167147c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 167247c6ae99SBarry Smith 1673784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 167447c6ae99SBarry Smith 167547c6ae99SBarry Smith /* 167647c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 167747c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 167847c6ae99SBarry Smith PETSc ordering. 167947c6ae99SBarry Smith */ 1680fcfd50ebSBarry Smith if (!da->prealloc_only) { 16811795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 168247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1683bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1684bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 168547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1686bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-j)); 1687bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 168847c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 168947c6ae99SBarry Smith 169047c6ae99SBarry Smith /* Find block columns in block row */ 169147c6ae99SBarry Smith cnt = 0; 169247c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 169347c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1694aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 169547c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 169647c6ae99SBarry Smith } 169747c6ae99SBarry Smith } 169847c6ae99SBarry Smith } 169945b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 170047c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 170147c6ae99SBarry Smith } 170247c6ae99SBarry Smith } 170347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 170447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 170547c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1706189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 170747c6ae99SBarry Smith } 170847c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 170947c6ae99SBarry Smith PetscFunctionReturn(0); 171047c6ae99SBarry Smith } 171147c6ae99SBarry Smith 171247c6ae99SBarry Smith #undef __FUNCT__ 1713950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPISBAIJ" 1714950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J) 171547c6ae99SBarry Smith { 171647c6ae99SBarry Smith PetscErrorCode ierr; 171747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 171847c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 171947c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 172047c6ae99SBarry Smith MPI_Comm comm; 172147c6ae99SBarry Smith PetscScalar 
*values; 1722bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 1723aa219208SBarry Smith DMDAStencilType st; 172445b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 172547c6ae99SBarry Smith 172647c6ae99SBarry Smith PetscFunctionBegin; 172747c6ae99SBarry Smith /* 172847c6ae99SBarry Smith nc - number of components per grid point 172947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 173047c6ae99SBarry Smith */ 17311321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 173247c6ae99SBarry Smith col = 2*s + 1; 173347c6ae99SBarry Smith 1734aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1735aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 173647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 173747c6ae99SBarry Smith 173847c6ae99SBarry Smith /* create the matrix */ 1739785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 174047c6ae99SBarry Smith 17411411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 174247c6ae99SBarry Smith 174347c6ae99SBarry Smith /* determine the matrix preallocation information */ 1744eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 174547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1746bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1747bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 174847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1749bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1750bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 175147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1752bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-k)); 1753bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 175447c6ae99SBarry Smith 175547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 175647c6ae99SBarry Smith 175747c6ae99SBarry Smith /* Find block columns in block row */ 175847c6ae99SBarry Smith cnt = 0; 175947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 176047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 176147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1762aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 176347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 176447c6ae99SBarry Smith } 176547c6ae99SBarry Smith } 176647c6ae99SBarry Smith } 176747c6ae99SBarry Smith } 176845b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 1769d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 177047c6ae99SBarry Smith } 177147c6ae99SBarry Smith } 177247c6ae99SBarry Smith } 177347c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 177447c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 177547c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 177647c6ae99SBarry Smith 1777784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 177847c6ae99SBarry Smith 177947c6ae99SBarry Smith /* 178047c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 178147c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 178247c6ae99SBarry Smith PETSc ordering. 
178347c6ae99SBarry Smith */ 1784fcfd50ebSBarry Smith if (!da->prealloc_only) { 17851795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 178647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1787bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1788bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 178947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1790bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1791bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 179247c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1793bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1794bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 179547c6ae99SBarry Smith 179647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 179747c6ae99SBarry Smith 179847c6ae99SBarry Smith cnt = 0; 179947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 180047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 180147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1802aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 180347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 180447c6ae99SBarry Smith } 180547c6ae99SBarry Smith } 180647c6ae99SBarry Smith } 180747c6ae99SBarry Smith } 180845b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 180947c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 181047c6ae99SBarry Smith } 181147c6ae99SBarry Smith } 181247c6ae99SBarry Smith } 181347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 181447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 181547c6ae99SBarry Smith ierr = 
MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1816189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 181747c6ae99SBarry Smith } 181847c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 181947c6ae99SBarry Smith PetscFunctionReturn(0); 182047c6ae99SBarry Smith } 182147c6ae99SBarry Smith 182247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 182347c6ae99SBarry Smith 182447c6ae99SBarry Smith #undef __FUNCT__ 1825950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIAIJ_Fill" 1826950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J) 182747c6ae99SBarry Smith { 182847c6ae99SBarry Smith PetscErrorCode ierr; 182947c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 1830c0ab637bSBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt, maxcnt = 0,l,p,*dnz,*onz; 1831*c1154cd5SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 183247c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 183347c6ae99SBarry Smith PetscInt ifill_col,*dfill = dd->dfill,*ofill = dd->ofill; 183447c6ae99SBarry Smith MPI_Comm comm; 183547c6ae99SBarry Smith PetscScalar *values; 1836bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 183745b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 1838aa219208SBarry Smith DMDAStencilType st; 1839*c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 184047c6ae99SBarry Smith 184147c6ae99SBarry Smith PetscFunctionBegin; 184247c6ae99SBarry Smith /* 184347c6ae99SBarry Smith nc - number of components per grid point 184447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 184547c6ae99SBarry Smith 184647c6ae99SBarry Smith */ 1847*c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 184847c6ae99SBarry Smith col = 2*s + 1; 1849bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 185047c6ae99SBarry Smith by 2*stencil_width + 1\n"); 1851bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 185247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 1853bff4a2f0SMatthew G. Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 185447c6ae99SBarry Smith by 2*stencil_width + 1\n"); 185547c6ae99SBarry Smith 1856*c1154cd5SBarry Smith /* 1857*c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 1858*c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 
1859*c1154cd5SBarry Smith */ 1860*c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 1861*c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 1862*c1154cd5SBarry Smith if (P == 1 && 2*s >= p) removedups = PETSC_TRUE; 1863*c1154cd5SBarry Smith 1864aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1865aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 186647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 186747c6ae99SBarry Smith 1868785e854fSJed Brown ierr = PetscMalloc1(col*col*col*nc,&cols);CHKERRQ(ierr); 18691411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 187047c6ae99SBarry Smith 187147c6ae99SBarry Smith /* determine the matrix preallocation information */ 187247c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 187347c6ae99SBarry Smith 187406ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 187547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1876bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1877bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 187847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1879bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1880bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 188147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1882bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1883bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 188447c6ae99SBarry Smith 188547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 188647c6ae99SBarry Smith 188747c6ae99SBarry Smith for (l=0; l<nc; l++) { 188847c6ae99SBarry Smith cnt = 0; 188947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 189047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 189147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 189247c6ae99SBarry Smith if (ii || jj || kk) { 1893aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 18948865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 189547c6ae99SBarry Smith } 189647c6ae99SBarry Smith } else { 189747c6ae99SBarry Smith if (dfill) { 18988865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 189947c6ae99SBarry Smith } else { 19008865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 190147c6ae99SBarry Smith } 190247c6ae99SBarry Smith } 190347c6ae99SBarry Smith } 190447c6ae99SBarry Smith } 190547c6ae99SBarry Smith } 190647c6ae99SBarry Smith row = l + nc*(slot); 1907c0ab637bSBarry Smith maxcnt = PetscMax(maxcnt,cnt); 1908*c1154cd5SBarry Smith if (removedups) { 1909*c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 1910*c1154cd5SBarry Smith } else { 1911784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 191247c6ae99SBarry Smith } 191347c6ae99SBarry Smith } 191447c6ae99SBarry Smith } 191547c6ae99SBarry Smith } 1916*c1154cd5SBarry Smith } 191747c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 191847c6ae99SBarry Smith ierr = 
MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 191947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1920784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 192147c6ae99SBarry Smith 192247c6ae99SBarry Smith /* 192347c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 192447c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 192547c6ae99SBarry Smith PETSc ordering. 192647c6ae99SBarry Smith */ 1927fcfd50ebSBarry Smith if (!da->prealloc_only) { 1928c0ab637bSBarry Smith ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr); 192947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1930bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1931bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 193247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1933bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1934bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 193547c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1936bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1937bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 193847c6ae99SBarry Smith 193947c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 194047c6ae99SBarry Smith 194147c6ae99SBarry Smith for (l=0; l<nc; l++) { 194247c6ae99SBarry Smith cnt = 0; 194347c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 194447c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 194547c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 194647c6ae99SBarry Smith if (ii || jj || kk) { 1947aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 19488865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 194947c6ae99SBarry Smith } 195047c6ae99SBarry Smith } else { 195147c6ae99SBarry Smith if (dfill) { 19528865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 195347c6ae99SBarry Smith } else { 19548865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 195547c6ae99SBarry Smith } 195647c6ae99SBarry Smith } 195747c6ae99SBarry Smith } 195847c6ae99SBarry Smith } 195947c6ae99SBarry Smith } 196047c6ae99SBarry Smith row = l + nc*(slot); 196147c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 196247c6ae99SBarry Smith } 196347c6ae99SBarry Smith } 196447c6ae99SBarry Smith } 196547c6ae99SBarry Smith } 196647c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 196747c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 196847c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1969189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 197047c6ae99SBarry Smith } 197147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 
197247c6ae99SBarry Smith PetscFunctionReturn(0); 197347c6ae99SBarry Smith } 1974