1be1d678aSKris Buschelman #define PETSCMAT_DLL 2be1d678aSKris Buschelman 367e560aaSBarry Smith /* 467e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 567e560aaSBarry Smith */ 6289bc588SBarry Smith 77c4f633dSBarry Smith #include "../src/mat/impls/dense/seq/dense.h" 8f3da1532SBarry Smith #include "petscblaslapack.h" 9289bc588SBarry Smith 104a2ae208SSatish Balay #undef __FUNCT__ 114a2ae208SSatish Balay #define __FUNCT__ "MatAXPY_SeqDense" 12f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 131987afe7SBarry Smith { 141987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 15f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 1613f74950SBarry Smith PetscInt j; 170805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 18efee365bSSatish Balay PetscErrorCode ierr; 193a40ed3dSBarry Smith 203a40ed3dSBarry Smith PetscFunctionBegin; 21d0f46423SBarry Smith N = PetscBLASIntCast(X->rmap->n*X->cmap->n); 22d0f46423SBarry Smith m = PetscBLASIntCast(X->rmap->n); 230805154bSBarry Smith ldax = PetscBLASIntCast(x->lda); 240805154bSBarry Smith lday = PetscBLASIntCast(y->lda); 25a5ce6ee0Svictorle if (ldax>m || lday>m) { 26d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 27f4df32b1SMatthew Knepley BLASaxpy_(&m,&oalpha,x->v+j*ldax,&one,y->v+j*lday,&one); 28a5ce6ee0Svictorle } 29a5ce6ee0Svictorle } else { 30f4df32b1SMatthew Knepley BLASaxpy_(&N,&oalpha,x->v,&one,y->v,&one); 31a5ce6ee0Svictorle } 320450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 333a40ed3dSBarry Smith PetscFunctionReturn(0); 341987afe7SBarry Smith } 351987afe7SBarry Smith 364a2ae208SSatish Balay #undef __FUNCT__ 374a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqDense" 38dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 39289bc588SBarry Smith { 40d0f46423SBarry Smith PetscInt N = A->rmap->n*A->cmap->n; 413a40ed3dSBarry Smith 423a40ed3dSBarry Smith PetscFunctionBegin; 434e220ebcSLois Curfman McInnes info->block_size = 1.0; 444e220ebcSLois Curfman McInnes info->nz_allocated = (double)N; 456de62eeeSBarry Smith info->nz_used = (double)N; 466de62eeeSBarry Smith info->nz_unneeded = (double)0; 474e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 484e220ebcSLois Curfman McInnes info->mallocs = 0; 497adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 504e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 514e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 524e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 533a40ed3dSBarry Smith PetscFunctionReturn(0); 54289bc588SBarry Smith } 55289bc588SBarry Smith 564a2ae208SSatish Balay #undef __FUNCT__ 574a2ae208SSatish Balay #define __FUNCT__ "MatScale_SeqDense" 58f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 5980cd9d93SLois Curfman McInnes { 60273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 61f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 62efee365bSSatish Balay PetscErrorCode ierr; 630805154bSBarry Smith PetscBLASInt one = 1,j,nz,lda = PetscBLASIntCast(a->lda); 6480cd9d93SLois Curfman McInnes 653a40ed3dSBarry Smith PetscFunctionBegin; 66d0f46423SBarry Smith if (lda>A->rmap->n) { 67d0f46423SBarry Smith nz = PetscBLASIntCast(A->rmap->n); 68d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 69f4df32b1SMatthew Knepley BLASscal_(&nz,&oalpha,a->v+j*lda,&one); 70a5ce6ee0Svictorle } 71a5ce6ee0Svictorle } else { 72d0f46423SBarry Smith nz = PetscBLASIntCast(A->rmap->n*A->cmap->n); 73f4df32b1SMatthew Knepley BLASscal_(&nz,&oalpha,a->v,&one); 74a5ce6ee0Svictorle } 75efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 763a40ed3dSBarry Smith PetscFunctionReturn(0); 7780cd9d93SLois Curfman McInnes } 7880cd9d93SLois Curfman McInnes 791cbb95d3SBarry Smith #undef __FUNCT__ 801cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitian_SeqDense" 81ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 821cbb95d3SBarry Smith { 831cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 84d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,N; 851cbb95d3SBarry Smith PetscScalar *v = a->v; 861cbb95d3SBarry Smith 871cbb95d3SBarry Smith PetscFunctionBegin; 881cbb95d3SBarry Smith *fl = PETSC_FALSE; 89d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 901cbb95d3SBarry Smith N = a->lda; 911cbb95d3SBarry Smith 921cbb95d3SBarry Smith for (i=0; i<m; i++) { 931cbb95d3SBarry Smith for (j=i+1; j<m; j++) { 941cbb95d3SBarry Smith if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) PetscFunctionReturn(0); 951cbb95d3SBarry Smith } 961cbb95d3SBarry Smith } 971cbb95d3SBarry Smith *fl = PETSC_TRUE; 981cbb95d3SBarry Smith PetscFunctionReturn(0); 991cbb95d3SBarry Smith } 1001cbb95d3SBarry Smith 101b24902e0SBarry Smith #undef __FUNCT__ 102b24902e0SBarry Smith #define __FUNCT__ "MatDuplicateNoCreate_SeqDense" 103719d5645SBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 104b24902e0SBarry Smith { 105b24902e0SBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data,*l; 106b24902e0SBarry Smith PetscErrorCode ierr; 107b24902e0SBarry Smith PetscInt lda = (PetscInt)mat->lda,j,m; 108b24902e0SBarry Smith 109b24902e0SBarry Smith PetscFunctionBegin; 110719d5645SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,PETSC_NULL);CHKERRQ(ierr); 111b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 112b24902e0SBarry Smith l = (Mat_SeqDense*)newi->data; 113d0f46423SBarry Smith if (lda>A->rmap->n) { 114d0f46423SBarry Smith m = A->rmap->n; 115d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 116b24902e0SBarry Smith ierr = PetscMemcpy(l->v+j*m,mat->v+j*lda,m*sizeof(PetscScalar));CHKERRQ(ierr); 117b24902e0SBarry Smith } 118b24902e0SBarry Smith } else { 119d0f46423SBarry Smith ierr = PetscMemcpy(l->v,mat->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 120b24902e0SBarry Smith } 121b24902e0SBarry Smith } 122b24902e0SBarry Smith newi->assembled = PETSC_TRUE; 123b24902e0SBarry Smith PetscFunctionReturn(0); 124b24902e0SBarry Smith } 125b24902e0SBarry Smith 1264a2ae208SSatish Balay #undef __FUNCT__ 1274a2ae208SSatish Balay #define __FUNCT__ "MatDuplicate_SeqDense" 128dfbe8321SBarry Smith PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 12902cad45dSBarry Smith { 1306849ba73SBarry Smith PetscErrorCode ierr; 13102cad45dSBarry Smith 1323a40ed3dSBarry Smith PetscFunctionBegin; 1335c9eb25fSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,newmat);CHKERRQ(ierr); 134d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1355c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 136719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 137b24902e0SBarry Smith PetscFunctionReturn(0); 138b24902e0SBarry Smith } 139b24902e0SBarry Smith 1406ee01492SSatish Balay 1410481f469SBarry Smith extern PetscErrorCode MatLUFactor_SeqDense(Mat,IS,IS,const MatFactorInfo*); 142719d5645SBarry Smith 1434a2ae208SSatish Balay #undef __FUNCT__ 1444a2ae208SSatish Balay #define __FUNCT__ "MatLUFactorNumeric_SeqDense" 1450481f469SBarry Smith PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 146289bc588SBarry Smith { 1474482741eSBarry Smith MatFactorInfo info; 148a093e273SMatthew Knepley PetscErrorCode ierr; 1493a40ed3dSBarry Smith 1503a40ed3dSBarry Smith PetscFunctionBegin; 151c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 152719d5645SBarry Smith ierr = MatLUFactor_SeqDense(fact,0,0,&info);CHKERRQ(ierr); 1533a40ed3dSBarry Smith PetscFunctionReturn(0); 154289bc588SBarry Smith } 1556ee01492SSatish Balay 1560b4b3355SBarry Smith #undef __FUNCT__ 1574a2ae208SSatish Balay #define __FUNCT__ "MatSolve_SeqDense" 158dfbe8321SBarry Smith PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 159289bc588SBarry Smith { 160c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1616849ba73SBarry Smith PetscErrorCode ierr; 16287828ca2SBarry Smith PetscScalar *x,*y; 163d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 16467e560aaSBarry Smith 1653a40ed3dSBarry Smith PetscFunctionBegin; 1661ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 1671ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 168d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 169d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 170ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 171e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 172ae7cfcebSSatish Balay #else 17371044d3cSBarry Smith LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 174e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 175ae7cfcebSSatish Balay #endif 176d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY){ 177ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 178e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 179ae7cfcebSSatish Balay #else 18071044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 181e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 182ae7cfcebSSatish Balay #endif 183289bc588SBarry Smith } 184e32f2f54SBarry Smith else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 1851ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 1861ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 187dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 1883a40ed3dSBarry Smith PetscFunctionReturn(0); 189289bc588SBarry Smith } 1906ee01492SSatish Balay 1914a2ae208SSatish Balay #undef __FUNCT__ 1924a2ae208SSatish Balay #define __FUNCT__ "MatSolveTranspose_SeqDense" 193dfbe8321SBarry Smith PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 194da3a660dSBarry Smith { 195c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 196dfbe8321SBarry Smith PetscErrorCode ierr; 19787828ca2SBarry Smith PetscScalar *x,*y; 198d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 19967e560aaSBarry Smith 2003a40ed3dSBarry Smith PetscFunctionBegin; 2011ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2021ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 203d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 204752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 205da3a660dSBarry Smith if (mat->pivots) { 206ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 207e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 208ae7cfcebSSatish Balay #else 20971044d3cSBarry Smith LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 210e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 211ae7cfcebSSatish Balay #endif 2127a97a34bSBarry Smith } else { 213ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 214e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 215ae7cfcebSSatish Balay #else 21671044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 217e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 218ae7cfcebSSatish Balay #endif 219da3a660dSBarry Smith } 2201ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 2211ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 222dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 2233a40ed3dSBarry Smith PetscFunctionReturn(0); 224da3a660dSBarry Smith } 2256ee01492SSatish Balay 2264a2ae208SSatish Balay #undef __FUNCT__ 2274a2ae208SSatish Balay #define __FUNCT__ "MatSolveAdd_SeqDense" 228dfbe8321SBarry Smith PetscErrorCode MatSolveAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 229da3a660dSBarry Smith { 230c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 231dfbe8321SBarry Smith PetscErrorCode ierr; 23287828ca2SBarry Smith PetscScalar *x,*y,sone = 1.0; 233da3a660dSBarry Smith Vec tmp = 0; 234d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 23567e560aaSBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 2371ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2381ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 239d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 240da3a660dSBarry Smith if (yy == zz) { 24178b31e54SBarry Smith ierr = VecDuplicate(yy,&tmp);CHKERRQ(ierr); 24252e6d16bSBarry Smith ierr = PetscLogObjectParent(A,tmp);CHKERRQ(ierr); 24378b31e54SBarry Smith ierr = VecCopy(yy,tmp);CHKERRQ(ierr); 244da3a660dSBarry Smith } 245d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 246752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 247da3a660dSBarry Smith if (mat->pivots) { 248ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 249e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 250ae7cfcebSSatish Balay #else 25171044d3cSBarry Smith LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 252e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 253ae7cfcebSSatish Balay #endif 254a8c6a408SBarry Smith } else { 255ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 256e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 257ae7cfcebSSatish Balay #else 25871044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 259e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 260ae7cfcebSSatish Balay #endif 261da3a660dSBarry Smith } 2622dcb1b2aSMatthew Knepley if (tmp) {ierr = VecAXPY(yy,sone,tmp);CHKERRQ(ierr); ierr = VecDestroy(tmp);CHKERRQ(ierr);} 2632dcb1b2aSMatthew Knepley else {ierr = VecAXPY(yy,sone,zz);CHKERRQ(ierr);} 2641ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 2651ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 266dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n);CHKERRQ(ierr); 2673a40ed3dSBarry Smith PetscFunctionReturn(0); 268da3a660dSBarry Smith } 26967e560aaSBarry Smith 2704a2ae208SSatish Balay #undef __FUNCT__ 2714a2ae208SSatish Balay #define __FUNCT__ "MatSolveTransposeAdd_SeqDense" 272dfbe8321SBarry Smith PetscErrorCode MatSolveTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 273da3a660dSBarry Smith { 274c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 2756849ba73SBarry Smith PetscErrorCode ierr; 27687828ca2SBarry Smith PetscScalar *x,*y,sone = 1.0; 277da3a660dSBarry Smith Vec tmp; 278d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 27967e560aaSBarry Smith 2803a40ed3dSBarry Smith PetscFunctionBegin; 281d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 2821ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2831ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 284da3a660dSBarry Smith if (yy == zz) { 28578b31e54SBarry Smith ierr = VecDuplicate(yy,&tmp);CHKERRQ(ierr); 28652e6d16bSBarry Smith ierr = PetscLogObjectParent(A,tmp);CHKERRQ(ierr); 28778b31e54SBarry Smith ierr = VecCopy(yy,tmp);CHKERRQ(ierr); 288da3a660dSBarry Smith } 289d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 290752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 291da3a660dSBarry Smith if (mat->pivots) { 292ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 293e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 294ae7cfcebSSatish Balay #else 29571044d3cSBarry Smith LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 296e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 297ae7cfcebSSatish Balay #endif 2983a40ed3dSBarry Smith } else { 299ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 300e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 301ae7cfcebSSatish Balay #else 30271044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 303e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 304ae7cfcebSSatish Balay #endif 305da3a660dSBarry Smith } 30690f02eecSBarry Smith if (tmp) { 3072dcb1b2aSMatthew Knepley ierr = VecAXPY(yy,sone,tmp);CHKERRQ(ierr); 30890f02eecSBarry Smith ierr = VecDestroy(tmp);CHKERRQ(ierr); 3093a40ed3dSBarry Smith } else { 3102dcb1b2aSMatthew Knepley ierr = VecAXPY(yy,sone,zz);CHKERRQ(ierr); 31190f02eecSBarry Smith } 3121ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 3131ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 314dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n);CHKERRQ(ierr); 3153a40ed3dSBarry Smith PetscFunctionReturn(0); 316da3a660dSBarry Smith } 317db4efbfdSBarry Smith 318db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 319db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 320db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 321db4efbfdSBarry Smith #undef __FUNCT__ 322db4efbfdSBarry Smith #define __FUNCT__ "MatLUFactor_SeqDense" 3230481f469SBarry Smith PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 324db4efbfdSBarry Smith { 325db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_GETRF) 326db4efbfdSBarry Smith PetscFunctionBegin; 327e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRF - Lapack routine is unavailable."); 328db4efbfdSBarry Smith #else 329db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 330db4efbfdSBarry Smith PetscErrorCode ierr; 331db4efbfdSBarry Smith PetscBLASInt n,m,info; 332db4efbfdSBarry Smith 333db4efbfdSBarry Smith PetscFunctionBegin; 334db4efbfdSBarry Smith n = PetscBLASIntCast(A->cmap->n); 335db4efbfdSBarry Smith m = PetscBLASIntCast(A->rmap->n); 336db4efbfdSBarry Smith if (!mat->pivots) { 337db4efbfdSBarry Smith ierr = PetscMalloc((A->rmap->n+1)*sizeof(PetscBLASInt),&mat->pivots);CHKERRQ(ierr); 338db4efbfdSBarry Smith ierr = PetscLogObjectMemory(A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 339db4efbfdSBarry Smith } 340db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 341db4efbfdSBarry Smith LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info); 342e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 343e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 344db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 345db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 346db4efbfdSBarry Smith A->ops->solveadd = MatSolveAdd_SeqDense; 347db4efbfdSBarry Smith A->ops->solvetransposeadd = MatSolveTransposeAdd_SeqDense; 348d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 349db4efbfdSBarry Smith 350dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 351db4efbfdSBarry Smith #endif 352db4efbfdSBarry Smith PetscFunctionReturn(0); 353db4efbfdSBarry Smith } 354db4efbfdSBarry Smith 355db4efbfdSBarry Smith #undef __FUNCT__ 356db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactor_SeqDense" 3570481f469SBarry Smith PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 358db4efbfdSBarry Smith { 359db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_POTRF) 360db4efbfdSBarry Smith PetscFunctionBegin; 361e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRF - Lapack routine is unavailable."); 362db4efbfdSBarry Smith #else 363db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 364db4efbfdSBarry Smith PetscErrorCode ierr; 365db4efbfdSBarry Smith PetscBLASInt info,n = PetscBLASIntCast(A->cmap->n); 366db4efbfdSBarry Smith 367db4efbfdSBarry Smith PetscFunctionBegin; 368db4efbfdSBarry Smith ierr = PetscFree(mat->pivots);CHKERRQ(ierr); 369db4efbfdSBarry Smith mat->pivots = 0; 370db4efbfdSBarry Smith 371db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 372db4efbfdSBarry Smith LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info); 373e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 374db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 375db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 376db4efbfdSBarry Smith A->ops->solveadd = MatSolveAdd_SeqDense; 377db4efbfdSBarry Smith A->ops->solvetransposeadd = MatSolveTransposeAdd_SeqDense; 378d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 379dc0b31edSSatish Balay ierr = PetscLogFlops((A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 380db4efbfdSBarry Smith #endif 381db4efbfdSBarry Smith PetscFunctionReturn(0); 382db4efbfdSBarry Smith } 383db4efbfdSBarry Smith 384db4efbfdSBarry Smith 385db4efbfdSBarry Smith #undef __FUNCT__ 386db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactorNumeric_SeqDense" 3870481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 388db4efbfdSBarry Smith { 389db4efbfdSBarry Smith PetscErrorCode ierr; 390db4efbfdSBarry Smith MatFactorInfo info; 391db4efbfdSBarry Smith 392db4efbfdSBarry Smith PetscFunctionBegin; 393db4efbfdSBarry Smith info.fill = 1.0; 394c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 395719d5645SBarry Smith ierr = MatCholeskyFactor_SeqDense(fact,0,&info);CHKERRQ(ierr); 396db4efbfdSBarry Smith PetscFunctionReturn(0); 397db4efbfdSBarry Smith } 398db4efbfdSBarry Smith 399db4efbfdSBarry Smith #undef __FUNCT__ 400db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactorSymbolic_SeqDense" 4010481f469SBarry Smith PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 402db4efbfdSBarry Smith { 403db4efbfdSBarry Smith PetscFunctionBegin; 404c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 405719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 406db4efbfdSBarry Smith PetscFunctionReturn(0); 407db4efbfdSBarry Smith } 408db4efbfdSBarry Smith 409db4efbfdSBarry Smith #undef __FUNCT__ 410db4efbfdSBarry Smith #define __FUNCT__ "MatLUFactorSymbolic_SeqDense" 4110481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 412db4efbfdSBarry Smith { 413db4efbfdSBarry Smith PetscFunctionBegin; 414c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 415719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 416db4efbfdSBarry Smith PetscFunctionReturn(0); 417db4efbfdSBarry Smith } 418db4efbfdSBarry Smith 419bb5747d9SMatthew Knepley EXTERN_C_BEGIN 420db4efbfdSBarry Smith #undef __FUNCT__ 421db4efbfdSBarry Smith #define __FUNCT__ "MatGetFactor_seqdense_petsc" 422db4efbfdSBarry Smith PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 423db4efbfdSBarry Smith { 424db4efbfdSBarry Smith PetscErrorCode ierr; 425db4efbfdSBarry Smith 426db4efbfdSBarry Smith PetscFunctionBegin; 427db4efbfdSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,fact);CHKERRQ(ierr); 428db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 429db4efbfdSBarry Smith ierr = MatSetType(*fact,((PetscObject)A)->type_name);CHKERRQ(ierr); 430db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU){ 431db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 432db4efbfdSBarry Smith } else { 433db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 434db4efbfdSBarry Smith } 435d5f3da31SBarry Smith (*fact)->factortype = ftype; 436db4efbfdSBarry Smith PetscFunctionReturn(0); 437db4efbfdSBarry Smith } 438bb5747d9SMatthew Knepley EXTERN_C_END 439db4efbfdSBarry Smith 440289bc588SBarry Smith /* ------------------------------------------------------------------*/ 4414a2ae208SSatish Balay #undef __FUNCT__ 44241f059aeSBarry Smith #define __FUNCT__ "MatSOR_SeqDense" 44341f059aeSBarry Smith PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 444289bc588SBarry Smith { 445c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 44687828ca2SBarry Smith PetscScalar *x,*b,*v = mat->v,zero = 0.0,xt; 447dfbe8321SBarry Smith PetscErrorCode ierr; 448d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 449aa482453SBarry Smith #if !defined(PETSC_USE_COMPLEX) 4500805154bSBarry Smith PetscBLASInt o = 1,bm = PetscBLASIntCast(m); 451bc1b551cSSatish Balay #endif 452289bc588SBarry Smith 4533a40ed3dSBarry Smith PetscFunctionBegin; 454289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 45571044d3cSBarry Smith /* this is a hack fix, should have another version without the second BLASdot */ 4562dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 457289bc588SBarry Smith } 4581ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 4591ebc52fbSHong Zhang ierr = VecGetArray(bb,&b);CHKERRQ(ierr); 460b965ef7fSBarry Smith its = its*lits; 461e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 462289bc588SBarry Smith while (its--) { 463fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 464289bc588SBarry Smith for (i=0; i<m; i++) { 465aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 466f1747703SBarry Smith /* cannot use BLAS dot for complex because compiler/linker is 467f1747703SBarry Smith not happy about returning a double complex */ 46813f74950SBarry Smith PetscInt _i; 46987828ca2SBarry Smith PetscScalar sum = b[i]; 470f1747703SBarry Smith for (_i=0; _i<m; _i++) { 4713f6de6efSSatish Balay sum -= PetscConj(v[i+_i*m])*x[_i]; 472f1747703SBarry Smith } 473f1747703SBarry Smith xt = sum; 474f1747703SBarry Smith #else 47571044d3cSBarry Smith xt = b[i] - BLASdot_(&bm,v+i,&bm,x,&o); 476f1747703SBarry Smith #endif 47755a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 478289bc588SBarry Smith } 479289bc588SBarry Smith } 480fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 481289bc588SBarry Smith for (i=m-1; i>=0; i--) { 482aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 483f1747703SBarry Smith /* cannot use BLAS dot for complex because compiler/linker is 484f1747703SBarry Smith not happy about returning a double complex */ 48513f74950SBarry Smith PetscInt _i; 48687828ca2SBarry Smith PetscScalar sum = b[i]; 487f1747703SBarry Smith for (_i=0; _i<m; _i++) { 4883f6de6efSSatish Balay sum -= PetscConj(v[i+_i*m])*x[_i]; 489f1747703SBarry Smith } 490f1747703SBarry Smith xt = sum; 491f1747703SBarry Smith #else 49271044d3cSBarry Smith xt = b[i] - BLASdot_(&bm,v+i,&bm,x,&o); 493f1747703SBarry Smith #endif 49455a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 495289bc588SBarry Smith } 496289bc588SBarry Smith } 497289bc588SBarry Smith } 4981ebc52fbSHong Zhang ierr = VecRestoreArray(bb,&b);CHKERRQ(ierr); 4991ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5003a40ed3dSBarry Smith PetscFunctionReturn(0); 501289bc588SBarry Smith } 502289bc588SBarry Smith 503289bc588SBarry Smith /* -----------------------------------------------------------------*/ 5044a2ae208SSatish Balay #undef __FUNCT__ 5054a2ae208SSatish Balay #define __FUNCT__ "MatMultTranspose_SeqDense" 506dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 507289bc588SBarry Smith { 508c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 50987828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y; 510dfbe8321SBarry Smith PetscErrorCode ierr; 5110805154bSBarry Smith PetscBLASInt m, n,_One=1; 512ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 5133a40ed3dSBarry Smith 5143a40ed3dSBarry Smith PetscFunctionBegin; 515d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 516d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 517d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 5181ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5191ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 52071044d3cSBarry Smith BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One); 5211ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5221ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 523dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 5243a40ed3dSBarry Smith PetscFunctionReturn(0); 525289bc588SBarry Smith } 526800995b7SMatthew Knepley 5274a2ae208SSatish Balay #undef __FUNCT__ 5284a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqDense" 529dfbe8321SBarry Smith PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 530289bc588SBarry Smith { 531c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 53287828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y,_DOne=1.0,_DZero=0.0; 533dfbe8321SBarry Smith PetscErrorCode ierr; 5340805154bSBarry Smith PetscBLASInt m, n, _One=1; 5353a40ed3dSBarry Smith 5363a40ed3dSBarry Smith PetscFunctionBegin; 537d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 538d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 539d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 5401ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5411ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 54271044d3cSBarry Smith BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One); 5431ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5441ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 545dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 5463a40ed3dSBarry Smith PetscFunctionReturn(0); 547289bc588SBarry Smith } 5486ee01492SSatish Balay 5494a2ae208SSatish Balay #undef __FUNCT__ 5504a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqDense" 551dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 552289bc588SBarry Smith { 553c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 55487828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y,_DOne=1.0; 555dfbe8321SBarry Smith PetscErrorCode ierr; 5560805154bSBarry Smith PetscBLASInt m, n, _One=1; 5573a40ed3dSBarry Smith 5583a40ed3dSBarry Smith PetscFunctionBegin; 559d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 560d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 561d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 562600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 5631ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5641ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 56571044d3cSBarry Smith BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One); 5661ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5671ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 568dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 5693a40ed3dSBarry Smith PetscFunctionReturn(0); 570289bc588SBarry Smith } 5716ee01492SSatish Balay 5724a2ae208SSatish Balay #undef __FUNCT__ 5734a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqDense" 574dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 575289bc588SBarry Smith { 576c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 57787828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y; 578dfbe8321SBarry Smith PetscErrorCode ierr; 5790805154bSBarry Smith PetscBLASInt m, n, _One=1; 58087828ca2SBarry Smith PetscScalar _DOne=1.0; 5813a40ed3dSBarry Smith 5823a40ed3dSBarry Smith PetscFunctionBegin; 583d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 584d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 585d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 586600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 5871ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5881ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 58971044d3cSBarry Smith BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One); 5901ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5911ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 592dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 5933a40ed3dSBarry Smith PetscFunctionReturn(0); 594289bc588SBarry Smith } 595289bc588SBarry Smith 596289bc588SBarry Smith /* -----------------------------------------------------------------*/ 5974a2ae208SSatish Balay #undef __FUNCT__ 5984a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqDense" 59913f74950SBarry Smith PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 600289bc588SBarry Smith { 601c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 60287828ca2SBarry Smith PetscScalar *v; 6036849ba73SBarry Smith PetscErrorCode ierr; 60413f74950SBarry Smith PetscInt i; 60567e560aaSBarry Smith 6063a40ed3dSBarry Smith PetscFunctionBegin; 607d0f46423SBarry Smith *ncols = A->cmap->n; 608289bc588SBarry Smith if (cols) { 609d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscInt),cols);CHKERRQ(ierr); 610d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 611289bc588SBarry Smith } 612289bc588SBarry Smith if (vals) { 613d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscScalar),vals);CHKERRQ(ierr); 614289bc588SBarry Smith v = mat->v + row; 615d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 616289bc588SBarry Smith } 6173a40ed3dSBarry Smith PetscFunctionReturn(0); 618289bc588SBarry Smith } 6196ee01492SSatish Balay 6204a2ae208SSatish Balay #undef __FUNCT__ 6214a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqDense" 62213f74950SBarry Smith PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 623289bc588SBarry Smith { 624dfbe8321SBarry Smith PetscErrorCode ierr; 625606d414cSSatish Balay PetscFunctionBegin; 626606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 627606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 6283a40ed3dSBarry Smith PetscFunctionReturn(0); 629289bc588SBarry Smith } 630289bc588SBarry Smith /* ----------------------------------------------------------------*/ 6314a2ae208SSatish Balay #undef __FUNCT__ 6324a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqDense" 63313f74950SBarry Smith PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 634289bc588SBarry Smith { 635c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 63613f74950SBarry Smith PetscInt i,j,idx=0; 637d6dfbf8fSBarry Smith 6383a40ed3dSBarry Smith PetscFunctionBegin; 63971fd2e92SBarry Smith if (v) PetscValidScalarPointer(v,6); 640289bc588SBarry Smith if (!mat->roworiented) { 641dbb450caSBarry Smith if (addv == INSERT_VALUES) { 642289bc588SBarry Smith for (j=0; j<n; j++) { 643cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 6442515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 645e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 64658804f6dSBarry Smith #endif 647289bc588SBarry Smith for (i=0; i<m; i++) { 648cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 6492515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 650e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 65158804f6dSBarry Smith #endif 652cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 653289bc588SBarry Smith } 654289bc588SBarry Smith } 6553a40ed3dSBarry Smith } else { 656289bc588SBarry Smith for (j=0; j<n; j++) { 657cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 6582515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 659e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 66058804f6dSBarry Smith #endif 661289bc588SBarry Smith for (i=0; i<m; i++) { 662cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 6632515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 664e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 66558804f6dSBarry Smith #endif 666cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 667289bc588SBarry Smith } 668289bc588SBarry Smith } 669289bc588SBarry Smith } 6703a40ed3dSBarry Smith } else { 671dbb450caSBarry Smith if (addv == INSERT_VALUES) { 672e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 673cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 6742515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 675e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 67658804f6dSBarry Smith #endif 677e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 678cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 6792515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 680e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 68158804f6dSBarry Smith #endif 682cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 683e8d4e0b9SBarry Smith } 684e8d4e0b9SBarry Smith } 6853a40ed3dSBarry Smith } else { 686289bc588SBarry Smith for (i=0; i<m; i++) { 687cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 6882515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 689e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 69058804f6dSBarry Smith #endif 691289bc588SBarry Smith for (j=0; j<n; j++) { 692cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 6932515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 694e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 69558804f6dSBarry Smith #endif 696cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 697289bc588SBarry Smith } 698289bc588SBarry Smith } 699289bc588SBarry Smith } 700e8d4e0b9SBarry Smith } 7013a40ed3dSBarry Smith PetscFunctionReturn(0); 702289bc588SBarry Smith } 703e8d4e0b9SBarry Smith 7044a2ae208SSatish Balay #undef __FUNCT__ 7054a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqDense" 70613f74950SBarry Smith PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 707ae80bb75SLois Curfman McInnes { 708ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 70913f74950SBarry Smith PetscInt i,j; 710ae80bb75SLois Curfman McInnes 7113a40ed3dSBarry Smith PetscFunctionBegin; 712ae80bb75SLois Curfman McInnes /* row-oriented output */ 713ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 71497e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 715e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 716ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 7176f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 718e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 71997e567efSBarry Smith *v++ = mat->v[indexn[j]*mat->lda + indexm[i]]; 720ae80bb75SLois Curfman McInnes } 721ae80bb75SLois Curfman McInnes } 7223a40ed3dSBarry Smith PetscFunctionReturn(0); 723ae80bb75SLois Curfman McInnes } 724ae80bb75SLois Curfman McInnes 725289bc588SBarry Smith /* -----------------------------------------------------------------*/ 726289bc588SBarry Smith 7274a2ae208SSatish Balay #undef __FUNCT__ 7285bba2384SShri Abhyankar #define __FUNCT__ "MatLoad_SeqDense" 729112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqDense(Mat newmat,PetscViewer viewer) 730aabbc4fbSShri Abhyankar { 731aabbc4fbSShri Abhyankar Mat_SeqDense *a; 732aabbc4fbSShri Abhyankar PetscErrorCode ierr; 733aabbc4fbSShri Abhyankar PetscInt *scols,i,j,nz,header[4]; 734aabbc4fbSShri Abhyankar int fd; 735aabbc4fbSShri Abhyankar PetscMPIInt size; 736aabbc4fbSShri Abhyankar PetscInt *rowlengths = 0,M,N,*cols,grows,gcols; 737aabbc4fbSShri Abhyankar PetscScalar *vals,*svals,*v,*w; 738aabbc4fbSShri Abhyankar MPI_Comm comm = ((PetscObject)viewer)->comm; 739aabbc4fbSShri Abhyankar 740aabbc4fbSShri Abhyankar PetscFunctionBegin; 741aabbc4fbSShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 742aabbc4fbSShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"view must have one processor"); 743aabbc4fbSShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 744aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 745aabbc4fbSShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not matrix object"); 746aabbc4fbSShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 747aabbc4fbSShri Abhyankar 748aabbc4fbSShri Abhyankar /* set global size if not set already*/ 749aabbc4fbSShri Abhyankar if (newmat->rmap->n < 0 && newmat->rmap->N < 0 && newmat->cmap->n < 0 && newmat->cmap->N < 0) { 750aabbc4fbSShri Abhyankar ierr = MatSetSizes(newmat,M,N,M,N);CHKERRQ(ierr); 751aabbc4fbSShri Abhyankar } else { 752aabbc4fbSShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 753aabbc4fbSShri Abhyankar ierr = MatGetSize(newmat,&grows,&gcols);CHKERRQ(ierr); 754aabbc4fbSShri Abhyankar if (M != grows || N != gcols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,grows,gcols); 755aabbc4fbSShri Abhyankar } 756aabbc4fbSShri Abhyankar ierr = MatSeqDenseSetPreallocation(newmat,PETSC_NULL);CHKERRQ(ierr); 757aabbc4fbSShri Abhyankar 758aabbc4fbSShri Abhyankar if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense */ 759aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 760aabbc4fbSShri Abhyankar v = a->v; 761aabbc4fbSShri Abhyankar /* Allocate some temp space to read in the values and then flip them 762aabbc4fbSShri Abhyankar from row major to column major */ 763aabbc4fbSShri Abhyankar ierr = PetscMalloc((M*N > 0 ? M*N : 1)*sizeof(PetscScalar),&w);CHKERRQ(ierr); 764aabbc4fbSShri Abhyankar /* read in nonzero values */ 765aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,w,M*N,PETSC_SCALAR);CHKERRQ(ierr); 766aabbc4fbSShri Abhyankar /* now flip the values and store them in the matrix*/ 767aabbc4fbSShri Abhyankar for (j=0; j<N; j++) { 768aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 769aabbc4fbSShri Abhyankar *v++ =w[i*N+j]; 770aabbc4fbSShri Abhyankar } 771aabbc4fbSShri Abhyankar } 772aabbc4fbSShri Abhyankar ierr = PetscFree(w);CHKERRQ(ierr); 773aabbc4fbSShri Abhyankar } else { 774aabbc4fbSShri Abhyankar /* read row lengths */ 775aabbc4fbSShri Abhyankar ierr = PetscMalloc((M+1)*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 776aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 777aabbc4fbSShri Abhyankar 778aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 779aabbc4fbSShri Abhyankar v = a->v; 780aabbc4fbSShri Abhyankar 781aabbc4fbSShri Abhyankar /* read column indices and nonzeros */ 782aabbc4fbSShri Abhyankar ierr = PetscMalloc((nz+1)*sizeof(PetscInt),&scols);CHKERRQ(ierr); 783aabbc4fbSShri Abhyankar cols = scols; 784aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,cols,nz,PETSC_INT);CHKERRQ(ierr); 785aabbc4fbSShri Abhyankar ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&svals);CHKERRQ(ierr); 786aabbc4fbSShri Abhyankar vals = svals; 787aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,vals,nz,PETSC_SCALAR);CHKERRQ(ierr); 788aabbc4fbSShri Abhyankar 789aabbc4fbSShri Abhyankar /* insert into matrix */ 790aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 791aabbc4fbSShri Abhyankar for (j=0; j<rowlengths[i]; j++) v[i+M*scols[j]] = svals[j]; 792aabbc4fbSShri Abhyankar svals += rowlengths[i]; scols += rowlengths[i]; 793aabbc4fbSShri Abhyankar } 794aabbc4fbSShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 795aabbc4fbSShri Abhyankar ierr = PetscFree(cols);CHKERRQ(ierr); 796aabbc4fbSShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 797aabbc4fbSShri Abhyankar } 798aabbc4fbSShri Abhyankar ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 799aabbc4fbSShri Abhyankar ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 800aabbc4fbSShri Abhyankar 801aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 802aabbc4fbSShri Abhyankar } 803aabbc4fbSShri Abhyankar 804aabbc4fbSShri Abhyankar #undef __FUNCT__ 8054a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_ASCII" 8066849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 807289bc588SBarry Smith { 808932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 809dfbe8321SBarry Smith PetscErrorCode ierr; 81013f74950SBarry Smith PetscInt i,j; 8112dcb1b2aSMatthew Knepley const char *name; 81287828ca2SBarry Smith PetscScalar *v; 813f3ef73ceSBarry Smith PetscViewerFormat format; 8145f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 815ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 8165f481a85SSatish Balay #endif 817932b0c3eSLois Curfman McInnes 8183a40ed3dSBarry Smith PetscFunctionBegin; 819b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 820456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 8213a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 822fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 823b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 8247566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 825d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 82644cd7ae7SLois Curfman McInnes v = a->v + i; 82777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 828d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 829aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 830329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 831a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i) ",j,PetscRealPart(*v),PetscImaginaryPart(*v));CHKERRQ(ierr); 832329f5518SBarry Smith } else if (PetscRealPart(*v)) { 833a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",j,PetscRealPart(*v));CHKERRQ(ierr); 8346831982aSBarry Smith } 83580cd9d93SLois Curfman McInnes #else 8366831982aSBarry Smith if (*v) { 837a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",j,*v);CHKERRQ(ierr); 8386831982aSBarry Smith } 83980cd9d93SLois Curfman McInnes #endif 8401b807ce4Svictorle v += a->lda; 84180cd9d93SLois Curfman McInnes } 842b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 84380cd9d93SLois Curfman McInnes } 844b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 8453a40ed3dSBarry Smith } else { 846b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 847aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84847989497SBarry Smith /* determine if matrix has all real values */ 84947989497SBarry Smith v = a->v; 850d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 851ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break ;} 85247989497SBarry Smith } 85347989497SBarry Smith #endif 854fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 8553a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 856d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 857d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 858fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 8597566de4bSShri Abhyankar } else { 8607566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 861ffac6cdbSBarry Smith } 862ffac6cdbSBarry Smith 863d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 864932b0c3eSLois Curfman McInnes v = a->v + i; 865d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 866aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 86747989497SBarry Smith if (allreal) { 868f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",PetscRealPart(*v));CHKERRQ(ierr); 86947989497SBarry Smith } else { 870f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16e i ",PetscRealPart(*v),PetscImaginaryPart(*v));CHKERRQ(ierr); 87147989497SBarry Smith } 872289bc588SBarry Smith #else 873f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",*v);CHKERRQ(ierr); 874289bc588SBarry Smith #endif 8751b807ce4Svictorle v += a->lda; 876289bc588SBarry Smith } 877b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 878289bc588SBarry Smith } 879fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 880b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 881ffac6cdbSBarry Smith } 882b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 883da3a660dSBarry Smith } 884b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 8853a40ed3dSBarry Smith PetscFunctionReturn(0); 886289bc588SBarry Smith } 887289bc588SBarry Smith 8884a2ae208SSatish Balay #undef __FUNCT__ 8894a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Binary" 8906849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_Binary(Mat A,PetscViewer viewer) 891932b0c3eSLois Curfman McInnes { 892932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 8936849ba73SBarry Smith PetscErrorCode ierr; 89413f74950SBarry Smith int fd; 895d0f46423SBarry Smith PetscInt ict,j,n = A->cmap->n,m = A->rmap->n,i,*col_lens,nz = m*n; 896f4403165SShri Abhyankar PetscScalar *v,*anonz,*vals; 897f4403165SShri Abhyankar PetscViewerFormat format; 898932b0c3eSLois Curfman McInnes 8993a40ed3dSBarry Smith PetscFunctionBegin; 900b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 90190ace30eSBarry Smith 902f4403165SShri Abhyankar ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 903f4403165SShri Abhyankar if (format == PETSC_VIEWER_NATIVE) { 904f4403165SShri Abhyankar /* store the matrix as a dense matrix */ 905f4403165SShri Abhyankar ierr = PetscMalloc(4*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 906f4403165SShri Abhyankar col_lens[0] = MAT_FILE_CLASSID; 907f4403165SShri Abhyankar col_lens[1] = m; 908f4403165SShri Abhyankar col_lens[2] = n; 909f4403165SShri Abhyankar col_lens[3] = MATRIX_BINARY_FORMAT_DENSE; 910f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,col_lens,4,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 911f4403165SShri Abhyankar ierr = PetscFree(col_lens);CHKERRQ(ierr); 912f4403165SShri Abhyankar 913f4403165SShri Abhyankar /* write out matrix, by rows */ 914f4403165SShri Abhyankar ierr = PetscMalloc((m*n+1)*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 915f4403165SShri Abhyankar v = a->v; 916f4403165SShri Abhyankar for (j=0; j<n; j++) { 917f4403165SShri Abhyankar for (i=0; i<m; i++) { 918f4403165SShri Abhyankar vals[j + i*n] = *v++; 919f4403165SShri Abhyankar } 920f4403165SShri Abhyankar } 921f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,vals,n*m,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 922f4403165SShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 923f4403165SShri Abhyankar } else { 92413f74950SBarry Smith ierr = PetscMalloc((4+nz)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 9250700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 926932b0c3eSLois Curfman McInnes col_lens[1] = m; 927932b0c3eSLois Curfman McInnes col_lens[2] = n; 928932b0c3eSLois Curfman McInnes col_lens[3] = nz; 929932b0c3eSLois Curfman McInnes 930932b0c3eSLois Curfman McInnes /* store lengths of each row and write (including header) to file */ 931932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) col_lens[4+i] = n; 9326f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+m,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 933932b0c3eSLois Curfman McInnes 934932b0c3eSLois Curfman McInnes /* Possibly should write in smaller increments, not whole matrix at once? */ 935932b0c3eSLois Curfman McInnes /* store column indices (zero start index) */ 936932b0c3eSLois Curfman McInnes ict = 0; 937932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 938932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) col_lens[ict++] = j; 939932b0c3eSLois Curfman McInnes } 9406f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 941606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 942932b0c3eSLois Curfman McInnes 943932b0c3eSLois Curfman McInnes /* store nonzero values */ 94487828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&anonz);CHKERRQ(ierr); 945932b0c3eSLois Curfman McInnes ict = 0; 946932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 947932b0c3eSLois Curfman McInnes v = a->v + i; 948932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) { 9491b807ce4Svictorle anonz[ict++] = *v; v += a->lda; 950932b0c3eSLois Curfman McInnes } 951932b0c3eSLois Curfman McInnes } 9526f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,anonz,nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 953606d414cSSatish Balay ierr = PetscFree(anonz);CHKERRQ(ierr); 954f4403165SShri Abhyankar } 9553a40ed3dSBarry Smith PetscFunctionReturn(0); 956932b0c3eSLois Curfman McInnes } 957932b0c3eSLois Curfman McInnes 9584a2ae208SSatish Balay #undef __FUNCT__ 9594a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Draw_Zoom" 960dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 961f1af5d2fSBarry Smith { 962f1af5d2fSBarry Smith Mat A = (Mat) Aa; 963f1af5d2fSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 9646849ba73SBarry Smith PetscErrorCode ierr; 965d0f46423SBarry Smith PetscInt m = A->rmap->n,n = A->cmap->n,color,i,j; 96687828ca2SBarry Smith PetscScalar *v = a->v; 967b0a32e0cSBarry Smith PetscViewer viewer; 968b0a32e0cSBarry Smith PetscDraw popup; 969329f5518SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,scale,maxv = 0.0; 970f3ef73ceSBarry Smith PetscViewerFormat format; 971f1af5d2fSBarry Smith 972f1af5d2fSBarry Smith PetscFunctionBegin; 973f1af5d2fSBarry Smith 974f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 975b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 976b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 977f1af5d2fSBarry Smith 978f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 979fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 980f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 981b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 982f1af5d2fSBarry Smith for(j = 0; j < n; j++) { 983f1af5d2fSBarry Smith x_l = j; 984f1af5d2fSBarry Smith x_r = x_l + 1.0; 985f1af5d2fSBarry Smith for(i = 0; i < m; i++) { 986f1af5d2fSBarry Smith y_l = m - i - 1.0; 987f1af5d2fSBarry Smith y_r = y_l + 1.0; 988f1af5d2fSBarry Smith #if defined(PETSC_USE_COMPLEX) 989329f5518SBarry Smith if (PetscRealPart(v[j*m+i]) > 0.) { 990b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 991329f5518SBarry Smith } else if (PetscRealPart(v[j*m+i]) < 0.) { 992b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 993f1af5d2fSBarry Smith } else { 994f1af5d2fSBarry Smith continue; 995f1af5d2fSBarry Smith } 996f1af5d2fSBarry Smith #else 997f1af5d2fSBarry Smith if (v[j*m+i] > 0.) { 998b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 999f1af5d2fSBarry Smith } else if (v[j*m+i] < 0.) { 1000b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1001f1af5d2fSBarry Smith } else { 1002f1af5d2fSBarry Smith continue; 1003f1af5d2fSBarry Smith } 1004f1af5d2fSBarry Smith #endif 1005b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1006f1af5d2fSBarry Smith } 1007f1af5d2fSBarry Smith } 1008f1af5d2fSBarry Smith } else { 1009f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1010f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1011f1af5d2fSBarry Smith for(i = 0; i < m*n; i++) { 1012f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1013f1af5d2fSBarry Smith } 1014b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 1015b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 1016b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 1017f1af5d2fSBarry Smith for(j = 0; j < n; j++) { 1018f1af5d2fSBarry Smith x_l = j; 1019f1af5d2fSBarry Smith x_r = x_l + 1.0; 1020f1af5d2fSBarry Smith for(i = 0; i < m; i++) { 1021f1af5d2fSBarry Smith y_l = m - i - 1.0; 1022f1af5d2fSBarry Smith y_r = y_l + 1.0; 1023b0a32e0cSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (int)(scale*PetscAbsScalar(v[j*m+i])); 1024b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1025f1af5d2fSBarry Smith } 1026f1af5d2fSBarry Smith } 1027f1af5d2fSBarry Smith } 1028f1af5d2fSBarry Smith PetscFunctionReturn(0); 1029f1af5d2fSBarry Smith } 1030f1af5d2fSBarry Smith 10314a2ae208SSatish Balay #undef __FUNCT__ 10324a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Draw" 1033dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1034f1af5d2fSBarry Smith { 1035b0a32e0cSBarry Smith PetscDraw draw; 1036ace3abfcSBarry Smith PetscBool isnull; 1037329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1038dfbe8321SBarry Smith PetscErrorCode ierr; 1039f1af5d2fSBarry Smith 1040f1af5d2fSBarry Smith PetscFunctionBegin; 1041b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1042b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1043abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1044f1af5d2fSBarry Smith 1045f1af5d2fSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1046d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1047f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1048b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1049b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 1050f1af5d2fSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 1051f1af5d2fSBarry Smith PetscFunctionReturn(0); 1052f1af5d2fSBarry Smith } 1053f1af5d2fSBarry Smith 10544a2ae208SSatish Balay #undef __FUNCT__ 10554a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense" 1056dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1057932b0c3eSLois Curfman McInnes { 1058dfbe8321SBarry Smith PetscErrorCode ierr; 1059ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1060932b0c3eSLois Curfman McInnes 10613a40ed3dSBarry Smith PetscFunctionBegin; 10622692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 10632692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 10642692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 10650f5bd95cSBarry Smith 1066c45a1595SBarry Smith if (iascii) { 1067c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 10680f5bd95cSBarry Smith } else if (isbinary) { 10693a40ed3dSBarry Smith ierr = MatView_SeqDense_Binary(A,viewer);CHKERRQ(ierr); 1070f1af5d2fSBarry Smith } else if (isdraw) { 1071f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 10725cd90555SBarry Smith } else { 1073e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Viewer type %s not supported by dense matrix",((PetscObject)viewer)->type_name); 1074932b0c3eSLois Curfman McInnes } 10753a40ed3dSBarry Smith PetscFunctionReturn(0); 1076932b0c3eSLois Curfman McInnes } 1077289bc588SBarry Smith 10784a2ae208SSatish Balay #undef __FUNCT__ 10794a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_SeqDense" 1080dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqDense(Mat mat) 1081289bc588SBarry Smith { 1082ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1083dfbe8321SBarry Smith PetscErrorCode ierr; 108490f02eecSBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 1086aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1087d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1088a5a9c739SBarry Smith #endif 108905b42c5fSBarry Smith ierr = PetscFree(l->pivots);CHKERRQ(ierr); 10906857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1091606d414cSSatish Balay ierr = PetscFree(l);CHKERRQ(ierr); 1092dbd8c25aSHong Zhang 1093dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 1094901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatSeqDenseSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 10954ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMult_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10964ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMultSymbolic_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10974ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMultNumeric_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10983a40ed3dSBarry Smith PetscFunctionReturn(0); 1099289bc588SBarry Smith } 1100289bc588SBarry Smith 11014a2ae208SSatish Balay #undef __FUNCT__ 11024a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqDense" 1103fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1104289bc588SBarry Smith { 1105c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 11066849ba73SBarry Smith PetscErrorCode ierr; 110713f74950SBarry Smith PetscInt k,j,m,n,M; 110887828ca2SBarry Smith PetscScalar *v,tmp; 110948b35521SBarry Smith 11103a40ed3dSBarry Smith PetscFunctionBegin; 1111d0f46423SBarry Smith v = mat->v; m = A->rmap->n; M = mat->lda; n = A->cmap->n; 1112e9695a30SBarry Smith if (reuse == MAT_REUSE_MATRIX && *matout == A) { /* in place transpose */ 1113e7e72b3dSBarry Smith if (m != n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Can not transpose non-square matrix in place"); 1114e7e72b3dSBarry Smith else { 1115d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1116289bc588SBarry Smith for (k=0; k<j; k++) { 11171b807ce4Svictorle tmp = v[j + k*M]; 11181b807ce4Svictorle v[j + k*M] = v[k + j*M]; 11191b807ce4Svictorle v[k + j*M] = tmp; 1120289bc588SBarry Smith } 1121289bc588SBarry Smith } 1122d64ed03dSBarry Smith } 11233a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1124d3e5ee88SLois Curfman McInnes Mat tmat; 1125ec8511deSBarry Smith Mat_SeqDense *tmatd; 112687828ca2SBarry Smith PetscScalar *v2; 1127ea709b57SSatish Balay 1128fc4dec0aSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 11297adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&tmat);CHKERRQ(ierr); 1130d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 11317adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 11325c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(tmat,PETSC_NULL);CHKERRQ(ierr); 1133fc4dec0aSBarry Smith } else { 1134fc4dec0aSBarry Smith tmat = *matout; 1135fc4dec0aSBarry Smith } 1136ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 11370de55854SLois Curfman McInnes v = mat->v; v2 = tmatd->v; 1138d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 11391b807ce4Svictorle for (k=0; k<m; k++) v2[j + k*n] = v[k + j*M]; 1140d3e5ee88SLois Curfman McInnes } 11416d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 11426d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1143d3e5ee88SLois Curfman McInnes *matout = tmat; 114448b35521SBarry Smith } 11453a40ed3dSBarry Smith PetscFunctionReturn(0); 1146289bc588SBarry Smith } 1147289bc588SBarry Smith 11484a2ae208SSatish Balay #undef __FUNCT__ 11494a2ae208SSatish Balay #define __FUNCT__ "MatEqual_SeqDense" 1150ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1151289bc588SBarry Smith { 1152c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1153c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 115413f74950SBarry Smith PetscInt i,j; 115587828ca2SBarry Smith PetscScalar *v1 = mat1->v,*v2 = mat2->v; 11569ea5d5aeSSatish Balay 11573a40ed3dSBarry Smith PetscFunctionBegin; 1158d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1159d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1160d0f46423SBarry Smith for (i=0; i<A1->rmap->n; i++) { 11611b807ce4Svictorle v1 = mat1->v+i; v2 = mat2->v+i; 1162d0f46423SBarry Smith for (j=0; j<A1->cmap->n; j++) { 11633a40ed3dSBarry Smith if (*v1 != *v2) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 11641b807ce4Svictorle v1 += mat1->lda; v2 += mat2->lda; 11651b807ce4Svictorle } 1166289bc588SBarry Smith } 116777c4ece6SBarry Smith *flg = PETSC_TRUE; 11683a40ed3dSBarry Smith PetscFunctionReturn(0); 1169289bc588SBarry Smith } 1170289bc588SBarry Smith 11714a2ae208SSatish Balay #undef __FUNCT__ 11724a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqDense" 1173dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1174289bc588SBarry Smith { 1175c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1176dfbe8321SBarry Smith PetscErrorCode ierr; 117713f74950SBarry Smith PetscInt i,n,len; 117887828ca2SBarry Smith PetscScalar *x,zero = 0.0; 117944cd7ae7SLois Curfman McInnes 11803a40ed3dSBarry Smith PetscFunctionBegin; 11812dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 11827a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 11831ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1184d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1185e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 118644cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 11871b807ce4Svictorle x[i] = mat->v[i*mat->lda + i]; 1188289bc588SBarry Smith } 11891ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 11903a40ed3dSBarry Smith PetscFunctionReturn(0); 1191289bc588SBarry Smith } 1192289bc588SBarry Smith 11934a2ae208SSatish Balay #undef __FUNCT__ 11944a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqDense" 1195dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1196289bc588SBarry Smith { 1197c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 119887828ca2SBarry Smith PetscScalar *l,*r,x,*v; 1199dfbe8321SBarry Smith PetscErrorCode ierr; 1200d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 120155659b69SBarry Smith 12023a40ed3dSBarry Smith PetscFunctionBegin; 120328988994SBarry Smith if (ll) { 12047a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 12051ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 1206e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1207da3a660dSBarry Smith for (i=0; i<m; i++) { 1208da3a660dSBarry Smith x = l[i]; 1209da3a660dSBarry Smith v = mat->v + i; 1210da3a660dSBarry Smith for (j=0; j<n; j++) { (*v) *= x; v+= m;} 1211da3a660dSBarry Smith } 12121ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 1213efee365bSSatish Balay ierr = PetscLogFlops(n*m);CHKERRQ(ierr); 1214da3a660dSBarry Smith } 121528988994SBarry Smith if (rr) { 12167a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 12171ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 1218e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1219da3a660dSBarry Smith for (i=0; i<n; i++) { 1220da3a660dSBarry Smith x = r[i]; 1221da3a660dSBarry Smith v = mat->v + i*m; 1222da3a660dSBarry Smith for (j=0; j<m; j++) { (*v++) *= x;} 1223da3a660dSBarry Smith } 12241ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 1225efee365bSSatish Balay ierr = PetscLogFlops(n*m);CHKERRQ(ierr); 1226da3a660dSBarry Smith } 12273a40ed3dSBarry Smith PetscFunctionReturn(0); 1228289bc588SBarry Smith } 1229289bc588SBarry Smith 12304a2ae208SSatish Balay #undef __FUNCT__ 12314a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqDense" 1232dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1233289bc588SBarry Smith { 1234c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 123587828ca2SBarry Smith PetscScalar *v = mat->v; 1236329f5518SBarry Smith PetscReal sum = 0.0; 1237d0f46423SBarry Smith PetscInt lda=mat->lda,m=A->rmap->n,i,j; 1238efee365bSSatish Balay PetscErrorCode ierr; 123955659b69SBarry Smith 12403a40ed3dSBarry Smith PetscFunctionBegin; 1241289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1242a5ce6ee0Svictorle if (lda>m) { 1243d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1244a5ce6ee0Svictorle v = mat->v+j*lda; 1245a5ce6ee0Svictorle for (i=0; i<m; i++) { 1246a5ce6ee0Svictorle #if defined(PETSC_USE_COMPLEX) 1247a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1248a5ce6ee0Svictorle #else 1249a5ce6ee0Svictorle sum += (*v)*(*v); v++; 1250a5ce6ee0Svictorle #endif 1251a5ce6ee0Svictorle } 1252a5ce6ee0Svictorle } 1253a5ce6ee0Svictorle } else { 1254d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1255aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1256329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1257289bc588SBarry Smith #else 1258289bc588SBarry Smith sum += (*v)*(*v); v++; 1259289bc588SBarry Smith #endif 1260289bc588SBarry Smith } 1261a5ce6ee0Svictorle } 1262064f8208SBarry Smith *nrm = sqrt(sum); 1263dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 12643a40ed3dSBarry Smith } else if (type == NORM_1) { 1265064f8208SBarry Smith *nrm = 0.0; 1266d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 12671b807ce4Svictorle v = mat->v + j*mat->lda; 1268289bc588SBarry Smith sum = 0.0; 1269d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 127033a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1271289bc588SBarry Smith } 1272064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1273289bc588SBarry Smith } 1274d0f46423SBarry Smith ierr = PetscLogFlops(A->cmap->n*A->rmap->n);CHKERRQ(ierr); 12753a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1276064f8208SBarry Smith *nrm = 0.0; 1277d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1278289bc588SBarry Smith v = mat->v + j; 1279289bc588SBarry Smith sum = 0.0; 1280d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 12811b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1282289bc588SBarry Smith } 1283064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1284289bc588SBarry Smith } 1285d0f46423SBarry Smith ierr = PetscLogFlops(A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1286e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 12873a40ed3dSBarry Smith PetscFunctionReturn(0); 1288289bc588SBarry Smith } 1289289bc588SBarry Smith 12904a2ae208SSatish Balay #undef __FUNCT__ 12914a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqDense" 1292ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1293289bc588SBarry Smith { 1294c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 129563ba0a88SBarry Smith PetscErrorCode ierr; 129667e560aaSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298b5a2b587SKris Buschelman switch (op) { 1299b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 13004e0d8c25SBarry Smith aij->roworiented = flg; 1301b5a2b587SKris Buschelman break; 1302512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1303b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13043971808eSMatthew Knepley case MAT_NEW_NONZERO_ALLOCATION_ERR: 13054e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1306b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1307b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 130877e54ba9SKris Buschelman case MAT_SYMMETRIC: 130977e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 13109a4540c5SBarry Smith case MAT_HERMITIAN: 13119a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 1312600fe468SBarry Smith case MAT_IGNORE_LOWER_TRIANGULAR: 1313290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 131477e54ba9SKris Buschelman break; 1315b5a2b587SKris Buschelman default: 1316e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 13173a40ed3dSBarry Smith } 13183a40ed3dSBarry Smith PetscFunctionReturn(0); 1319289bc588SBarry Smith } 1320289bc588SBarry Smith 13214a2ae208SSatish Balay #undef __FUNCT__ 13224a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqDense" 1323dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqDense(Mat A) 13246f0a148fSBarry Smith { 1325ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 13266849ba73SBarry Smith PetscErrorCode ierr; 1327d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 13283a40ed3dSBarry Smith 13293a40ed3dSBarry Smith PetscFunctionBegin; 1330a5ce6ee0Svictorle if (lda>m) { 1331d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1332a5ce6ee0Svictorle ierr = PetscMemzero(l->v+j*lda,m*sizeof(PetscScalar));CHKERRQ(ierr); 1333a5ce6ee0Svictorle } 1334a5ce6ee0Svictorle } else { 1335d0f46423SBarry Smith ierr = PetscMemzero(l->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 1336a5ce6ee0Svictorle } 13373a40ed3dSBarry Smith PetscFunctionReturn(0); 13386f0a148fSBarry Smith } 13396f0a148fSBarry Smith 13404a2ae208SSatish Balay #undef __FUNCT__ 13414a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqDense" 1342*2b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 13436f0a148fSBarry Smith { 1344ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1345d0f46423SBarry Smith PetscInt n = A->cmap->n,i,j; 134687828ca2SBarry Smith PetscScalar *slot; 134755659b69SBarry Smith 13483a40ed3dSBarry Smith PetscFunctionBegin; 13496f0a148fSBarry Smith for (i=0; i<N; i++) { 13506f0a148fSBarry Smith slot = l->v + rows[i]; 13516f0a148fSBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += n;} 13526f0a148fSBarry Smith } 1353f4df32b1SMatthew Knepley if (diag != 0.0) { 13546f0a148fSBarry Smith for (i=0; i<N; i++) { 13556f0a148fSBarry Smith slot = l->v + (n+1)*rows[i]; 1356f4df32b1SMatthew Knepley *slot = diag; 13576f0a148fSBarry Smith } 13586f0a148fSBarry Smith } 13593a40ed3dSBarry Smith PetscFunctionReturn(0); 13606f0a148fSBarry Smith } 1361557bce09SLois Curfman McInnes 13624a2ae208SSatish Balay #undef __FUNCT__ 13634a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqDense" 1364dfbe8321SBarry Smith PetscErrorCode MatGetArray_SeqDense(Mat A,PetscScalar *array[]) 136564e87e97SBarry Smith { 1366c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 13673a40ed3dSBarry Smith 13683a40ed3dSBarry Smith PetscFunctionBegin; 1369e32f2f54SBarry Smith if (mat->lda != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot get array for Dense matrices with LDA different from number of rows"); 137064e87e97SBarry Smith *array = mat->v; 13713a40ed3dSBarry Smith PetscFunctionReturn(0); 137264e87e97SBarry Smith } 13730754003eSLois Curfman McInnes 13744a2ae208SSatish Balay #undef __FUNCT__ 13754a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqDense" 1376dfbe8321SBarry Smith PetscErrorCode MatRestoreArray_SeqDense(Mat A,PetscScalar *array[]) 1377ff14e315SSatish Balay { 13783a40ed3dSBarry Smith PetscFunctionBegin; 137909b544d4SBarry Smith *array = 0; /* user cannot accidently use the array later */ 13803a40ed3dSBarry Smith PetscFunctionReturn(0); 1381ff14e315SSatish Balay } 13820754003eSLois Curfman McInnes 13834a2ae208SSatish Balay #undef __FUNCT__ 13844a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqDense" 138513f74950SBarry Smith static PetscErrorCode MatGetSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 13860754003eSLois Curfman McInnes { 1387c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 13886849ba73SBarry Smith PetscErrorCode ierr; 13895d0c19d7SBarry Smith PetscInt i,j,nrows,ncols; 13905d0c19d7SBarry Smith const PetscInt *irow,*icol; 139187828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 13920754003eSLois Curfman McInnes Mat newmat; 13930754003eSLois Curfman McInnes 13943a40ed3dSBarry Smith PetscFunctionBegin; 139578b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 139678b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 1397e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 1398e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 13990754003eSLois Curfman McInnes 1400182d2002SSatish Balay /* Check submatrixcall */ 1401182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 140213f74950SBarry Smith PetscInt n_cols,n_rows; 1403182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 140421a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 140521a2c019SBarry Smith /* resize the result result matrix to match number of requested rows/columns */ 1406c61587bbSBarry Smith ierr = MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 140721a2c019SBarry Smith } 1408182d2002SSatish Balay newmat = *B; 1409182d2002SSatish Balay } else { 14100754003eSLois Curfman McInnes /* Create and fill new matrix */ 14117adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&newmat);CHKERRQ(ierr); 1412f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 14137adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 14145c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(newmat,PETSC_NULL);CHKERRQ(ierr); 1415182d2002SSatish Balay } 1416182d2002SSatish Balay 1417182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 1418182d2002SSatish Balay bv = ((Mat_SeqDense*)newmat->data)->v; 1419182d2002SSatish Balay 1420182d2002SSatish Balay for (i=0; i<ncols; i++) { 14216de62eeeSBarry Smith av = v + mat->lda*icol[i]; 1422182d2002SSatish Balay for (j=0; j<nrows; j++) { 1423182d2002SSatish Balay *bv++ = av[irow[j]]; 14240754003eSLois Curfman McInnes } 14250754003eSLois Curfman McInnes } 1426182d2002SSatish Balay 1427182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 14286d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14296d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14300754003eSLois Curfman McInnes 14310754003eSLois Curfman McInnes /* Free work space */ 143278b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 143378b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 1434182d2002SSatish Balay *B = newmat; 14353a40ed3dSBarry Smith PetscFunctionReturn(0); 14360754003eSLois Curfman McInnes } 14370754003eSLois Curfman McInnes 14384a2ae208SSatish Balay #undef __FUNCT__ 14394a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqDense" 144013f74950SBarry Smith PetscErrorCode MatGetSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 1441905e6a2fSBarry Smith { 14426849ba73SBarry Smith PetscErrorCode ierr; 144313f74950SBarry Smith PetscInt i; 1444905e6a2fSBarry Smith 14453a40ed3dSBarry Smith PetscFunctionBegin; 1446905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 1447b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 1448905e6a2fSBarry Smith } 1449905e6a2fSBarry Smith 1450905e6a2fSBarry Smith for (i=0; i<n; i++) { 14516a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 1452905e6a2fSBarry Smith } 14533a40ed3dSBarry Smith PetscFunctionReturn(0); 1454905e6a2fSBarry Smith } 1455905e6a2fSBarry Smith 14564a2ae208SSatish Balay #undef __FUNCT__ 1457c0aa2d19SHong Zhang #define __FUNCT__ "MatAssemblyBegin_SeqDense" 1458c0aa2d19SHong Zhang PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 1459c0aa2d19SHong Zhang { 1460c0aa2d19SHong Zhang PetscFunctionBegin; 1461c0aa2d19SHong Zhang PetscFunctionReturn(0); 1462c0aa2d19SHong Zhang } 1463c0aa2d19SHong Zhang 1464c0aa2d19SHong Zhang #undef __FUNCT__ 1465c0aa2d19SHong Zhang #define __FUNCT__ "MatAssemblyEnd_SeqDense" 1466c0aa2d19SHong Zhang PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 1467c0aa2d19SHong Zhang { 1468c0aa2d19SHong Zhang PetscFunctionBegin; 1469c0aa2d19SHong Zhang PetscFunctionReturn(0); 1470c0aa2d19SHong Zhang } 1471c0aa2d19SHong Zhang 1472c0aa2d19SHong Zhang #undef __FUNCT__ 14734a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqDense" 1474dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 14754b0e389bSBarry Smith { 14764b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense *)B->data; 14776849ba73SBarry Smith PetscErrorCode ierr; 1478d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 14793a40ed3dSBarry Smith 14803a40ed3dSBarry Smith PetscFunctionBegin; 148133f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. */ 148233f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 1483cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 14843a40ed3dSBarry Smith PetscFunctionReturn(0); 14853a40ed3dSBarry Smith } 1486e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 1487a5ce6ee0Svictorle if (lda1>m || lda2>m) { 14880dbb7854Svictorle for (j=0; j<n; j++) { 1489a5ce6ee0Svictorle ierr = PetscMemcpy(b->v+j*lda2,a->v+j*lda1,m*sizeof(PetscScalar));CHKERRQ(ierr); 1490a5ce6ee0Svictorle } 1491a5ce6ee0Svictorle } else { 1492d0f46423SBarry Smith ierr = PetscMemcpy(b->v,a->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 1493a5ce6ee0Svictorle } 1494273d9f13SBarry Smith PetscFunctionReturn(0); 1495273d9f13SBarry Smith } 1496273d9f13SBarry Smith 14974a2ae208SSatish Balay #undef __FUNCT__ 14984a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqDense" 1499dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqDense(Mat A) 1500273d9f13SBarry Smith { 1501dfbe8321SBarry Smith PetscErrorCode ierr; 1502273d9f13SBarry Smith 1503273d9f13SBarry Smith PetscFunctionBegin; 1504273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 15053a40ed3dSBarry Smith PetscFunctionReturn(0); 15064b0e389bSBarry Smith } 15074b0e389bSBarry Smith 1508284134d9SBarry Smith #undef __FUNCT__ 1509284134d9SBarry Smith #define __FUNCT__ "MatSetSizes_SeqDense" 1510284134d9SBarry Smith PetscErrorCode MatSetSizes_SeqDense(Mat A,PetscInt m,PetscInt n,PetscInt M,PetscInt N) 1511284134d9SBarry Smith { 1512284134d9SBarry Smith PetscFunctionBegin; 151321a2c019SBarry Smith /* this will not be called before lda, Mmax, and Nmax have been set */ 1514284134d9SBarry Smith m = PetscMax(m,M); 1515284134d9SBarry Smith n = PetscMax(n,N); 1516a868139aSShri Abhyankar 151786d161a7SShri Abhyankar /* if (m > a->Mmax) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot yet resize number rows of dense matrix larger then its initial size %d, requested %d",a->lda,(int)m); 151886d161a7SShri Abhyankar if (n > a->Nmax) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot yet resize number columns of dense matrix larger then its initial size %d, requested %d",a->Nmax,(int)n); 151986d161a7SShri Abhyankar */ 1520dc5cefdeSJed Brown A->rmap->n = A->rmap->N = m; 1521d0f46423SBarry Smith A->cmap->n = A->cmap->N = n; 1522284134d9SBarry Smith PetscFunctionReturn(0); 1523284134d9SBarry Smith } 1524170fe5c8SBarry Smith 1525ba337c44SJed Brown #undef __FUNCT__ 1526ba337c44SJed Brown #define __FUNCT__ "MatConjugate_SeqDense" 1527ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 1528ba337c44SJed Brown { 1529ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1530ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1531ba337c44SJed Brown PetscScalar *aa = a->v; 1532ba337c44SJed Brown 1533ba337c44SJed Brown PetscFunctionBegin; 1534ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 1535ba337c44SJed Brown PetscFunctionReturn(0); 1536ba337c44SJed Brown } 1537ba337c44SJed Brown 1538ba337c44SJed Brown #undef __FUNCT__ 1539ba337c44SJed Brown #define __FUNCT__ "MatRealPart_SeqDense" 1540ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 1541ba337c44SJed Brown { 1542ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1543ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1544ba337c44SJed Brown PetscScalar *aa = a->v; 1545ba337c44SJed Brown 1546ba337c44SJed Brown PetscFunctionBegin; 1547ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 1548ba337c44SJed Brown PetscFunctionReturn(0); 1549ba337c44SJed Brown } 1550ba337c44SJed Brown 1551ba337c44SJed Brown #undef __FUNCT__ 1552ba337c44SJed Brown #define __FUNCT__ "MatImaginaryPart_SeqDense" 1553ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 1554ba337c44SJed Brown { 1555ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1556ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1557ba337c44SJed Brown PetscScalar *aa = a->v; 1558ba337c44SJed Brown 1559ba337c44SJed Brown PetscFunctionBegin; 1560ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 1561ba337c44SJed Brown PetscFunctionReturn(0); 1562ba337c44SJed Brown } 1563284134d9SBarry Smith 1564a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 1565a9fe9ddaSSatish Balay #undef __FUNCT__ 1566a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMult_SeqDense_SeqDense" 1567a9fe9ddaSSatish Balay PetscErrorCode MatMatMult_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 1568a9fe9ddaSSatish Balay { 1569a9fe9ddaSSatish Balay PetscErrorCode ierr; 1570a9fe9ddaSSatish Balay 1571a9fe9ddaSSatish Balay PetscFunctionBegin; 1572a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX){ 1573a9fe9ddaSSatish Balay ierr = MatMatMultSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 1574a9fe9ddaSSatish Balay } 1575a9fe9ddaSSatish Balay ierr = MatMatMultNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 1576a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1577a9fe9ddaSSatish Balay } 1578a9fe9ddaSSatish Balay 1579a9fe9ddaSSatish Balay #undef __FUNCT__ 1580a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultSymbolic_SeqDense_SeqDense" 1581a9fe9ddaSSatish Balay PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 1582a9fe9ddaSSatish Balay { 1583ee16a9a1SHong Zhang PetscErrorCode ierr; 1584d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 1585ee16a9a1SHong Zhang Mat Cmat; 1586a9fe9ddaSSatish Balay 1587ee16a9a1SHong Zhang PetscFunctionBegin; 1588e32f2f54SBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %d != B->rmap->n %d\n",A->cmap->n,B->rmap->n); 1589ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 1590ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 1591ee16a9a1SHong Zhang ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 1592ee16a9a1SHong Zhang ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 1593ee16a9a1SHong Zhang Cmat->assembled = PETSC_TRUE; 1594ee16a9a1SHong Zhang *C = Cmat; 1595ee16a9a1SHong Zhang PetscFunctionReturn(0); 1596ee16a9a1SHong Zhang } 1597a9fe9ddaSSatish Balay 159898a3b096SSatish Balay #undef __FUNCT__ 1599a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultNumeric_SeqDense_SeqDense" 1600a9fe9ddaSSatish Balay PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 1601a9fe9ddaSSatish Balay { 1602a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1603a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 1604a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 16050805154bSBarry Smith PetscBLASInt m,n,k; 1606a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 1607a9fe9ddaSSatish Balay 1608a9fe9ddaSSatish Balay PetscFunctionBegin; 1609d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 1610d0f46423SBarry Smith n = PetscBLASIntCast(B->cmap->n); 1611d0f46423SBarry Smith k = PetscBLASIntCast(A->cmap->n); 1612a9fe9ddaSSatish Balay BLASgemm_("N","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda); 1613a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1614a9fe9ddaSSatish Balay } 1615a9fe9ddaSSatish Balay 1616a9fe9ddaSSatish Balay #undef __FUNCT__ 1617a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTranspose_SeqDense_SeqDense" 1618a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTranspose_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 1619a9fe9ddaSSatish Balay { 1620a9fe9ddaSSatish Balay PetscErrorCode ierr; 1621a9fe9ddaSSatish Balay 1622a9fe9ddaSSatish Balay PetscFunctionBegin; 1623a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX){ 1624a9fe9ddaSSatish Balay ierr = MatMatMultTransposeSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 1625a9fe9ddaSSatish Balay } 1626a9fe9ddaSSatish Balay ierr = MatMatMultTransposeNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 1627a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1628a9fe9ddaSSatish Balay } 1629a9fe9ddaSSatish Balay 1630a9fe9ddaSSatish Balay #undef __FUNCT__ 1631a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTransposeSymbolic_SeqDense_SeqDense" 1632a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTransposeSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 1633a9fe9ddaSSatish Balay { 1634ee16a9a1SHong Zhang PetscErrorCode ierr; 1635d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 1636ee16a9a1SHong Zhang Mat Cmat; 1637a9fe9ddaSSatish Balay 1638ee16a9a1SHong Zhang PetscFunctionBegin; 1639e32f2f54SBarry Smith if (A->rmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->rmap->n %d != B->rmap->n %d\n",A->rmap->n,B->rmap->n); 1640ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 1641ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 1642ee16a9a1SHong Zhang ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 1643ee16a9a1SHong Zhang ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 1644ee16a9a1SHong Zhang Cmat->assembled = PETSC_TRUE; 1645ee16a9a1SHong Zhang *C = Cmat; 1646ee16a9a1SHong Zhang PetscFunctionReturn(0); 1647ee16a9a1SHong Zhang } 1648a9fe9ddaSSatish Balay 1649a9fe9ddaSSatish Balay #undef __FUNCT__ 1650a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTransposeNumeric_SeqDense_SeqDense" 1651a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTransposeNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 1652a9fe9ddaSSatish Balay { 1653a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1654a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 1655a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 16560805154bSBarry Smith PetscBLASInt m,n,k; 1657a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 1658a9fe9ddaSSatish Balay 1659a9fe9ddaSSatish Balay PetscFunctionBegin; 1660d0f46423SBarry Smith m = PetscBLASIntCast(A->cmap->n); 1661d0f46423SBarry Smith n = PetscBLASIntCast(B->cmap->n); 1662d0f46423SBarry Smith k = PetscBLASIntCast(A->rmap->n); 16632fbe02b9SBarry Smith /* 16642fbe02b9SBarry Smith Note the m and n arguments below are the number rows and columns of A', not A! 16652fbe02b9SBarry Smith */ 1666a9fe9ddaSSatish Balay BLASgemm_("T","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda); 1667a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1668a9fe9ddaSSatish Balay } 1669985db425SBarry Smith 1670985db425SBarry Smith #undef __FUNCT__ 1671985db425SBarry Smith #define __FUNCT__ "MatGetRowMax_SeqDense" 1672985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 1673985db425SBarry Smith { 1674985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1675985db425SBarry Smith PetscErrorCode ierr; 1676d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1677985db425SBarry Smith PetscScalar *x; 1678985db425SBarry Smith MatScalar *aa = a->v; 1679985db425SBarry Smith 1680985db425SBarry Smith PetscFunctionBegin; 1681e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1682985db425SBarry Smith 1683985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1684985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1685985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1686e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1687985db425SBarry Smith for (i=0; i<m; i++) { 1688985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 1689985db425SBarry Smith for (j=1; j<n; j++){ 1690985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(aa[i+m*j])) {x[i] = aa[i + m*j]; if (idx) idx[i] = j;} 1691985db425SBarry Smith } 1692985db425SBarry Smith } 1693985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1694985db425SBarry Smith PetscFunctionReturn(0); 1695985db425SBarry Smith } 1696985db425SBarry Smith 1697985db425SBarry Smith #undef __FUNCT__ 1698985db425SBarry Smith #define __FUNCT__ "MatGetRowMaxAbs_SeqDense" 1699985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 1700985db425SBarry Smith { 1701985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1702985db425SBarry Smith PetscErrorCode ierr; 1703d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1704985db425SBarry Smith PetscScalar *x; 1705985db425SBarry Smith PetscReal atmp; 1706985db425SBarry Smith MatScalar *aa = a->v; 1707985db425SBarry Smith 1708985db425SBarry Smith PetscFunctionBegin; 1709e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1710985db425SBarry Smith 1711985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1712985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1713985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1714e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1715985db425SBarry Smith for (i=0; i<m; i++) { 17169189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 1717985db425SBarry Smith for (j=1; j<n; j++){ 1718985db425SBarry Smith atmp = PetscAbsScalar(aa[i+m*j]); 1719985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 1720985db425SBarry Smith } 1721985db425SBarry Smith } 1722985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1723985db425SBarry Smith PetscFunctionReturn(0); 1724985db425SBarry Smith } 1725985db425SBarry Smith 1726985db425SBarry Smith #undef __FUNCT__ 1727985db425SBarry Smith #define __FUNCT__ "MatGetRowMin_SeqDense" 1728985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 1729985db425SBarry Smith { 1730985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1731985db425SBarry Smith PetscErrorCode ierr; 1732d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1733985db425SBarry Smith PetscScalar *x; 1734985db425SBarry Smith MatScalar *aa = a->v; 1735985db425SBarry Smith 1736985db425SBarry Smith PetscFunctionBegin; 1737e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1738985db425SBarry Smith 1739985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1740985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1741985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1742e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1743985db425SBarry Smith for (i=0; i<m; i++) { 1744985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 1745985db425SBarry Smith for (j=1; j<n; j++){ 1746985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(aa[i+m*j])) {x[i] = aa[i + m*j]; if (idx) idx[i] = j;} 1747985db425SBarry Smith } 1748985db425SBarry Smith } 1749985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1750985db425SBarry Smith PetscFunctionReturn(0); 1751985db425SBarry Smith } 1752985db425SBarry Smith 17538d0534beSBarry Smith #undef __FUNCT__ 17548d0534beSBarry Smith #define __FUNCT__ "MatGetColumnVector_SeqDense" 17558d0534beSBarry Smith PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 17568d0534beSBarry Smith { 17578d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 17588d0534beSBarry Smith PetscErrorCode ierr; 17598d0534beSBarry Smith PetscScalar *x; 17608d0534beSBarry Smith 17618d0534beSBarry Smith PetscFunctionBegin; 1762e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 17638d0534beSBarry Smith 17648d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1765d0f46423SBarry Smith ierr = PetscMemcpy(x,a->v+col*a->lda,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 17668d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 17678d0534beSBarry Smith PetscFunctionReturn(0); 17688d0534beSBarry Smith } 17698d0534beSBarry Smith 1770289bc588SBarry Smith /* -------------------------------------------------------------------*/ 1771a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqDense, 1772905e6a2fSBarry Smith MatGetRow_SeqDense, 1773905e6a2fSBarry Smith MatRestoreRow_SeqDense, 1774905e6a2fSBarry Smith MatMult_SeqDense, 177597304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 17767c922b88SBarry Smith MatMultTranspose_SeqDense, 17777c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 1778db4efbfdSBarry Smith 0, 1779db4efbfdSBarry Smith 0, 1780db4efbfdSBarry Smith 0, 1781db4efbfdSBarry Smith /*10*/ 0, 1782905e6a2fSBarry Smith MatLUFactor_SeqDense, 1783905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 178441f059aeSBarry Smith MatSOR_SeqDense, 1785ec8511deSBarry Smith MatTranspose_SeqDense, 178697304618SKris Buschelman /*15*/ MatGetInfo_SeqDense, 1787905e6a2fSBarry Smith MatEqual_SeqDense, 1788905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 1789905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 1790905e6a2fSBarry Smith MatNorm_SeqDense, 1791c0aa2d19SHong Zhang /*20*/ MatAssemblyBegin_SeqDense, 1792c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 1793905e6a2fSBarry Smith MatSetOption_SeqDense, 1794905e6a2fSBarry Smith MatZeroEntries_SeqDense, 1795d519adbfSMatthew Knepley /*24*/ MatZeroRows_SeqDense, 1796db4efbfdSBarry Smith 0, 1797db4efbfdSBarry Smith 0, 1798db4efbfdSBarry Smith 0, 1799db4efbfdSBarry Smith 0, 1800d519adbfSMatthew Knepley /*29*/ MatSetUpPreallocation_SeqDense, 1801273d9f13SBarry Smith 0, 1802905e6a2fSBarry Smith 0, 1803905e6a2fSBarry Smith MatGetArray_SeqDense, 1804905e6a2fSBarry Smith MatRestoreArray_SeqDense, 1805d519adbfSMatthew Knepley /*34*/ MatDuplicate_SeqDense, 1806a5ae1ecdSBarry Smith 0, 1807a5ae1ecdSBarry Smith 0, 1808a5ae1ecdSBarry Smith 0, 1809a5ae1ecdSBarry Smith 0, 1810d519adbfSMatthew Knepley /*39*/ MatAXPY_SeqDense, 1811a5ae1ecdSBarry Smith MatGetSubMatrices_SeqDense, 1812a5ae1ecdSBarry Smith 0, 18134b0e389bSBarry Smith MatGetValues_SeqDense, 1814a5ae1ecdSBarry Smith MatCopy_SeqDense, 1815d519adbfSMatthew Knepley /*44*/ MatGetRowMax_SeqDense, 1816a5ae1ecdSBarry Smith MatScale_SeqDense, 1817a5ae1ecdSBarry Smith 0, 1818a5ae1ecdSBarry Smith 0, 1819a5ae1ecdSBarry Smith 0, 1820d519adbfSMatthew Knepley /*49*/ 0, 1821a5ae1ecdSBarry Smith 0, 1822a5ae1ecdSBarry Smith 0, 1823a5ae1ecdSBarry Smith 0, 1824a5ae1ecdSBarry Smith 0, 1825d519adbfSMatthew Knepley /*54*/ 0, 1826a5ae1ecdSBarry Smith 0, 1827a5ae1ecdSBarry Smith 0, 1828a5ae1ecdSBarry Smith 0, 1829a5ae1ecdSBarry Smith 0, 1830d519adbfSMatthew Knepley /*59*/ 0, 1831e03a110bSBarry Smith MatDestroy_SeqDense, 1832e03a110bSBarry Smith MatView_SeqDense, 1833357abbc8SBarry Smith 0, 183497304618SKris Buschelman 0, 1835d519adbfSMatthew Knepley /*64*/ 0, 183697304618SKris Buschelman 0, 183797304618SKris Buschelman 0, 183897304618SKris Buschelman 0, 183997304618SKris Buschelman 0, 1840d519adbfSMatthew Knepley /*69*/ MatGetRowMaxAbs_SeqDense, 184197304618SKris Buschelman 0, 184297304618SKris Buschelman 0, 184397304618SKris Buschelman 0, 184497304618SKris Buschelman 0, 1845d519adbfSMatthew Knepley /*74*/ 0, 184697304618SKris Buschelman 0, 184797304618SKris Buschelman 0, 184897304618SKris Buschelman 0, 184997304618SKris Buschelman 0, 1850d519adbfSMatthew Knepley /*79*/ 0, 185197304618SKris Buschelman 0, 185297304618SKris Buschelman 0, 185397304618SKris Buschelman 0, 18545bba2384SShri Abhyankar /*83*/ MatLoad_SeqDense, 1855865e5f61SKris Buschelman 0, 18561cbb95d3SBarry Smith MatIsHermitian_SeqDense, 1857865e5f61SKris Buschelman 0, 1858865e5f61SKris Buschelman 0, 1859865e5f61SKris Buschelman 0, 1860d519adbfSMatthew Knepley /*89*/ MatMatMult_SeqDense_SeqDense, 1861a9fe9ddaSSatish Balay MatMatMultSymbolic_SeqDense_SeqDense, 1862a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 1863865e5f61SKris Buschelman 0, 1864865e5f61SKris Buschelman 0, 1865d519adbfSMatthew Knepley /*94*/ 0, 1866a9fe9ddaSSatish Balay MatMatMultTranspose_SeqDense_SeqDense, 1867a9fe9ddaSSatish Balay MatMatMultTransposeSymbolic_SeqDense_SeqDense, 1868a9fe9ddaSSatish Balay MatMatMultTransposeNumeric_SeqDense_SeqDense, 1869284134d9SBarry Smith 0, 1870d519adbfSMatthew Knepley /*99*/ 0, 1871284134d9SBarry Smith 0, 1872284134d9SBarry Smith 0, 1873ba337c44SJed Brown MatConjugate_SeqDense, 1874985db425SBarry Smith MatSetSizes_SeqDense, 1875ba337c44SJed Brown /*104*/0, 1876ba337c44SJed Brown MatRealPart_SeqDense, 1877ba337c44SJed Brown MatImaginaryPart_SeqDense, 1878985db425SBarry Smith 0, 1879985db425SBarry Smith 0, 1880d519adbfSMatthew Knepley /*109*/0, 1881985db425SBarry Smith 0, 18828d0534beSBarry Smith MatGetRowMin_SeqDense, 1883aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 1884aabbc4fbSShri Abhyankar 0, 1885aabbc4fbSShri Abhyankar /*114*/0, 1886aabbc4fbSShri Abhyankar 0, 1887aabbc4fbSShri Abhyankar 0, 1888aabbc4fbSShri Abhyankar 0, 1889aabbc4fbSShri Abhyankar 0, 1890aabbc4fbSShri Abhyankar /*119*/0, 1891aabbc4fbSShri Abhyankar 0, 1892aabbc4fbSShri Abhyankar 0, 18935bba2384SShri Abhyankar 0 1894985db425SBarry Smith }; 189590ace30eSBarry Smith 18964a2ae208SSatish Balay #undef __FUNCT__ 18974a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqDense" 18984b828684SBarry Smith /*@C 1899fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 1900d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 1901d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 1902289bc588SBarry Smith 1903db81eaa0SLois Curfman McInnes Collective on MPI_Comm 1904db81eaa0SLois Curfman McInnes 190520563c6bSBarry Smith Input Parameters: 1906db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 19070c775827SLois Curfman McInnes . m - number of rows 190818f449edSLois Curfman McInnes . n - number of columns 1909c0235b3cSMatthew Knepley - data - optional location of matrix data in column major order. Set data=PETSC_NULL for PETSc 1910dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 191120563c6bSBarry Smith 191220563c6bSBarry Smith Output Parameter: 191344cd7ae7SLois Curfman McInnes . A - the matrix 191420563c6bSBarry Smith 1915b259b22eSLois Curfman McInnes Notes: 191618f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 191718f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 1918b4fd4287SBarry Smith set data=PETSC_NULL. 191918f449edSLois Curfman McInnes 1920027ccd11SLois Curfman McInnes Level: intermediate 1921027ccd11SLois Curfman McInnes 1922dbd7a890SLois Curfman McInnes .keywords: dense, matrix, LAPACK, BLAS 1923d65003e9SLois Curfman McInnes 1924db81eaa0SLois Curfman McInnes .seealso: MatCreate(), MatCreateMPIDense(), MatSetValues() 192520563c6bSBarry Smith @*/ 1926be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 1927289bc588SBarry Smith { 1928dfbe8321SBarry Smith PetscErrorCode ierr; 19293b2fbd54SBarry Smith 19303a40ed3dSBarry Smith PetscFunctionBegin; 1931f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 1932f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 1933273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 1934273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 1935273d9f13SBarry Smith PetscFunctionReturn(0); 1936273d9f13SBarry Smith } 1937273d9f13SBarry Smith 19384a2ae208SSatish Balay #undef __FUNCT__ 1939afc30d2aSLisandro Dalcin #define __FUNCT__ "MatSeqDenseSetPreallocation" 1940273d9f13SBarry Smith /*@C 1941273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 1942273d9f13SBarry Smith 1943273d9f13SBarry Smith Collective on MPI_Comm 1944273d9f13SBarry Smith 1945273d9f13SBarry Smith Input Parameters: 1946273d9f13SBarry Smith + A - the matrix 1947273d9f13SBarry Smith - data - the array (or PETSC_NULL) 1948273d9f13SBarry Smith 1949273d9f13SBarry Smith Notes: 1950273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 1951273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 1952284134d9SBarry Smith need not call this routine. 1953273d9f13SBarry Smith 1954273d9f13SBarry Smith Level: intermediate 1955273d9f13SBarry Smith 1956273d9f13SBarry Smith .keywords: dense, matrix, LAPACK, BLAS 1957273d9f13SBarry Smith 1958867c911aSBarry Smith .seealso: MatCreate(), MatCreateMPIDense(), MatSetValues(), MatSeqDenseSetLDA() 1959867c911aSBarry Smith 1960273d9f13SBarry Smith @*/ 1961be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 1962273d9f13SBarry Smith { 19634ac538c5SBarry Smith PetscErrorCode ierr; 1964a23d5eceSKris Buschelman 1965a23d5eceSKris Buschelman PetscFunctionBegin; 19664ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 1967a23d5eceSKris Buschelman PetscFunctionReturn(0); 1968a23d5eceSKris Buschelman } 1969a23d5eceSKris Buschelman 1970a23d5eceSKris Buschelman EXTERN_C_BEGIN 1971a23d5eceSKris Buschelman #undef __FUNCT__ 1972afc30d2aSLisandro Dalcin #define __FUNCT__ "MatSeqDenseSetPreallocation_SeqDense" 1973be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 1974a23d5eceSKris Buschelman { 1975273d9f13SBarry Smith Mat_SeqDense *b; 1976dfbe8321SBarry Smith PetscErrorCode ierr; 1977273d9f13SBarry Smith 1978273d9f13SBarry Smith PetscFunctionBegin; 1979273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 1980a868139aSShri Abhyankar 198134ef9618SShri Abhyankar ierr = PetscLayoutSetBlockSize(B->rmap,1);CHKERRQ(ierr); 198234ef9618SShri Abhyankar ierr = PetscLayoutSetBlockSize(B->cmap,1);CHKERRQ(ierr); 198334ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 198434ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 198534ef9618SShri Abhyankar 1986273d9f13SBarry Smith b = (Mat_SeqDense*)B->data; 198786d161a7SShri Abhyankar b->Mmax = B->rmap->n; 198886d161a7SShri Abhyankar b->Nmax = B->cmap->n; 198986d161a7SShri Abhyankar if(b->lda <= 0 || b->changelda) b->lda = B->rmap->n; 199086d161a7SShri Abhyankar 19919e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 19929e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 19935afd5e0cSBarry Smith ierr = PetscMalloc(b->lda*b->Nmax*sizeof(PetscScalar),&b->v);CHKERRQ(ierr); 1994284134d9SBarry Smith ierr = PetscMemzero(b->v,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 1995284134d9SBarry Smith ierr = PetscLogObjectMemory(B,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 19969e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 1997273d9f13SBarry Smith } else { /* user-allocated storage */ 19989e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 1999273d9f13SBarry Smith b->v = data; 2000273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2001273d9f13SBarry Smith } 20020450473dSBarry Smith B->assembled = PETSC_TRUE; 2003273d9f13SBarry Smith PetscFunctionReturn(0); 2004273d9f13SBarry Smith } 2005a23d5eceSKris Buschelman EXTERN_C_END 2006273d9f13SBarry Smith 20071b807ce4Svictorle #undef __FUNCT__ 20081b807ce4Svictorle #define __FUNCT__ "MatSeqDenseSetLDA" 20091b807ce4Svictorle /*@C 20101b807ce4Svictorle MatSeqDenseSetLDA - Declare the leading dimension of the user-provided array 20111b807ce4Svictorle 20121b807ce4Svictorle Input parameter: 20131b807ce4Svictorle + A - the matrix 20141b807ce4Svictorle - lda - the leading dimension 20151b807ce4Svictorle 20161b807ce4Svictorle Notes: 2017867c911aSBarry Smith This routine is to be used in conjunction with MatSeqDenseSetPreallocation(); 20181b807ce4Svictorle it asserts that the preallocation has a leading dimension (the LDA parameter 20191b807ce4Svictorle of Blas and Lapack fame) larger than M, the first dimension of the matrix. 20201b807ce4Svictorle 20211b807ce4Svictorle Level: intermediate 20221b807ce4Svictorle 20231b807ce4Svictorle .keywords: dense, matrix, LAPACK, BLAS 20241b807ce4Svictorle 2025284134d9SBarry Smith .seealso: MatCreate(), MatCreateSeqDense(), MatSeqDenseSetPreallocation(), MatSetMaximumSize() 2026867c911aSBarry Smith 20271b807ce4Svictorle @*/ 2028be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetLDA(Mat B,PetscInt lda) 20291b807ce4Svictorle { 20301b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 203121a2c019SBarry Smith 20321b807ce4Svictorle PetscFunctionBegin; 2033e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 20341b807ce4Svictorle b->lda = lda; 203521a2c019SBarry Smith b->changelda = PETSC_FALSE; 203621a2c019SBarry Smith b->Mmax = PetscMax(b->Mmax,lda); 20371b807ce4Svictorle PetscFunctionReturn(0); 20381b807ce4Svictorle } 20391b807ce4Svictorle 20400bad9183SKris Buschelman /*MC 2041fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 20420bad9183SKris Buschelman 20430bad9183SKris Buschelman Options Database Keys: 20440bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 20450bad9183SKris Buschelman 20460bad9183SKris Buschelman Level: beginner 20470bad9183SKris Buschelman 204889665df3SBarry Smith .seealso: MatCreateSeqDense() 204989665df3SBarry Smith 20500bad9183SKris Buschelman M*/ 20510bad9183SKris Buschelman 2052273d9f13SBarry Smith EXTERN_C_BEGIN 20534a2ae208SSatish Balay #undef __FUNCT__ 20544a2ae208SSatish Balay #define __FUNCT__ "MatCreate_SeqDense" 2055be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreate_SeqDense(Mat B) 2056273d9f13SBarry Smith { 2057273d9f13SBarry Smith Mat_SeqDense *b; 2058dfbe8321SBarry Smith PetscErrorCode ierr; 20597c334f02SBarry Smith PetscMPIInt size; 2060273d9f13SBarry Smith 2061273d9f13SBarry Smith PetscFunctionBegin; 20627adad957SLisandro Dalcin ierr = MPI_Comm_size(((PetscObject)B)->comm,&size);CHKERRQ(ierr); 2063e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 206455659b69SBarry Smith 206538f2d2fdSLisandro Dalcin ierr = PetscNewLog(B,Mat_SeqDense,&b);CHKERRQ(ierr); 2066549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 206790f02eecSBarry Smith B->mapping = 0; 206844cd7ae7SLois Curfman McInnes B->data = (void*)b; 206918f449edSLois Curfman McInnes 207044cd7ae7SLois Curfman McInnes b->pivots = 0; 2071273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 2072273d9f13SBarry Smith b->v = 0; 207321a2c019SBarry Smith b->changelda = PETSC_FALSE; 20744e220ebcSLois Curfman McInnes 2075b24902e0SBarry Smith 2076ec1065edSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_petsc_C", 2077b24902e0SBarry Smith "MatGetFactor_seqdense_petsc", 2078b24902e0SBarry Smith MatGetFactor_seqdense_petsc);CHKERRQ(ierr); 2079a23d5eceSKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqDenseSetPreallocation_C", 2080a23d5eceSKris Buschelman "MatSeqDenseSetPreallocation_SeqDense", 2081a23d5eceSKris Buschelman MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 20824ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMult_seqaij_seqdense_C", 20834ae313f4SHong Zhang "MatMatMult_SeqAIJ_SeqDense", 20844ae313f4SHong Zhang MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 20854ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultSymbolic_seqaij_seqdense_C", 20864ae313f4SHong Zhang "MatMatMultSymbolic_SeqAIJ_SeqDense", 20874ae313f4SHong Zhang MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 20884ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultNumeric_seqaij_seqdense_C", 20894ae313f4SHong Zhang "MatMatMultNumeric_SeqAIJ_SeqDense", 20904ae313f4SHong Zhang MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 209117667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 20923a40ed3dSBarry Smith PetscFunctionReturn(0); 2093289bc588SBarry Smith } 2094273d9f13SBarry Smith EXTERN_C_END 2095