1be1d678aSKris Buschelman 267e560aaSBarry Smith /* 367e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 467e560aaSBarry Smith */ 5289bc588SBarry Smith 6dec5eb66SMatthew G Knepley #include <../src/mat/impls/dense/seq/dense.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8289bc588SBarry Smith 96a63e612SBarry Smith #include <../src/mat/impls/aij/seq/aij.h> 10b2573a8aSBarry Smith 11ca15aa20SStefano Zampini PetscErrorCode MatSeqDenseSymmetrize_Private(Mat A, PetscBool hermitian) 128c178816SStefano Zampini { 138c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 148c178816SStefano Zampini PetscInt j, k, n = A->rmap->n; 15ca15aa20SStefano Zampini PetscScalar *v; 16ca15aa20SStefano Zampini PetscErrorCode ierr; 178c178816SStefano Zampini 188c178816SStefano Zampini PetscFunctionBegin; 198c178816SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot symmetrize a rectangular matrix"); 20ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 218c178816SStefano Zampini if (!hermitian) { 228c178816SStefano Zampini for (k=0;k<n;k++) { 238c178816SStefano Zampini for (j=k;j<n;j++) { 24ca15aa20SStefano Zampini v[j*mat->lda + k] = v[k*mat->lda + j]; 258c178816SStefano Zampini } 268c178816SStefano Zampini } 278c178816SStefano Zampini } else { 288c178816SStefano Zampini for (k=0;k<n;k++) { 298c178816SStefano Zampini for (j=k;j<n;j++) { 30ca15aa20SStefano Zampini v[j*mat->lda + k] = PetscConj(v[k*mat->lda + j]); 318c178816SStefano Zampini } 328c178816SStefano Zampini } 338c178816SStefano Zampini } 34ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 358c178816SStefano Zampini PetscFunctionReturn(0); 368c178816SStefano Zampini } 378c178816SStefano Zampini 3805709791SSatish Balay PETSC_EXTERN PetscErrorCode MatSeqDenseInvertFactors_Private(Mat A) 398c178816SStefano Zampini { 408c178816SStefano Zampini #if defined(PETSC_MISSING_LAPACK_POTRF) 418c178816SStefano Zampini PetscFunctionBegin; 428c178816SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRF - Lapack routine is unavailable."); 438c178816SStefano Zampini #else 448c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 458c178816SStefano Zampini PetscErrorCode ierr; 468c178816SStefano Zampini PetscBLASInt info,n; 478c178816SStefano Zampini 488c178816SStefano Zampini PetscFunctionBegin; 498c178816SStefano Zampini if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 508c178816SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 518c178816SStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 528c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 538c178816SStefano Zampini if (!mat->fwork) { 548c178816SStefano Zampini mat->lfwork = n; 558c178816SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 568c178816SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 578c178816SStefano Zampini } 5800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 598c178816SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 6000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 61ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 628c178816SStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 638c178816SStefano Zampini if (A->spd) { 6400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 658c178816SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_("L",&n,mat->v,&mat->lda,&info)); 6600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 678c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 688c178816SStefano Zampini #if defined(PETSC_USE_COMPLEX) 698c178816SStefano Zampini } else if (A->hermitian) { 708c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 718c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 7200121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 738c178816SStefano Zampini PetscStackCallBLAS("LAPACKhetri",LAPACKhetri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7400121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 758c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 768c178816SStefano Zampini #endif 778c178816SStefano Zampini } else { /* symmetric case */ 788c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 798c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 8000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 818c178816SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 8200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 838c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_FALSE);CHKERRQ(ierr); 848c178816SStefano Zampini } 858c178816SStefano Zampini if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad Inversion: zero pivot in row %D",(PetscInt)info-1); 86ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 878c178816SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 888c178816SStefano Zampini #endif 898c178816SStefano Zampini 908c178816SStefano Zampini A->ops->solve = NULL; 918c178816SStefano Zampini A->ops->matsolve = NULL; 928c178816SStefano Zampini A->ops->solvetranspose = NULL; 938c178816SStefano Zampini A->ops->matsolvetranspose = NULL; 948c178816SStefano Zampini A->ops->solveadd = NULL; 958c178816SStefano Zampini A->ops->solvetransposeadd = NULL; 968c178816SStefano Zampini A->factortype = MAT_FACTOR_NONE; 978c178816SStefano Zampini ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 988c178816SStefano Zampini PetscFunctionReturn(0); 998c178816SStefano Zampini } 1008c178816SStefano Zampini 1013f49a652SStefano Zampini PetscErrorCode MatZeroRowsColumns_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 1023f49a652SStefano Zampini { 1033f49a652SStefano Zampini PetscErrorCode ierr; 1043f49a652SStefano Zampini Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1053f49a652SStefano Zampini PetscInt m = l->lda, n = A->cmap->n,r = A->rmap->n, i,j; 106ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 1073f49a652SStefano Zampini const PetscScalar *xx; 1083f49a652SStefano Zampini 1093f49a652SStefano Zampini PetscFunctionBegin; 1103f49a652SStefano Zampini #if defined(PETSC_USE_DEBUG) 1113f49a652SStefano Zampini for (i=0; i<N; i++) { 1123f49a652SStefano Zampini if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1133f49a652SStefano Zampini if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1143f49a652SStefano Zampini if (rows[i] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Col %D requested to be zeroed greater than or equal number of cols %D",rows[i],A->cmap->n); 1153f49a652SStefano Zampini } 1163f49a652SStefano Zampini #endif 117ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1183f49a652SStefano Zampini 1193f49a652SStefano Zampini /* fix right hand side if needed */ 1203f49a652SStefano Zampini if (x && b) { 1216c4d906cSStefano Zampini Vec xt; 1226c4d906cSStefano Zampini 1236c4d906cSStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1246c4d906cSStefano Zampini ierr = VecDuplicate(x,&xt);CHKERRQ(ierr); 1256c4d906cSStefano Zampini ierr = VecCopy(x,xt);CHKERRQ(ierr); 1266c4d906cSStefano Zampini ierr = VecScale(xt,-1.0);CHKERRQ(ierr); 1276c4d906cSStefano Zampini ierr = MatMultAdd(A,xt,b,b);CHKERRQ(ierr); 1286c4d906cSStefano Zampini ierr = VecDestroy(&xt);CHKERRQ(ierr); 1293f49a652SStefano Zampini ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 1303f49a652SStefano Zampini ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 1313f49a652SStefano Zampini for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 1323f49a652SStefano Zampini ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 1333f49a652SStefano Zampini ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 1343f49a652SStefano Zampini } 1353f49a652SStefano Zampini 136ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1373f49a652SStefano Zampini for (i=0; i<N; i++) { 138ca15aa20SStefano Zampini slot = v + rows[i]*m; 139580bdb30SBarry Smith ierr = PetscArrayzero(slot,r);CHKERRQ(ierr); 1403f49a652SStefano Zampini } 1413f49a652SStefano Zampini for (i=0; i<N; i++) { 142ca15aa20SStefano Zampini slot = v + rows[i]; 1433f49a652SStefano Zampini for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 1443f49a652SStefano Zampini } 1453f49a652SStefano Zampini if (diag != 0.0) { 1463f49a652SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1473f49a652SStefano Zampini for (i=0; i<N; i++) { 148ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1493f49a652SStefano Zampini *slot = diag; 1503f49a652SStefano Zampini } 1513f49a652SStefano Zampini } 152ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 1533f49a652SStefano Zampini PetscFunctionReturn(0); 1543f49a652SStefano Zampini } 1553f49a652SStefano Zampini 156abc3b08eSStefano Zampini PetscErrorCode MatPtAPNumeric_SeqDense_SeqDense(Mat A,Mat P,Mat C) 157abc3b08eSStefano Zampini { 158abc3b08eSStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)(C->data); 159abc3b08eSStefano Zampini PetscErrorCode ierr; 160abc3b08eSStefano Zampini 161abc3b08eSStefano Zampini PetscFunctionBegin; 162ca15aa20SStefano Zampini if (c->ptapwork) { 163ca15aa20SStefano Zampini ierr = (*C->ops->matmultnumeric)(A,P,c->ptapwork);CHKERRQ(ierr); 164ca15aa20SStefano Zampini ierr = (*C->ops->transposematmultnumeric)(P,c->ptapwork,C);CHKERRQ(ierr); 165ca15aa20SStefano Zampini } else { /* first time went trough the basic. Should we add better dispatching for subclasses? */ 166ca15aa20SStefano Zampini ierr = MatPtAP_Basic(A,P,MAT_REUSE_MATRIX,PETSC_DEFAULT,&C);CHKERRQ(ierr); 167ca15aa20SStefano Zampini } 168abc3b08eSStefano Zampini PetscFunctionReturn(0); 169abc3b08eSStefano Zampini } 170abc3b08eSStefano Zampini 171abc3b08eSStefano Zampini PetscErrorCode MatPtAPSymbolic_SeqDense_SeqDense(Mat A,Mat P,PetscReal fill,Mat *C) 172abc3b08eSStefano Zampini { 173abc3b08eSStefano Zampini Mat_SeqDense *c; 174ca15aa20SStefano Zampini PetscBool flg; 175abc3b08eSStefano Zampini PetscErrorCode ierr; 176abc3b08eSStefano Zampini 177abc3b08eSStefano Zampini PetscFunctionBegin; 178ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)P,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 179ca15aa20SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),C);CHKERRQ(ierr); 180ca15aa20SStefano Zampini ierr = MatSetSizes(*C,P->cmap->n,P->cmap->n,P->cmap->N,P->cmap->N);CHKERRQ(ierr); 181ca15aa20SStefano Zampini ierr = MatSetType(*C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 182ca15aa20SStefano Zampini ierr = MatSeqDenseSetPreallocation(*C,NULL);CHKERRQ(ierr); 183abc3b08eSStefano Zampini c = (Mat_SeqDense*)((*C)->data); 184ca15aa20SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&c->ptapwork);CHKERRQ(ierr); 185ca15aa20SStefano Zampini ierr = MatSetSizes(c->ptapwork,A->rmap->n,P->cmap->n,A->rmap->N,P->cmap->N);CHKERRQ(ierr); 186ca15aa20SStefano Zampini ierr = MatSetType(c->ptapwork,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 187ca15aa20SStefano Zampini ierr = MatSeqDenseSetPreallocation(c->ptapwork,NULL);CHKERRQ(ierr); 188abc3b08eSStefano Zampini PetscFunctionReturn(0); 189abc3b08eSStefano Zampini } 190abc3b08eSStefano Zampini 191150d2497SBarry Smith PETSC_INTERN PetscErrorCode MatPtAP_SeqDense_SeqDense(Mat A,Mat P,MatReuse reuse,PetscReal fill,Mat *C) 192abc3b08eSStefano Zampini { 193abc3b08eSStefano Zampini PetscErrorCode ierr; 194abc3b08eSStefano Zampini 195abc3b08eSStefano Zampini PetscFunctionBegin; 196abc3b08eSStefano Zampini if (reuse == MAT_INITIAL_MATRIX) { 197abc3b08eSStefano Zampini ierr = MatPtAPSymbolic_SeqDense_SeqDense(A,P,fill,C);CHKERRQ(ierr); 198abc3b08eSStefano Zampini } 199abc3b08eSStefano Zampini ierr = PetscLogEventBegin(MAT_PtAPNumeric,A,P,0,0);CHKERRQ(ierr); 200abc3b08eSStefano Zampini ierr = (*(*C)->ops->ptapnumeric)(A,P,*C);CHKERRQ(ierr); 201abc3b08eSStefano Zampini ierr = PetscLogEventEnd(MAT_PtAPNumeric,A,P,0,0);CHKERRQ(ierr); 202abc3b08eSStefano Zampini PetscFunctionReturn(0); 203abc3b08eSStefano Zampini } 204abc3b08eSStefano Zampini 205cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 206b49cda9fSStefano Zampini { 207a13144ffSStefano Zampini Mat B = NULL; 208b49cda9fSStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 209b49cda9fSStefano Zampini Mat_SeqDense *b; 210b49cda9fSStefano Zampini PetscErrorCode ierr; 211b49cda9fSStefano Zampini PetscInt *ai=a->i,*aj=a->j,m=A->rmap->N,n=A->cmap->N,i; 212b49cda9fSStefano Zampini MatScalar *av=a->a; 213a13144ffSStefano Zampini PetscBool isseqdense; 214b49cda9fSStefano Zampini 215b49cda9fSStefano Zampini PetscFunctionBegin; 216a13144ffSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 217a13144ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*newmat,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 218a32993e3SJed Brown if (!isseqdense) SETERRQ1(PetscObjectComm((PetscObject)*newmat),PETSC_ERR_USER,"Cannot reuse matrix of type %s",((PetscObject)(*newmat))->type_name); 219a13144ffSStefano Zampini } 220a13144ffSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 221b49cda9fSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 222b49cda9fSStefano Zampini ierr = MatSetSizes(B,m,n,m,n);CHKERRQ(ierr); 223b49cda9fSStefano Zampini ierr = MatSetType(B,MATSEQDENSE);CHKERRQ(ierr); 224b49cda9fSStefano Zampini ierr = MatSeqDenseSetPreallocation(B,NULL);CHKERRQ(ierr); 225b49cda9fSStefano Zampini b = (Mat_SeqDense*)(B->data); 226a13144ffSStefano Zampini } else { 227a13144ffSStefano Zampini b = (Mat_SeqDense*)((*newmat)->data); 228580bdb30SBarry Smith ierr = PetscArrayzero(b->v,m*n);CHKERRQ(ierr); 229a13144ffSStefano Zampini } 230b49cda9fSStefano Zampini for (i=0; i<m; i++) { 231b49cda9fSStefano Zampini PetscInt j; 232b49cda9fSStefano Zampini for (j=0;j<ai[1]-ai[0];j++) { 233b49cda9fSStefano Zampini b->v[*aj*m+i] = *av; 234b49cda9fSStefano Zampini aj++; 235b49cda9fSStefano Zampini av++; 236b49cda9fSStefano Zampini } 237b49cda9fSStefano Zampini ai++; 238b49cda9fSStefano Zampini } 239b49cda9fSStefano Zampini 240511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 241a13144ffSStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 242a13144ffSStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 24328be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 244b49cda9fSStefano Zampini } else { 245a13144ffSStefano Zampini if (B) *newmat = B; 246a13144ffSStefano Zampini ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 247a13144ffSStefano Zampini ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 248b49cda9fSStefano Zampini } 249b49cda9fSStefano Zampini PetscFunctionReturn(0); 250b49cda9fSStefano Zampini } 251b49cda9fSStefano Zampini 252cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqAIJ(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 2536a63e612SBarry Smith { 2546a63e612SBarry Smith Mat B; 2556a63e612SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2566a63e612SBarry Smith PetscErrorCode ierr; 2579399e1b8SMatthew G. Knepley PetscInt i, j; 2589399e1b8SMatthew G. Knepley PetscInt *rows, *nnz; 2599399e1b8SMatthew G. Knepley MatScalar *aa = a->v, *vals; 2606a63e612SBarry Smith 2616a63e612SBarry Smith PetscFunctionBegin; 262ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 2636a63e612SBarry Smith ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2646a63e612SBarry Smith ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 2659399e1b8SMatthew G. Knepley ierr = PetscCalloc3(A->rmap->n,&rows,A->rmap->n,&nnz,A->rmap->n,&vals);CHKERRQ(ierr); 2669399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2679399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) ++nnz[i]; 2686a63e612SBarry Smith aa += a->lda; 2696a63e612SBarry Smith } 2709399e1b8SMatthew G. Knepley ierr = MatSeqAIJSetPreallocation(B,PETSC_DETERMINE,nnz);CHKERRQ(ierr); 2719399e1b8SMatthew G. Knepley aa = a->v; 2729399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2739399e1b8SMatthew G. Knepley PetscInt numRows = 0; 2749399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) {rows[numRows] = i; vals[numRows++] = aa[i];} 2759399e1b8SMatthew G. Knepley ierr = MatSetValues(B,numRows,rows,1,&j,vals,INSERT_VALUES);CHKERRQ(ierr); 2769399e1b8SMatthew G. Knepley aa += a->lda; 2779399e1b8SMatthew G. Knepley } 2789399e1b8SMatthew G. Knepley ierr = PetscFree3(rows,nnz,vals);CHKERRQ(ierr); 2796a63e612SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2806a63e612SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2816a63e612SBarry Smith 282511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 28328be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 2846a63e612SBarry Smith } else { 2856a63e612SBarry Smith *newmat = B; 2866a63e612SBarry Smith } 2876a63e612SBarry Smith PetscFunctionReturn(0); 2886a63e612SBarry Smith } 2896a63e612SBarry Smith 290ca15aa20SStefano Zampini PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 2911987afe7SBarry Smith { 2921987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 293ca15aa20SStefano Zampini const PetscScalar *xv; 294ca15aa20SStefano Zampini PetscScalar *yv; 2950805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 296efee365bSSatish Balay PetscErrorCode ierr; 2973a40ed3dSBarry Smith 2983a40ed3dSBarry Smith PetscFunctionBegin; 299ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(X,&xv);CHKERRQ(ierr); 300ca15aa20SStefano Zampini ierr = MatDenseGetArray(Y,&yv);CHKERRQ(ierr); 301c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n*X->cmap->n,&N);CHKERRQ(ierr); 302c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n,&m);CHKERRQ(ierr); 303c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->lda,&ldax);CHKERRQ(ierr); 304c5df96a5SBarry Smith ierr = PetscBLASIntCast(y->lda,&lday);CHKERRQ(ierr); 305a5ce6ee0Svictorle if (ldax>m || lday>m) { 306ca15aa20SStefano Zampini PetscInt j; 307ca15aa20SStefano Zampini 308d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 309ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&m,&alpha,xv+j*ldax,&one,yv+j*lday,&one)); 310a5ce6ee0Svictorle } 311a5ce6ee0Svictorle } else { 312ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&N,&alpha,xv,&one,yv,&one)); 313a5ce6ee0Svictorle } 314ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(X,&xv);CHKERRQ(ierr); 315ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(Y,&yv);CHKERRQ(ierr); 3160450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 3173a40ed3dSBarry Smith PetscFunctionReturn(0); 3181987afe7SBarry Smith } 3191987afe7SBarry Smith 320e0877f53SBarry Smith static PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 321289bc588SBarry Smith { 322ca15aa20SStefano Zampini PetscLogDouble N = A->rmap->n*A->cmap->n; 3233a40ed3dSBarry Smith 3243a40ed3dSBarry Smith PetscFunctionBegin; 3254e220ebcSLois Curfman McInnes info->block_size = 1.0; 326ca15aa20SStefano Zampini info->nz_allocated = N; 327ca15aa20SStefano Zampini info->nz_used = N; 328ca15aa20SStefano Zampini info->nz_unneeded = 0; 329ca15aa20SStefano Zampini info->assemblies = A->num_ass; 3304e220ebcSLois Curfman McInnes info->mallocs = 0; 3317adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 3324e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 3334e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 3344e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 3353a40ed3dSBarry Smith PetscFunctionReturn(0); 336289bc588SBarry Smith } 337289bc588SBarry Smith 338e0877f53SBarry Smith static PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 33980cd9d93SLois Curfman McInnes { 340273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 341ca15aa20SStefano Zampini PetscScalar *v; 342efee365bSSatish Balay PetscErrorCode ierr; 343c5df96a5SBarry Smith PetscBLASInt one = 1,j,nz,lda; 34480cd9d93SLois Curfman McInnes 3453a40ed3dSBarry Smith PetscFunctionBegin; 346ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 347c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->lda,&lda);CHKERRQ(ierr); 348d0f46423SBarry Smith if (lda>A->rmap->n) { 349c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&nz);CHKERRQ(ierr); 350d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 351ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v+j*lda,&one)); 352a5ce6ee0Svictorle } 353a5ce6ee0Svictorle } else { 354c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n*A->cmap->n,&nz);CHKERRQ(ierr); 355ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v,&one)); 356a5ce6ee0Svictorle } 357efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 358ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 3593a40ed3dSBarry Smith PetscFunctionReturn(0); 36080cd9d93SLois Curfman McInnes } 36180cd9d93SLois Curfman McInnes 362e0877f53SBarry Smith static PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 3631cbb95d3SBarry Smith { 3641cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 365ca15aa20SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 366ca15aa20SStefano Zampini const PetscScalar *v; 367ca15aa20SStefano Zampini PetscErrorCode ierr; 3681cbb95d3SBarry Smith 3691cbb95d3SBarry Smith PetscFunctionBegin; 3701cbb95d3SBarry Smith *fl = PETSC_FALSE; 371d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 372ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 3731cbb95d3SBarry Smith for (i=0; i<m; i++) { 374ca15aa20SStefano Zampini for (j=i; j<m; j++) { 3751cbb95d3SBarry Smith if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) PetscFunctionReturn(0); 3761cbb95d3SBarry Smith } 3771cbb95d3SBarry Smith } 378ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 3791cbb95d3SBarry Smith *fl = PETSC_TRUE; 3801cbb95d3SBarry Smith PetscFunctionReturn(0); 3811cbb95d3SBarry Smith } 3821cbb95d3SBarry Smith 383ca15aa20SStefano Zampini PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 384b24902e0SBarry Smith { 385ca15aa20SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 386b24902e0SBarry Smith PetscErrorCode ierr; 387b24902e0SBarry Smith PetscInt lda = (PetscInt)mat->lda,j,m; 388b24902e0SBarry Smith 389b24902e0SBarry Smith PetscFunctionBegin; 390aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&newi->rmap);CHKERRQ(ierr); 391aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&newi->cmap);CHKERRQ(ierr); 3920298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,NULL);CHKERRQ(ierr); 393b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 394ca15aa20SStefano Zampini const PetscScalar *av; 395ca15aa20SStefano Zampini PetscScalar *v; 396ca15aa20SStefano Zampini 397ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 398ca15aa20SStefano Zampini ierr = MatDenseGetArray(newi,&v);CHKERRQ(ierr); 399d0f46423SBarry Smith if (lda>A->rmap->n) { 400d0f46423SBarry Smith m = A->rmap->n; 401d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 402ca15aa20SStefano Zampini ierr = PetscArraycpy(v+j*m,av+j*lda,m);CHKERRQ(ierr); 403b24902e0SBarry Smith } 404b24902e0SBarry Smith } else { 405ca15aa20SStefano Zampini ierr = PetscArraycpy(v,av,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 406b24902e0SBarry Smith } 407ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newi,&v);CHKERRQ(ierr); 408ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 409b24902e0SBarry Smith } 410b24902e0SBarry Smith PetscFunctionReturn(0); 411b24902e0SBarry Smith } 412b24902e0SBarry Smith 413ca15aa20SStefano Zampini PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 41402cad45dSBarry Smith { 4156849ba73SBarry Smith PetscErrorCode ierr; 41602cad45dSBarry Smith 4173a40ed3dSBarry Smith PetscFunctionBegin; 418ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),newmat);CHKERRQ(ierr); 419d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4205c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 421719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 422b24902e0SBarry Smith PetscFunctionReturn(0); 423b24902e0SBarry Smith } 424b24902e0SBarry Smith 425e0877f53SBarry Smith static PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 426289bc588SBarry Smith { 4274482741eSBarry Smith MatFactorInfo info; 428a093e273SMatthew Knepley PetscErrorCode ierr; 4293a40ed3dSBarry Smith 4303a40ed3dSBarry Smith PetscFunctionBegin; 431c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 432ca15aa20SStefano Zampini ierr = (*fact->ops->lufactor)(fact,0,0,&info);CHKERRQ(ierr); 4333a40ed3dSBarry Smith PetscFunctionReturn(0); 434289bc588SBarry Smith } 4356ee01492SSatish Balay 436e0877f53SBarry Smith static PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 437289bc588SBarry Smith { 438c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 4396849ba73SBarry Smith PetscErrorCode ierr; 440f1ceaac6SMatthew G. Knepley const PetscScalar *x; 441f1ceaac6SMatthew G. Knepley PetscScalar *y; 442c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 44367e560aaSBarry Smith 4443a40ed3dSBarry Smith PetscFunctionBegin; 445c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 446f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 4471ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 448580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 449d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 450ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 451e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 452ae7cfcebSSatish Balay #else 45300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4548b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 45500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 456e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 457ae7cfcebSSatish Balay #endif 458d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 459ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 460e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 461ae7cfcebSSatish Balay #else 462a49dc2a2SStefano Zampini if (A->spd) { 46300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4648b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 46500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 466e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 467a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 468a49dc2a2SStefano Zampini } else if (A->hermitian) { 46900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 470a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 47100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 472a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 473a49dc2a2SStefano Zampini #endif 474a49dc2a2SStefano Zampini } else { /* symmetric case */ 47500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 476a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 47700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 478a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 479a49dc2a2SStefano Zampini } 480ae7cfcebSSatish Balay #endif 4812205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 482f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 4831ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 484dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 4853a40ed3dSBarry Smith PetscFunctionReturn(0); 486289bc588SBarry Smith } 4876ee01492SSatish Balay 488e0877f53SBarry Smith static PetscErrorCode MatMatSolve_SeqDense(Mat A,Mat B,Mat X) 48985e2c93fSHong Zhang { 49085e2c93fSHong Zhang Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 49185e2c93fSHong Zhang PetscErrorCode ierr; 4921683a169SBarry Smith const PetscScalar *b; 4931683a169SBarry Smith PetscScalar *x; 494efb80c78SLisandro Dalcin PetscInt n; 495783b601eSJed Brown PetscBLASInt nrhs,info,m; 49685e2c93fSHong Zhang 49785e2c93fSHong Zhang PetscFunctionBegin; 498c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 4990298fd71SBarry Smith ierr = MatGetSize(B,NULL,&n);CHKERRQ(ierr); 500c5df96a5SBarry Smith ierr = PetscBLASIntCast(n,&nrhs);CHKERRQ(ierr); 5011683a169SBarry Smith ierr = MatDenseGetArrayRead(B,&b);CHKERRQ(ierr); 5028c778c55SBarry Smith ierr = MatDenseGetArray(X,&x);CHKERRQ(ierr); 50385e2c93fSHong Zhang 504580bdb30SBarry Smith ierr = PetscArraycpy(x,b,m*nrhs);CHKERRQ(ierr); 50585e2c93fSHong Zhang 50685e2c93fSHong Zhang if (A->factortype == MAT_FACTOR_LU) { 50785e2c93fSHong Zhang #if defined(PETSC_MISSING_LAPACK_GETRS) 50885e2c93fSHong Zhang SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 50985e2c93fSHong Zhang #else 51000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5118b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 51200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 51385e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 51485e2c93fSHong Zhang #endif 51585e2c93fSHong Zhang } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 51685e2c93fSHong Zhang #if defined(PETSC_MISSING_LAPACK_POTRS) 51785e2c93fSHong Zhang SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 51885e2c93fSHong Zhang #else 519a49dc2a2SStefano Zampini if (A->spd) { 52000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5218b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&nrhs,mat->v,&mat->lda,x,&m,&info)); 52200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 52385e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 524a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 525a49dc2a2SStefano Zampini } else if (A->hermitian) { 52600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 527a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 52800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 529a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 530a49dc2a2SStefano Zampini #endif 531a49dc2a2SStefano Zampini } else { /* symmetric case */ 53200121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 533a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 53400121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 535a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 536a49dc2a2SStefano Zampini } 53785e2c93fSHong Zhang #endif 5382205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 53985e2c93fSHong Zhang 5401683a169SBarry Smith ierr = MatDenseRestoreArrayRead(B,&b);CHKERRQ(ierr); 5418c778c55SBarry Smith ierr = MatDenseRestoreArray(X,&x);CHKERRQ(ierr); 54285e2c93fSHong Zhang ierr = PetscLogFlops(nrhs*(2.0*m*m - m));CHKERRQ(ierr); 54385e2c93fSHong Zhang PetscFunctionReturn(0); 54485e2c93fSHong Zhang } 54585e2c93fSHong Zhang 54600121966SStefano Zampini static PetscErrorCode MatConjugate_SeqDense(Mat); 54700121966SStefano Zampini 548e0877f53SBarry Smith static PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 549da3a660dSBarry Smith { 550c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 551dfbe8321SBarry Smith PetscErrorCode ierr; 552f1ceaac6SMatthew G. Knepley const PetscScalar *x; 553f1ceaac6SMatthew G. Knepley PetscScalar *y; 554c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 55567e560aaSBarry Smith 5563a40ed3dSBarry Smith PetscFunctionBegin; 557c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 558f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 5591ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 560580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 5618208b9aeSStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 562ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 563e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 564ae7cfcebSSatish Balay #else 56500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5668b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 56700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 568e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 569ae7cfcebSSatish Balay #endif 5708208b9aeSStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 571ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 572e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 573ae7cfcebSSatish Balay #else 574a49dc2a2SStefano Zampini if (A->spd) { 57500121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 57600121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57700121966SStefano Zampini #endif 57800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5798b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 58000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 58100121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 58200121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 58300121966SStefano Zampini #endif 584a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 585a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 586a49dc2a2SStefano Zampini } else if (A->hermitian) { 58700121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 58800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 58900121966SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 59000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 59100121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 592ae7cfcebSSatish Balay #endif 593a49dc2a2SStefano Zampini } else { /* symmetric case */ 59400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 595a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 59600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 597a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 598da3a660dSBarry Smith } 599a49dc2a2SStefano Zampini #endif 600a49dc2a2SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 601f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 6021ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 603dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 6043a40ed3dSBarry Smith PetscFunctionReturn(0); 605da3a660dSBarry Smith } 6066ee01492SSatish Balay 607db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 608db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 609db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 610ca15aa20SStefano Zampini PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 611db4efbfdSBarry Smith { 612db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_GETRF) 613db4efbfdSBarry Smith PetscFunctionBegin; 614e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRF - Lapack routine is unavailable."); 615db4efbfdSBarry Smith #else 616db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 617db4efbfdSBarry Smith PetscErrorCode ierr; 618db4efbfdSBarry Smith PetscBLASInt n,m,info; 619db4efbfdSBarry Smith 620db4efbfdSBarry Smith PetscFunctionBegin; 621c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 622c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 623db4efbfdSBarry Smith if (!mat->pivots) { 6248208b9aeSStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 6253bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 626db4efbfdSBarry Smith } 627db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 6288e57ea43SSatish Balay ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6298b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info)); 6308e57ea43SSatish Balay ierr = PetscFPTrapPop();CHKERRQ(ierr); 6318e57ea43SSatish Balay 632e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 633e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 6348208b9aeSStefano Zampini 635db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6368208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 637db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 638d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 639db4efbfdSBarry Smith 640f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 641f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 642f6224b95SHong Zhang 643dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 644db4efbfdSBarry Smith #endif 645db4efbfdSBarry Smith PetscFunctionReturn(0); 646db4efbfdSBarry Smith } 647db4efbfdSBarry Smith 648a49dc2a2SStefano Zampini /* Cholesky as L*L^T or L*D*L^T and the symmetric/hermitian complex variants */ 649ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 650db4efbfdSBarry Smith { 651db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_POTRF) 652db4efbfdSBarry Smith PetscFunctionBegin; 653e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRF - Lapack routine is unavailable."); 654db4efbfdSBarry Smith #else 655db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 656db4efbfdSBarry Smith PetscErrorCode ierr; 657c5df96a5SBarry Smith PetscBLASInt info,n; 658db4efbfdSBarry Smith 659db4efbfdSBarry Smith PetscFunctionBegin; 660c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 661db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 662a49dc2a2SStefano Zampini if (A->spd) { 66300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6648b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info)); 66500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 666a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 667a49dc2a2SStefano Zampini } else if (A->hermitian) { 668a49dc2a2SStefano Zampini if (!mat->pivots) { 669a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 670a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 671a49dc2a2SStefano Zampini } 672a49dc2a2SStefano Zampini if (!mat->fwork) { 673a49dc2a2SStefano Zampini PetscScalar dummy; 674a49dc2a2SStefano Zampini 675a49dc2a2SStefano Zampini mat->lfwork = -1; 67600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 677a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 67800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 679a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 680a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 681a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 682a49dc2a2SStefano Zampini } 68300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 684a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 68500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 686a49dc2a2SStefano Zampini #endif 687a49dc2a2SStefano Zampini } else { /* symmetric case */ 688a49dc2a2SStefano Zampini if (!mat->pivots) { 689a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 690a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 691a49dc2a2SStefano Zampini } 692a49dc2a2SStefano Zampini if (!mat->fwork) { 693a49dc2a2SStefano Zampini PetscScalar dummy; 694a49dc2a2SStefano Zampini 695a49dc2a2SStefano Zampini mat->lfwork = -1; 69600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 697a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 69800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 699a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 700a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 701a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 702a49dc2a2SStefano Zampini } 70300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 704a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 70500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 706a49dc2a2SStefano Zampini } 707e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 7088208b9aeSStefano Zampini 709db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 7108208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 711db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 712d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 7132205254eSKarl Rupp 714f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 715f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 716f6224b95SHong Zhang 717eb3f19e4SBarry Smith ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 718db4efbfdSBarry Smith #endif 719db4efbfdSBarry Smith PetscFunctionReturn(0); 720db4efbfdSBarry Smith } 721db4efbfdSBarry Smith 722db4efbfdSBarry Smith 7230481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 724db4efbfdSBarry Smith { 725db4efbfdSBarry Smith PetscErrorCode ierr; 726db4efbfdSBarry Smith MatFactorInfo info; 727db4efbfdSBarry Smith 728db4efbfdSBarry Smith PetscFunctionBegin; 729db4efbfdSBarry Smith info.fill = 1.0; 7302205254eSKarl Rupp 731c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 732ca15aa20SStefano Zampini ierr = (*fact->ops->choleskyfactor)(fact,0,&info);CHKERRQ(ierr); 733db4efbfdSBarry Smith PetscFunctionReturn(0); 734db4efbfdSBarry Smith } 735db4efbfdSBarry Smith 736ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 737db4efbfdSBarry Smith { 738db4efbfdSBarry Smith PetscFunctionBegin; 739c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 7401bbcc794SSatish Balay fact->preallocated = PETSC_TRUE; 741719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 742bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 743bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 744bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 745db4efbfdSBarry Smith PetscFunctionReturn(0); 746db4efbfdSBarry Smith } 747db4efbfdSBarry Smith 748ca15aa20SStefano Zampini PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 749db4efbfdSBarry Smith { 750db4efbfdSBarry Smith PetscFunctionBegin; 751b66fe19dSMatthew G Knepley fact->preallocated = PETSC_TRUE; 752c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 753719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 754bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 755bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 756bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 757db4efbfdSBarry Smith PetscFunctionReturn(0); 758db4efbfdSBarry Smith } 759db4efbfdSBarry Smith 760ca15aa20SStefano Zampini /* uses LAPACK */ 761cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 762db4efbfdSBarry Smith { 763db4efbfdSBarry Smith PetscErrorCode ierr; 764db4efbfdSBarry Smith 765db4efbfdSBarry Smith PetscFunctionBegin; 766ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),fact);CHKERRQ(ierr); 767db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 768ca15aa20SStefano Zampini ierr = MatSetType(*fact,MATDENSE);CHKERRQ(ierr); 769db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU) { 770db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 771db4efbfdSBarry Smith } else { 772db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 773db4efbfdSBarry Smith } 774d5f3da31SBarry Smith (*fact)->factortype = ftype; 77500c67f3bSHong Zhang 77600c67f3bSHong Zhang ierr = PetscFree((*fact)->solvertype);CHKERRQ(ierr); 77700c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&(*fact)->solvertype);CHKERRQ(ierr); 778db4efbfdSBarry Smith PetscFunctionReturn(0); 779db4efbfdSBarry Smith } 780db4efbfdSBarry Smith 781289bc588SBarry Smith /* ------------------------------------------------------------------*/ 782e0877f53SBarry Smith static PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 783289bc588SBarry Smith { 784c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 785d9ca1df4SBarry Smith PetscScalar *x,*v = mat->v,zero = 0.0,xt; 786d9ca1df4SBarry Smith const PetscScalar *b; 787dfbe8321SBarry Smith PetscErrorCode ierr; 788d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 789c5df96a5SBarry Smith PetscBLASInt o = 1,bm; 790289bc588SBarry Smith 7913a40ed3dSBarry Smith PetscFunctionBegin; 792ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 793c70f7ee4SJunchao Zhang if (A->offloadmask == PETSC_OFFLOAD_GPU) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 794ca15aa20SStefano Zampini #endif 795422a814eSBarry Smith if (shift == -1) shift = 0.0; /* negative shift indicates do not error on zero diagonal; this code never zeros on zero diagonal */ 796c5df96a5SBarry Smith ierr = PetscBLASIntCast(m,&bm);CHKERRQ(ierr); 797289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 7983bffc371SBarry Smith /* this is a hack fix, should have another version without the second BLASdotu */ 7992dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 800289bc588SBarry Smith } 8011ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 802d9ca1df4SBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 803b965ef7fSBarry Smith its = its*lits; 804e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 805289bc588SBarry Smith while (its--) { 806fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 807289bc588SBarry Smith for (i=0; i<m; i++) { 8083bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 80955a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 810289bc588SBarry Smith } 811289bc588SBarry Smith } 812fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 813289bc588SBarry Smith for (i=m-1; i>=0; i--) { 8143bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 81555a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 816289bc588SBarry Smith } 817289bc588SBarry Smith } 818289bc588SBarry Smith } 819d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 8201ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 8213a40ed3dSBarry Smith PetscFunctionReturn(0); 822289bc588SBarry Smith } 823289bc588SBarry Smith 824289bc588SBarry Smith /* -----------------------------------------------------------------*/ 825ca15aa20SStefano Zampini PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 826289bc588SBarry Smith { 827c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 828d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 829d9ca1df4SBarry Smith PetscScalar *y; 830dfbe8321SBarry Smith PetscErrorCode ierr; 8310805154bSBarry Smith PetscBLASInt m, n,_One=1; 832ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 8333a40ed3dSBarry Smith 8343a40ed3dSBarry Smith PetscFunctionBegin; 835c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 836c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 837d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8382bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8395ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8405ac36cfcSBarry Smith PetscBLASInt i; 8415ac36cfcSBarry Smith for (i=0; i<n; i++) y[i] = 0.0; 8425ac36cfcSBarry Smith } else { 8438b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One)); 8445ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 8455ac36cfcSBarry Smith } 846d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8472bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8483a40ed3dSBarry Smith PetscFunctionReturn(0); 849289bc588SBarry Smith } 850800995b7SMatthew Knepley 851ca15aa20SStefano Zampini PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 852289bc588SBarry Smith { 853c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 854d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0,_DZero=0.0; 855dfbe8321SBarry Smith PetscErrorCode ierr; 8560805154bSBarry Smith PetscBLASInt m, n, _One=1; 857d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 8583a40ed3dSBarry Smith 8593a40ed3dSBarry Smith PetscFunctionBegin; 860c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 861c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 862d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8632bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8645ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8655ac36cfcSBarry Smith PetscBLASInt i; 8665ac36cfcSBarry Smith for (i=0; i<m; i++) y[i] = 0.0; 8675ac36cfcSBarry Smith } else { 8688b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One)); 8695ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 8705ac36cfcSBarry Smith } 871d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8722bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8733a40ed3dSBarry Smith PetscFunctionReturn(0); 874289bc588SBarry Smith } 8756ee01492SSatish Balay 876ca15aa20SStefano Zampini PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 877289bc588SBarry Smith { 878c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 879d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 880d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0; 881dfbe8321SBarry Smith PetscErrorCode ierr; 8820805154bSBarry Smith PetscBLASInt m, n, _One=1; 8833a40ed3dSBarry Smith 8843a40ed3dSBarry Smith PetscFunctionBegin; 885c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 886c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 887d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 888600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 889d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8901ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8918b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 892d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8931ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 894dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8953a40ed3dSBarry Smith PetscFunctionReturn(0); 896289bc588SBarry Smith } 8976ee01492SSatish Balay 898ca15aa20SStefano Zampini PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 899289bc588SBarry Smith { 900c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 901d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 902d9ca1df4SBarry Smith PetscScalar *y; 903dfbe8321SBarry Smith PetscErrorCode ierr; 9040805154bSBarry Smith PetscBLASInt m, n, _One=1; 90587828ca2SBarry Smith PetscScalar _DOne=1.0; 9063a40ed3dSBarry Smith 9073a40ed3dSBarry Smith PetscFunctionBegin; 908c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 909c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 910d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 911600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 912d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 9131ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 9148b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 915d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 9161ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 917dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 9183a40ed3dSBarry Smith PetscFunctionReturn(0); 919289bc588SBarry Smith } 920289bc588SBarry Smith 921289bc588SBarry Smith /* -----------------------------------------------------------------*/ 922e0877f53SBarry Smith static PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 923289bc588SBarry Smith { 924c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 9256849ba73SBarry Smith PetscErrorCode ierr; 92613f74950SBarry Smith PetscInt i; 92767e560aaSBarry Smith 9283a40ed3dSBarry Smith PetscFunctionBegin; 929d0f46423SBarry Smith *ncols = A->cmap->n; 930289bc588SBarry Smith if (cols) { 931854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,cols);CHKERRQ(ierr); 932d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 933289bc588SBarry Smith } 934289bc588SBarry Smith if (vals) { 935ca15aa20SStefano Zampini const PetscScalar *v; 936ca15aa20SStefano Zampini 937ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 938854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,vals);CHKERRQ(ierr); 939ca15aa20SStefano Zampini v += row; 940d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 941ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 942289bc588SBarry Smith } 9433a40ed3dSBarry Smith PetscFunctionReturn(0); 944289bc588SBarry Smith } 9456ee01492SSatish Balay 946e0877f53SBarry Smith static PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 947289bc588SBarry Smith { 948dfbe8321SBarry Smith PetscErrorCode ierr; 9496e111a19SKarl Rupp 950606d414cSSatish Balay PetscFunctionBegin; 951606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 952606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 9533a40ed3dSBarry Smith PetscFunctionReturn(0); 954289bc588SBarry Smith } 955289bc588SBarry Smith /* ----------------------------------------------------------------*/ 956e0877f53SBarry Smith static PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 957289bc588SBarry Smith { 958c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 959ca15aa20SStefano Zampini PetscScalar *av; 96013f74950SBarry Smith PetscInt i,j,idx=0; 961ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 962c70f7ee4SJunchao Zhang PetscOffloadMask oldf; 963ca15aa20SStefano Zampini #endif 964ca15aa20SStefano Zampini PetscErrorCode ierr; 965d6dfbf8fSBarry Smith 9663a40ed3dSBarry Smith PetscFunctionBegin; 967ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&av);CHKERRQ(ierr); 968289bc588SBarry Smith if (!mat->roworiented) { 969dbb450caSBarry Smith if (addv == INSERT_VALUES) { 970289bc588SBarry Smith for (j=0; j<n; j++) { 971cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 9722515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 973e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 97458804f6dSBarry Smith #endif 975289bc588SBarry Smith for (i=0; i<m; i++) { 976cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 9772515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 978e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 97958804f6dSBarry Smith #endif 980ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 981289bc588SBarry Smith } 982289bc588SBarry Smith } 9833a40ed3dSBarry Smith } else { 984289bc588SBarry Smith for (j=0; j<n; j++) { 985cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 9862515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 987e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 98858804f6dSBarry Smith #endif 989289bc588SBarry Smith for (i=0; i<m; i++) { 990cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 9912515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 992e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 99358804f6dSBarry Smith #endif 994ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 995289bc588SBarry Smith } 996289bc588SBarry Smith } 997289bc588SBarry Smith } 9983a40ed3dSBarry Smith } else { 999dbb450caSBarry Smith if (addv == INSERT_VALUES) { 1000e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 1001cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 10022515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 1003e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 100458804f6dSBarry Smith #endif 1005e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 1006cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 10072515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 1008e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 100958804f6dSBarry Smith #endif 1010ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 1011e8d4e0b9SBarry Smith } 1012e8d4e0b9SBarry Smith } 10133a40ed3dSBarry Smith } else { 1014289bc588SBarry Smith for (i=0; i<m; i++) { 1015cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 10162515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 1017e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 101858804f6dSBarry Smith #endif 1019289bc588SBarry Smith for (j=0; j<n; j++) { 1020cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 10212515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 1022e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 102358804f6dSBarry Smith #endif 1024ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 1025289bc588SBarry Smith } 1026289bc588SBarry Smith } 1027289bc588SBarry Smith } 1028e8d4e0b9SBarry Smith } 1029ca15aa20SStefano Zampini /* hack to prevent unneeded copy to the GPU while returning the array */ 1030ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1031c70f7ee4SJunchao Zhang oldf = A->offloadmask; 1032c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_GPU; 1033ca15aa20SStefano Zampini #endif 1034ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&av);CHKERRQ(ierr); 1035ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1036c70f7ee4SJunchao Zhang A->offloadmask = (oldf == PETSC_OFFLOAD_UNALLOCATED ? PETSC_OFFLOAD_UNALLOCATED : PETSC_OFFLOAD_CPU); 1037ca15aa20SStefano Zampini #endif 10383a40ed3dSBarry Smith PetscFunctionReturn(0); 1039289bc588SBarry Smith } 1040e8d4e0b9SBarry Smith 1041e0877f53SBarry Smith static PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 1042ae80bb75SLois Curfman McInnes { 1043ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1044ca15aa20SStefano Zampini const PetscScalar *vv; 104513f74950SBarry Smith PetscInt i,j; 1046ca15aa20SStefano Zampini PetscErrorCode ierr; 1047ae80bb75SLois Curfman McInnes 10483a40ed3dSBarry Smith PetscFunctionBegin; 1049ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1050ae80bb75SLois Curfman McInnes /* row-oriented output */ 1051ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 105297e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 1053e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 1054ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 10556f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 1056e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 1057ca15aa20SStefano Zampini *v++ = vv[indexn[j]*mat->lda + indexm[i]]; 1058ae80bb75SLois Curfman McInnes } 1059ae80bb75SLois Curfman McInnes } 1060ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 10613a40ed3dSBarry Smith PetscFunctionReturn(0); 1062ae80bb75SLois Curfman McInnes } 1063ae80bb75SLois Curfman McInnes 1064289bc588SBarry Smith /* -----------------------------------------------------------------*/ 1065289bc588SBarry Smith 1066eb91f321SVaclav Hapla static PetscErrorCode MatLoad_SeqDense_Binary(Mat newmat,PetscViewer viewer) 1067aabbc4fbSShri Abhyankar { 1068aabbc4fbSShri Abhyankar Mat_SeqDense *a; 1069aabbc4fbSShri Abhyankar PetscErrorCode ierr; 1070aabbc4fbSShri Abhyankar PetscInt *scols,i,j,nz,header[4]; 1071aabbc4fbSShri Abhyankar int fd; 1072aabbc4fbSShri Abhyankar PetscMPIInt size; 1073aabbc4fbSShri Abhyankar PetscInt *rowlengths = 0,M,N,*cols,grows,gcols; 1074aabbc4fbSShri Abhyankar PetscScalar *vals,*svals,*v,*w; 1075ce94432eSBarry Smith MPI_Comm comm; 1076aabbc4fbSShri Abhyankar 1077aabbc4fbSShri Abhyankar PetscFunctionBegin; 1078ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 1079aabbc4fbSShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1080aabbc4fbSShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"view must have one processor"); 1081aabbc4fbSShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 10829860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 1083aabbc4fbSShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not matrix object"); 1084aabbc4fbSShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 1085aabbc4fbSShri Abhyankar 1086aabbc4fbSShri Abhyankar /* set global size if not set already*/ 1087aabbc4fbSShri Abhyankar if (newmat->rmap->n < 0 && newmat->rmap->N < 0 && newmat->cmap->n < 0 && newmat->cmap->N < 0) { 1088aabbc4fbSShri Abhyankar ierr = MatSetSizes(newmat,M,N,M,N);CHKERRQ(ierr); 1089aabbc4fbSShri Abhyankar } else { 1090aabbc4fbSShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 1091aabbc4fbSShri Abhyankar ierr = MatGetSize(newmat,&grows,&gcols);CHKERRQ(ierr); 1092aabbc4fbSShri Abhyankar if (M != grows || N != gcols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,grows,gcols); 1093aabbc4fbSShri Abhyankar } 1094e6324fbbSBarry Smith a = (Mat_SeqDense*)newmat->data; 1095e6324fbbSBarry Smith if (!a->user_alloc) { 10960298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newmat,NULL);CHKERRQ(ierr); 1097e6324fbbSBarry Smith } 1098aabbc4fbSShri Abhyankar 1099aabbc4fbSShri Abhyankar if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense */ 1100aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 1101aabbc4fbSShri Abhyankar v = a->v; 1102aabbc4fbSShri Abhyankar /* Allocate some temp space to read in the values and then flip them 1103aabbc4fbSShri Abhyankar from row major to column major */ 1104854ce69bSBarry Smith ierr = PetscMalloc1(M*N > 0 ? M*N : 1,&w);CHKERRQ(ierr); 1105aabbc4fbSShri Abhyankar /* read in nonzero values */ 11069860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,w,M*N,NULL,PETSC_SCALAR);CHKERRQ(ierr); 1107aabbc4fbSShri Abhyankar /* now flip the values and store them in the matrix*/ 1108aabbc4fbSShri Abhyankar for (j=0; j<N; j++) { 1109aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 1110aabbc4fbSShri Abhyankar *v++ =w[i*N+j]; 1111aabbc4fbSShri Abhyankar } 1112aabbc4fbSShri Abhyankar } 1113aabbc4fbSShri Abhyankar ierr = PetscFree(w);CHKERRQ(ierr); 1114aabbc4fbSShri Abhyankar } else { 1115aabbc4fbSShri Abhyankar /* read row lengths */ 1116854ce69bSBarry Smith ierr = PetscMalloc1(M+1,&rowlengths);CHKERRQ(ierr); 11179860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,rowlengths,M,NULL,PETSC_INT);CHKERRQ(ierr); 1118aabbc4fbSShri Abhyankar 1119aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 1120aabbc4fbSShri Abhyankar v = a->v; 1121aabbc4fbSShri Abhyankar 1122aabbc4fbSShri Abhyankar /* read column indices and nonzeros */ 1123854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&scols);CHKERRQ(ierr); 1124aabbc4fbSShri Abhyankar cols = scols; 11259860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,cols,nz,NULL,PETSC_INT);CHKERRQ(ierr); 1126854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&svals);CHKERRQ(ierr); 1127aabbc4fbSShri Abhyankar vals = svals; 11289860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,vals,nz,NULL,PETSC_SCALAR);CHKERRQ(ierr); 1129aabbc4fbSShri Abhyankar 1130aabbc4fbSShri Abhyankar /* insert into matrix */ 1131aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 1132aabbc4fbSShri Abhyankar for (j=0; j<rowlengths[i]; j++) v[i+M*scols[j]] = svals[j]; 1133aabbc4fbSShri Abhyankar svals += rowlengths[i]; scols += rowlengths[i]; 1134aabbc4fbSShri Abhyankar } 1135aabbc4fbSShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 1136aabbc4fbSShri Abhyankar ierr = PetscFree(cols);CHKERRQ(ierr); 1137aabbc4fbSShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 1138aabbc4fbSShri Abhyankar } 1139aabbc4fbSShri Abhyankar ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1140aabbc4fbSShri Abhyankar ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1141aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 1142aabbc4fbSShri Abhyankar } 1143aabbc4fbSShri Abhyankar 1144eb91f321SVaclav Hapla PetscErrorCode MatLoad_SeqDense(Mat newMat, PetscViewer viewer) 1145eb91f321SVaclav Hapla { 1146eb91f321SVaclav Hapla PetscBool isbinary, ishdf5; 1147eb91f321SVaclav Hapla PetscErrorCode ierr; 1148eb91f321SVaclav Hapla 1149eb91f321SVaclav Hapla PetscFunctionBegin; 1150eb91f321SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 1151eb91f321SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 1152eb91f321SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 1153eb91f321SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 1154eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1155eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 1156eb91f321SVaclav Hapla if (isbinary) { 1157eb91f321SVaclav Hapla ierr = MatLoad_SeqDense_Binary(newMat,viewer);CHKERRQ(ierr); 1158eb91f321SVaclav Hapla } else if (ishdf5) { 1159eb91f321SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 1160eb91f321SVaclav Hapla ierr = MatLoad_Dense_HDF5(newMat,viewer);CHKERRQ(ierr); 1161eb91f321SVaclav Hapla #else 1162eb91f321SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 1163eb91f321SVaclav Hapla #endif 1164eb91f321SVaclav Hapla } else { 1165eb91f321SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 1166eb91f321SVaclav Hapla } 1167eb91f321SVaclav Hapla PetscFunctionReturn(0); 1168eb91f321SVaclav Hapla } 1169eb91f321SVaclav Hapla 11706849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 1171289bc588SBarry Smith { 1172932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1173dfbe8321SBarry Smith PetscErrorCode ierr; 117413f74950SBarry Smith PetscInt i,j; 11752dcb1b2aSMatthew Knepley const char *name; 1176ca15aa20SStefano Zampini PetscScalar *v,*av; 1177f3ef73ceSBarry Smith PetscViewerFormat format; 11785f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 1179ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 11805f481a85SSatish Balay #endif 1181932b0c3eSLois Curfman McInnes 11823a40ed3dSBarry Smith PetscFunctionBegin; 1183ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1184b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1185456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 11863a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 1187fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 1188d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1189d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1190ca15aa20SStefano Zampini v = av + i; 119177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 1192d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1193aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1194329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 119557622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",j,(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 1196329f5518SBarry Smith } else if (PetscRealPart(*v)) { 119757622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)PetscRealPart(*v));CHKERRQ(ierr); 11986831982aSBarry Smith } 119980cd9d93SLois Curfman McInnes #else 12006831982aSBarry Smith if (*v) { 120157622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)*v);CHKERRQ(ierr); 12026831982aSBarry Smith } 120380cd9d93SLois Curfman McInnes #endif 12041b807ce4Svictorle v += a->lda; 120580cd9d93SLois Curfman McInnes } 1206b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 120780cd9d93SLois Curfman McInnes } 1208d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 12093a40ed3dSBarry Smith } else { 1210d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1211aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 121247989497SBarry Smith /* determine if matrix has all real values */ 1213ca15aa20SStefano Zampini v = av; 1214d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 1215ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break;} 121647989497SBarry Smith } 121747989497SBarry Smith #endif 1218fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 12193a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 1220d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1221d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1222fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 1223ffac6cdbSBarry Smith } 1224ffac6cdbSBarry Smith 1225d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1226ca15aa20SStefano Zampini v = av + i; 1227d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1228aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 122947989497SBarry Smith if (allreal) { 1230c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)PetscRealPart(*v));CHKERRQ(ierr); 123147989497SBarry Smith } else { 1232c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16ei ",(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 123347989497SBarry Smith } 1234289bc588SBarry Smith #else 1235c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)*v);CHKERRQ(ierr); 1236289bc588SBarry Smith #endif 12371b807ce4Svictorle v += a->lda; 1238289bc588SBarry Smith } 1239b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 1240289bc588SBarry Smith } 1241fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 1242b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 1243ffac6cdbSBarry Smith } 1244d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 1245da3a660dSBarry Smith } 1246ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1247b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 12483a40ed3dSBarry Smith PetscFunctionReturn(0); 1249289bc588SBarry Smith } 1250289bc588SBarry Smith 12516849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_Binary(Mat A,PetscViewer viewer) 1252932b0c3eSLois Curfman McInnes { 1253932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 12546849ba73SBarry Smith PetscErrorCode ierr; 125513f74950SBarry Smith int fd; 1256d0f46423SBarry Smith PetscInt ict,j,n = A->cmap->n,m = A->rmap->n,i,*col_lens,nz = m*n; 1257ca15aa20SStefano Zampini PetscScalar *av,*v,*anonz,*vals; 1258f4403165SShri Abhyankar PetscViewerFormat format; 1259932b0c3eSLois Curfman McInnes 12603a40ed3dSBarry Smith PetscFunctionBegin; 1261b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 1262ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1263f4403165SShri Abhyankar ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1264f4403165SShri Abhyankar if (format == PETSC_VIEWER_NATIVE) { 1265f4403165SShri Abhyankar /* store the matrix as a dense matrix */ 1266785e854fSJed Brown ierr = PetscMalloc1(4,&col_lens);CHKERRQ(ierr); 12672205254eSKarl Rupp 1268f4403165SShri Abhyankar col_lens[0] = MAT_FILE_CLASSID; 1269f4403165SShri Abhyankar col_lens[1] = m; 1270f4403165SShri Abhyankar col_lens[2] = n; 1271f4403165SShri Abhyankar col_lens[3] = MATRIX_BINARY_FORMAT_DENSE; 12722205254eSKarl Rupp 1273f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,col_lens,4,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 1274f4403165SShri Abhyankar ierr = PetscFree(col_lens);CHKERRQ(ierr); 1275f4403165SShri Abhyankar 1276f4403165SShri Abhyankar /* write out matrix, by rows */ 1277854ce69bSBarry Smith ierr = PetscMalloc1(m*n+1,&vals);CHKERRQ(ierr); 1278ca15aa20SStefano Zampini v = av; 1279f4403165SShri Abhyankar for (j=0; j<n; j++) { 1280f4403165SShri Abhyankar for (i=0; i<m; i++) { 1281f4403165SShri Abhyankar vals[j + i*n] = *v++; 1282f4403165SShri Abhyankar } 1283f4403165SShri Abhyankar } 1284f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,vals,n*m,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 1285f4403165SShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 1286f4403165SShri Abhyankar } else { 1287854ce69bSBarry Smith ierr = PetscMalloc1(4+nz,&col_lens);CHKERRQ(ierr); 12882205254eSKarl Rupp 12890700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 1290932b0c3eSLois Curfman McInnes col_lens[1] = m; 1291932b0c3eSLois Curfman McInnes col_lens[2] = n; 1292932b0c3eSLois Curfman McInnes col_lens[3] = nz; 1293932b0c3eSLois Curfman McInnes 1294932b0c3eSLois Curfman McInnes /* store lengths of each row and write (including header) to file */ 1295932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) col_lens[4+i] = n; 12966f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+m,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 1297932b0c3eSLois Curfman McInnes 1298932b0c3eSLois Curfman McInnes /* Possibly should write in smaller increments, not whole matrix at once? */ 1299932b0c3eSLois Curfman McInnes /* store column indices (zero start index) */ 1300932b0c3eSLois Curfman McInnes ict = 0; 1301932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 1302932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) col_lens[ict++] = j; 1303932b0c3eSLois Curfman McInnes } 13046f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 1305606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 1306932b0c3eSLois Curfman McInnes 1307932b0c3eSLois Curfman McInnes /* store nonzero values */ 1308854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&anonz);CHKERRQ(ierr); 1309932b0c3eSLois Curfman McInnes ict = 0; 1310932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 1311ca15aa20SStefano Zampini v = av + i; 1312932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) { 13131b807ce4Svictorle anonz[ict++] = *v; v += a->lda; 1314932b0c3eSLois Curfman McInnes } 1315932b0c3eSLois Curfman McInnes } 13166f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,anonz,nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 1317606d414cSSatish Balay ierr = PetscFree(anonz);CHKERRQ(ierr); 1318f4403165SShri Abhyankar } 1319ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 13203a40ed3dSBarry Smith PetscFunctionReturn(0); 1321932b0c3eSLois Curfman McInnes } 1322932b0c3eSLois Curfman McInnes 13239804daf3SBarry Smith #include <petscdraw.h> 1324e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 1325f1af5d2fSBarry Smith { 1326f1af5d2fSBarry Smith Mat A = (Mat) Aa; 13276849ba73SBarry Smith PetscErrorCode ierr; 1328383922c3SLisandro Dalcin PetscInt m = A->rmap->n,n = A->cmap->n,i,j; 1329383922c3SLisandro Dalcin int color = PETSC_DRAW_WHITE; 1330ca15aa20SStefano Zampini const PetscScalar *v; 1331b0a32e0cSBarry Smith PetscViewer viewer; 1332b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 1333f3ef73ceSBarry Smith PetscViewerFormat format; 1334f1af5d2fSBarry Smith 1335f1af5d2fSBarry Smith PetscFunctionBegin; 1336f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 1337b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1338b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 1339f1af5d2fSBarry Smith 1340f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 1341ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 1342fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1343383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1344f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 1345f1af5d2fSBarry Smith for (j = 0; j < n; j++) { 1346383922c3SLisandro Dalcin x_l = j; x_r = x_l + 1.0; 1347f1af5d2fSBarry Smith for (i = 0; i < m; i++) { 1348f1af5d2fSBarry Smith y_l = m - i - 1.0; 1349f1af5d2fSBarry Smith y_r = y_l + 1.0; 1350ca15aa20SStefano Zampini if (PetscRealPart(v[j*m+i]) > 0.) color = PETSC_DRAW_RED; 1351ca15aa20SStefano Zampini else if (PetscRealPart(v[j*m+i]) < 0.) color = PETSC_DRAW_BLUE; 1352ca15aa20SStefano Zampini else continue; 1353b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1354f1af5d2fSBarry Smith } 1355f1af5d2fSBarry Smith } 1356383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1357f1af5d2fSBarry Smith } else { 1358f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1359f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1360b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1361b05fc000SLisandro Dalcin PetscDraw popup; 1362b05fc000SLisandro Dalcin 1363f1af5d2fSBarry Smith for (i=0; i < m*n; i++) { 1364f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1365f1af5d2fSBarry Smith } 1366383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 1367b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 136845f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 1369383922c3SLisandro Dalcin 1370383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1371f1af5d2fSBarry Smith for (j=0; j<n; j++) { 1372f1af5d2fSBarry Smith x_l = j; 1373f1af5d2fSBarry Smith x_r = x_l + 1.0; 1374f1af5d2fSBarry Smith for (i=0; i<m; i++) { 1375f1af5d2fSBarry Smith y_l = m - i - 1.0; 1376f1af5d2fSBarry Smith y_r = y_l + 1.0; 1377b05fc000SLisandro Dalcin color = PetscDrawRealToColor(PetscAbsScalar(v[j*m+i]),minv,maxv); 1378b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1379f1af5d2fSBarry Smith } 1380f1af5d2fSBarry Smith } 1381383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1382f1af5d2fSBarry Smith } 1383ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 1384f1af5d2fSBarry Smith PetscFunctionReturn(0); 1385f1af5d2fSBarry Smith } 1386f1af5d2fSBarry Smith 1387e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1388f1af5d2fSBarry Smith { 1389b0a32e0cSBarry Smith PetscDraw draw; 1390ace3abfcSBarry Smith PetscBool isnull; 1391329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1392dfbe8321SBarry Smith PetscErrorCode ierr; 1393f1af5d2fSBarry Smith 1394f1af5d2fSBarry Smith PetscFunctionBegin; 1395b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1396b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1397abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1398f1af5d2fSBarry Smith 1399d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1400f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1401b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1402832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1403b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 14040298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1405832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 1406f1af5d2fSBarry Smith PetscFunctionReturn(0); 1407f1af5d2fSBarry Smith } 1408f1af5d2fSBarry Smith 1409dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1410932b0c3eSLois Curfman McInnes { 1411dfbe8321SBarry Smith PetscErrorCode ierr; 1412ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1413932b0c3eSLois Curfman McInnes 14143a40ed3dSBarry Smith PetscFunctionBegin; 1415251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1416251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1417251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 14180f5bd95cSBarry Smith 1419c45a1595SBarry Smith if (iascii) { 1420c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 14210f5bd95cSBarry Smith } else if (isbinary) { 14223a40ed3dSBarry Smith ierr = MatView_SeqDense_Binary(A,viewer);CHKERRQ(ierr); 1423f1af5d2fSBarry Smith } else if (isdraw) { 1424f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 1425932b0c3eSLois Curfman McInnes } 14263a40ed3dSBarry Smith PetscFunctionReturn(0); 1427932b0c3eSLois Curfman McInnes } 1428289bc588SBarry Smith 1429d3042a70SBarry Smith static PetscErrorCode MatDensePlaceArray_SeqDense(Mat A,const PetscScalar array[]) 1430d3042a70SBarry Smith { 1431d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1432d3042a70SBarry Smith 1433d3042a70SBarry Smith PetscFunctionBegin; 1434d3042a70SBarry Smith a->unplacedarray = a->v; 1435d3042a70SBarry Smith a->unplaced_user_alloc = a->user_alloc; 1436d3042a70SBarry Smith a->v = (PetscScalar*) array; 1437ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1438c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1439ca15aa20SStefano Zampini #endif 1440d3042a70SBarry Smith PetscFunctionReturn(0); 1441d3042a70SBarry Smith } 1442d3042a70SBarry Smith 1443d3042a70SBarry Smith static PetscErrorCode MatDenseResetArray_SeqDense(Mat A) 1444d3042a70SBarry Smith { 1445d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1446d3042a70SBarry Smith 1447d3042a70SBarry Smith PetscFunctionBegin; 1448d3042a70SBarry Smith a->v = a->unplacedarray; 1449d3042a70SBarry Smith a->user_alloc = a->unplaced_user_alloc; 1450d3042a70SBarry Smith a->unplacedarray = NULL; 1451ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1452c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1453ca15aa20SStefano Zampini #endif 1454d3042a70SBarry Smith PetscFunctionReturn(0); 1455d3042a70SBarry Smith } 1456d3042a70SBarry Smith 1457ca15aa20SStefano Zampini PetscErrorCode MatDestroy_SeqDense(Mat mat) 1458289bc588SBarry Smith { 1459ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1460dfbe8321SBarry Smith PetscErrorCode ierr; 146190f02eecSBarry Smith 14623a40ed3dSBarry Smith PetscFunctionBegin; 1463aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1464d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1465a5a9c739SBarry Smith #endif 146605b42c5fSBarry Smith ierr = PetscFree(l->pivots);CHKERRQ(ierr); 1467a49dc2a2SStefano Zampini ierr = PetscFree(l->fwork);CHKERRQ(ierr); 1468abc3b08eSStefano Zampini ierr = MatDestroy(&l->ptapwork);CHKERRQ(ierr); 14696857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1470bf0cc555SLisandro Dalcin ierr = PetscFree(mat->data);CHKERRQ(ierr); 1471dbd8c25aSHong Zhang 1472dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 147349a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetLDA_C",NULL);CHKERRQ(ierr); 1474bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArray_C",NULL);CHKERRQ(ierr); 147552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArray_C",NULL);CHKERRQ(ierr); 1476d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDensePlaceArray_C",NULL);CHKERRQ(ierr); 1477d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseResetArray_C",NULL);CHKERRQ(ierr); 147852c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayRead_C",NULL);CHKERRQ(ierr); 147952c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayRead_C",NULL);CHKERRQ(ierr); 14808baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 14818baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 14828baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_elemental_C",NULL);CHKERRQ(ierr); 14838baccfbdSHong Zhang #endif 14842bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 14852bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqdensecuda_C",NULL);CHKERRQ(ierr); 1486a4af7ca8SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaijcusparse_seqdense_C",NULL);CHKERRQ(ierr); 1487a4af7ca8SStefano Zampini #endif 1488a4af7ca8SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) 1489a4af7ca8SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaijviennacl_seqdense_C",NULL);CHKERRQ(ierr); 14902bf066beSStefano Zampini #endif 1491bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatSeqDenseSetPreallocation_C",NULL);CHKERRQ(ierr); 1492bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1493bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1494bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1495a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1496a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1497a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1498*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1499*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1500*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1501abc3b08eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatPtAP_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 150252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 150352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 150452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 150552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatPtAP_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 150652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 150752c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 150852c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 150952c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatPtAP_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 151052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 151152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 151252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 151352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMult_nest_seqdense_C",NULL);CHKERRQ(ierr); 151452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_nest_seqdense_C",NULL);CHKERRQ(ierr); 151552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_nest_seqdense_C",NULL);CHKERRQ(ierr); 151652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatPtAP_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 151752c5f739Sprj- 15183bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMult_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 15193bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 15203bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 152152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMult_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 152252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 152352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 152452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMult_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 152552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 152652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 152752c5f739Sprj- 152852c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMult_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 152952c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 153052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 153186aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumn_C",NULL);CHKERRQ(ierr); 153286aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumn_C",NULL);CHKERRQ(ierr); 15333a40ed3dSBarry Smith PetscFunctionReturn(0); 1534289bc588SBarry Smith } 1535289bc588SBarry Smith 1536e0877f53SBarry Smith static PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1537289bc588SBarry Smith { 1538c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 15396849ba73SBarry Smith PetscErrorCode ierr; 154013f74950SBarry Smith PetscInt k,j,m,n,M; 154187828ca2SBarry Smith PetscScalar *v,tmp; 154248b35521SBarry Smith 15433a40ed3dSBarry Smith PetscFunctionBegin; 1544ca15aa20SStefano Zampini m = A->rmap->n; M = mat->lda; n = A->cmap->n; 15452847e3fdSStefano Zampini if (reuse == MAT_INPLACE_MATRIX && m == n) { /* in place transpose */ 1546ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1547d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1548289bc588SBarry Smith for (k=0; k<j; k++) { 15491b807ce4Svictorle tmp = v[j + k*M]; 15501b807ce4Svictorle v[j + k*M] = v[k + j*M]; 15511b807ce4Svictorle v[k + j*M] = tmp; 1552289bc588SBarry Smith } 1553289bc588SBarry Smith } 1554ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 15553a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1556d3e5ee88SLois Curfman McInnes Mat tmat; 1557ec8511deSBarry Smith Mat_SeqDense *tmatd; 155887828ca2SBarry Smith PetscScalar *v2; 1559af36a384SStefano Zampini PetscInt M2; 1560ea709b57SSatish Balay 15612847e3fdSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 1562ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&tmat);CHKERRQ(ierr); 1563d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 15647adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 15650298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(tmat,NULL);CHKERRQ(ierr); 1566ca15aa20SStefano Zampini } else tmat = *matout; 1567ca15aa20SStefano Zampini 1568ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 1569ca15aa20SStefano Zampini ierr = MatDenseGetArray(tmat,&v2);CHKERRQ(ierr); 1570ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 1571ca15aa20SStefano Zampini M2 = tmatd->lda; 1572d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 1573af36a384SStefano Zampini for (k=0; k<m; k++) v2[j + k*M2] = v[k + j*M]; 1574d3e5ee88SLois Curfman McInnes } 1575ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(tmat,&v2);CHKERRQ(ierr); 1576ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 15776d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15786d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15792847e3fdSStefano Zampini if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) *matout = tmat; 15802847e3fdSStefano Zampini else { 15812847e3fdSStefano Zampini ierr = MatHeaderMerge(A,&tmat);CHKERRQ(ierr); 15822847e3fdSStefano Zampini } 158348b35521SBarry Smith } 15843a40ed3dSBarry Smith PetscFunctionReturn(0); 1585289bc588SBarry Smith } 1586289bc588SBarry Smith 1587e0877f53SBarry Smith static PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1588289bc588SBarry Smith { 1589c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1590c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 1591ca15aa20SStefano Zampini PetscInt i; 1592ca15aa20SStefano Zampini const PetscScalar *v1,*v2; 1593ca15aa20SStefano Zampini PetscErrorCode ierr; 15949ea5d5aeSSatish Balay 15953a40ed3dSBarry Smith PetscFunctionBegin; 1596d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1597d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1598ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A1,&v1);CHKERRQ(ierr); 1599ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A2,&v2);CHKERRQ(ierr); 1600ca15aa20SStefano Zampini for (i=0; i<A1->cmap->n; i++) { 1601ca15aa20SStefano Zampini ierr = PetscArraycmp(v1,v2,A1->rmap->n,flg);CHKERRQ(ierr); 1602ca15aa20SStefano Zampini if (*flg == PETSC_FALSE) PetscFunctionReturn(0); 1603ca15aa20SStefano Zampini v1 += mat1->lda; 1604ca15aa20SStefano Zampini v2 += mat2->lda; 16051b807ce4Svictorle } 1606ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A1,&v1);CHKERRQ(ierr); 1607ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A2,&v2);CHKERRQ(ierr); 160877c4ece6SBarry Smith *flg = PETSC_TRUE; 16093a40ed3dSBarry Smith PetscFunctionReturn(0); 1610289bc588SBarry Smith } 1611289bc588SBarry Smith 1612e0877f53SBarry Smith static PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1613289bc588SBarry Smith { 1614c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 161513f74950SBarry Smith PetscInt i,n,len; 1616ca15aa20SStefano Zampini PetscScalar *x; 1617ca15aa20SStefano Zampini const PetscScalar *vv; 1618ca15aa20SStefano Zampini PetscErrorCode ierr; 161944cd7ae7SLois Curfman McInnes 16203a40ed3dSBarry Smith PetscFunctionBegin; 16217a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 16221ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1623d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1624ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1625e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 162644cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 1627ca15aa20SStefano Zampini x[i] = vv[i*mat->lda + i]; 1628289bc588SBarry Smith } 1629ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 16301ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 16313a40ed3dSBarry Smith PetscFunctionReturn(0); 1632289bc588SBarry Smith } 1633289bc588SBarry Smith 1634e0877f53SBarry Smith static PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1635289bc588SBarry Smith { 1636c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1637f1ceaac6SMatthew G. Knepley const PetscScalar *l,*r; 1638ca15aa20SStefano Zampini PetscScalar x,*v,*vv; 1639dfbe8321SBarry Smith PetscErrorCode ierr; 1640d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 164155659b69SBarry Smith 16423a40ed3dSBarry Smith PetscFunctionBegin; 1643ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&vv);CHKERRQ(ierr); 164428988994SBarry Smith if (ll) { 16457a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 1646f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 1647e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1648da3a660dSBarry Smith for (i=0; i<m; i++) { 1649da3a660dSBarry Smith x = l[i]; 1650ca15aa20SStefano Zampini v = vv + i; 1651b43bac26SStefano Zampini for (j=0; j<n; j++) { (*v) *= x; v+= mat->lda;} 1652da3a660dSBarry Smith } 1653f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 1654eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1655da3a660dSBarry Smith } 165628988994SBarry Smith if (rr) { 16577a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 1658f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 1659e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1660da3a660dSBarry Smith for (i=0; i<n; i++) { 1661da3a660dSBarry Smith x = r[i]; 1662ca15aa20SStefano Zampini v = vv + i*mat->lda; 16632205254eSKarl Rupp for (j=0; j<m; j++) (*v++) *= x; 1664da3a660dSBarry Smith } 1665f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 1666eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1667da3a660dSBarry Smith } 1668ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&vv);CHKERRQ(ierr); 16693a40ed3dSBarry Smith PetscFunctionReturn(0); 1670289bc588SBarry Smith } 1671289bc588SBarry Smith 1672ca15aa20SStefano Zampini PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1673289bc588SBarry Smith { 1674c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1675ca15aa20SStefano Zampini PetscScalar *v,*vv; 1676329f5518SBarry Smith PetscReal sum = 0.0; 1677d0f46423SBarry Smith PetscInt lda =mat->lda,m=A->rmap->n,i,j; 1678efee365bSSatish Balay PetscErrorCode ierr; 167955659b69SBarry Smith 16803a40ed3dSBarry Smith PetscFunctionBegin; 1681ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 1682ca15aa20SStefano Zampini v = vv; 1683289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1684a5ce6ee0Svictorle if (lda>m) { 1685d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1686ca15aa20SStefano Zampini v = vv+j*lda; 1687a5ce6ee0Svictorle for (i=0; i<m; i++) { 1688a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1689a5ce6ee0Svictorle } 1690a5ce6ee0Svictorle } 1691a5ce6ee0Svictorle } else { 1692570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 1693570b7f6dSBarry Smith PetscBLASInt one = 1,cnt = A->cmap->n*A->rmap->n; 1694570b7f6dSBarry Smith *nrm = BLASnrm2_(&cnt,v,&one); 1695570b7f6dSBarry Smith } 1696570b7f6dSBarry Smith #else 1697d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1698329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1699289bc588SBarry Smith } 1700a5ce6ee0Svictorle } 17018f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 1702570b7f6dSBarry Smith #endif 1703dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 17043a40ed3dSBarry Smith } else if (type == NORM_1) { 1705064f8208SBarry Smith *nrm = 0.0; 1706d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1707ca15aa20SStefano Zampini v = vv + j*mat->lda; 1708289bc588SBarry Smith sum = 0.0; 1709d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 171033a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1711289bc588SBarry Smith } 1712064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1713289bc588SBarry Smith } 1714eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 17153a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1716064f8208SBarry Smith *nrm = 0.0; 1717d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1718ca15aa20SStefano Zampini v = vv + j; 1719289bc588SBarry Smith sum = 0.0; 1720d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 17211b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1722289bc588SBarry Smith } 1723064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1724289bc588SBarry Smith } 1725eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1726e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 1727ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 17283a40ed3dSBarry Smith PetscFunctionReturn(0); 1729289bc588SBarry Smith } 1730289bc588SBarry Smith 1731e0877f53SBarry Smith static PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1732289bc588SBarry Smith { 1733c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 173463ba0a88SBarry Smith PetscErrorCode ierr; 173567e560aaSBarry Smith 17363a40ed3dSBarry Smith PetscFunctionBegin; 1737b5a2b587SKris Buschelman switch (op) { 1738b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 17394e0d8c25SBarry Smith aij->roworiented = flg; 1740b5a2b587SKris Buschelman break; 1741512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1742b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 17433971808eSMatthew Knepley case MAT_NEW_NONZERO_ALLOCATION_ERR: 17444e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 174513fa8e87SLisandro Dalcin case MAT_KEEP_NONZERO_PATTERN: 1746b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1747b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 17480f8fb01aSBarry Smith case MAT_IGNORE_ZERO_ENTRIES: 17495021d80fSJed Brown case MAT_IGNORE_LOWER_TRIANGULAR: 1750071fcb05SBarry Smith case MAT_SORTED_FULL: 17515021d80fSJed Brown ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 17525021d80fSJed Brown break; 17535021d80fSJed Brown case MAT_SPD: 175477e54ba9SKris Buschelman case MAT_SYMMETRIC: 175577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 17569a4540c5SBarry Smith case MAT_HERMITIAN: 17579a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 17585021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 175977e54ba9SKris Buschelman break; 1760b5a2b587SKris Buschelman default: 1761e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 17623a40ed3dSBarry Smith } 17633a40ed3dSBarry Smith PetscFunctionReturn(0); 1764289bc588SBarry Smith } 1765289bc588SBarry Smith 1766e0877f53SBarry Smith static PetscErrorCode MatZeroEntries_SeqDense(Mat A) 17676f0a148fSBarry Smith { 1768ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 17696849ba73SBarry Smith PetscErrorCode ierr; 1770d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 1771ca15aa20SStefano Zampini PetscScalar *v; 17723a40ed3dSBarry Smith 17733a40ed3dSBarry Smith PetscFunctionBegin; 1774ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1775a5ce6ee0Svictorle if (lda>m) { 1776d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1777ca15aa20SStefano Zampini ierr = PetscArrayzero(v+j*lda,m);CHKERRQ(ierr); 1778a5ce6ee0Svictorle } 1779a5ce6ee0Svictorle } else { 1780ca15aa20SStefano Zampini ierr = PetscArrayzero(v,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 1781a5ce6ee0Svictorle } 1782ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17833a40ed3dSBarry Smith PetscFunctionReturn(0); 17846f0a148fSBarry Smith } 17856f0a148fSBarry Smith 1786e0877f53SBarry Smith static PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17876f0a148fSBarry Smith { 178897b48c8fSBarry Smith PetscErrorCode ierr; 1789ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1790b9679d65SBarry Smith PetscInt m = l->lda, n = A->cmap->n, i,j; 1791ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 179297b48c8fSBarry Smith const PetscScalar *xx; 179355659b69SBarry Smith 17943a40ed3dSBarry Smith PetscFunctionBegin; 1795b9679d65SBarry Smith #if defined(PETSC_USE_DEBUG) 1796b9679d65SBarry Smith for (i=0; i<N; i++) { 1797b9679d65SBarry Smith if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1798b9679d65SBarry Smith if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1799b9679d65SBarry Smith } 1800b9679d65SBarry Smith #endif 1801ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1802b9679d65SBarry Smith 180397b48c8fSBarry Smith /* fix right hand side if needed */ 180497b48c8fSBarry Smith if (x && b) { 180597b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 180697b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 18072205254eSKarl Rupp for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 180897b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 180997b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 181097b48c8fSBarry Smith } 181197b48c8fSBarry Smith 1812ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 18136f0a148fSBarry Smith for (i=0; i<N; i++) { 1814ca15aa20SStefano Zampini slot = v + rows[i]; 1815b9679d65SBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 18166f0a148fSBarry Smith } 1817f4df32b1SMatthew Knepley if (diag != 0.0) { 1818b9679d65SBarry Smith if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 18196f0a148fSBarry Smith for (i=0; i<N; i++) { 1820ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1821f4df32b1SMatthew Knepley *slot = diag; 18226f0a148fSBarry Smith } 18236f0a148fSBarry Smith } 1824ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 18253a40ed3dSBarry Smith PetscFunctionReturn(0); 18266f0a148fSBarry Smith } 1827557bce09SLois Curfman McInnes 182849a6ff4bSBarry Smith static PetscErrorCode MatDenseGetLDA_SeqDense(Mat A,PetscInt *lda) 182949a6ff4bSBarry Smith { 183049a6ff4bSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 183149a6ff4bSBarry Smith 183249a6ff4bSBarry Smith PetscFunctionBegin; 183349a6ff4bSBarry Smith *lda = mat->lda; 183449a6ff4bSBarry Smith PetscFunctionReturn(0); 183549a6ff4bSBarry Smith } 183649a6ff4bSBarry Smith 1837ca15aa20SStefano Zampini PetscErrorCode MatDenseGetArray_SeqDense(Mat A,PetscScalar *array[]) 183864e87e97SBarry Smith { 1839c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 18403a40ed3dSBarry Smith 18413a40ed3dSBarry Smith PetscFunctionBegin; 184264e87e97SBarry Smith *array = mat->v; 18433a40ed3dSBarry Smith PetscFunctionReturn(0); 184464e87e97SBarry Smith } 18450754003eSLois Curfman McInnes 1846ca15aa20SStefano Zampini PetscErrorCode MatDenseRestoreArray_SeqDense(Mat A,PetscScalar *array[]) 1847ff14e315SSatish Balay { 18483a40ed3dSBarry Smith PetscFunctionBegin; 18493a40ed3dSBarry Smith PetscFunctionReturn(0); 1850ff14e315SSatish Balay } 18510754003eSLois Curfman McInnes 1852dec5eb66SMatthew G Knepley /*@C 185349a6ff4bSBarry Smith MatDenseGetLDA - gets the leading dimension of the array returned from MatDenseGetArray() 185449a6ff4bSBarry Smith 185549a6ff4bSBarry Smith Logically Collective on Mat 185649a6ff4bSBarry Smith 185749a6ff4bSBarry Smith Input Parameter: 185849a6ff4bSBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 185949a6ff4bSBarry Smith 186049a6ff4bSBarry Smith Output Parameter: 186149a6ff4bSBarry Smith . lda - the leading dimension 186249a6ff4bSBarry Smith 186349a6ff4bSBarry Smith Level: intermediate 186449a6ff4bSBarry Smith 186549a6ff4bSBarry Smith .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatSeqDenseSetLDA() 186649a6ff4bSBarry Smith @*/ 186749a6ff4bSBarry Smith PetscErrorCode MatDenseGetLDA(Mat A,PetscInt *lda) 186849a6ff4bSBarry Smith { 186949a6ff4bSBarry Smith PetscErrorCode ierr; 187049a6ff4bSBarry Smith 187149a6ff4bSBarry Smith PetscFunctionBegin; 187249a6ff4bSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetLDA_C",(Mat,PetscInt*),(A,lda));CHKERRQ(ierr); 187349a6ff4bSBarry Smith PetscFunctionReturn(0); 187449a6ff4bSBarry Smith } 187549a6ff4bSBarry Smith 187649a6ff4bSBarry Smith /*@C 18778c778c55SBarry Smith MatDenseGetArray - gives access to the array where the data for a SeqDense matrix is stored 187873a71a0fSBarry Smith 18798572280aSBarry Smith Logically Collective on Mat 188073a71a0fSBarry Smith 188173a71a0fSBarry Smith Input Parameter: 1882579dbff0SBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 188373a71a0fSBarry Smith 188473a71a0fSBarry Smith Output Parameter: 188573a71a0fSBarry Smith . array - pointer to the data 188673a71a0fSBarry Smith 188773a71a0fSBarry Smith Level: intermediate 188873a71a0fSBarry Smith 18898572280aSBarry Smith .seealso: MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 189073a71a0fSBarry Smith @*/ 18918c778c55SBarry Smith PetscErrorCode MatDenseGetArray(Mat A,PetscScalar **array) 189273a71a0fSBarry Smith { 189373a71a0fSBarry Smith PetscErrorCode ierr; 189473a71a0fSBarry Smith 189573a71a0fSBarry Smith PetscFunctionBegin; 18968c778c55SBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 189773a71a0fSBarry Smith PetscFunctionReturn(0); 189873a71a0fSBarry Smith } 189973a71a0fSBarry Smith 1900dec5eb66SMatthew G Knepley /*@C 1901579dbff0SBarry Smith MatDenseRestoreArray - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArray() 190273a71a0fSBarry Smith 19038572280aSBarry Smith Logically Collective on Mat 19048572280aSBarry Smith 19058572280aSBarry Smith Input Parameters: 1906a2b725a8SWilliam Gropp + mat - a MATSEQDENSE or MATMPIDENSE matrix 1907a2b725a8SWilliam Gropp - array - pointer to the data 19088572280aSBarry Smith 19098572280aSBarry Smith Level: intermediate 19108572280aSBarry Smith 19118572280aSBarry Smith .seealso: MatDenseGetArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19128572280aSBarry Smith @*/ 19138572280aSBarry Smith PetscErrorCode MatDenseRestoreArray(Mat A,PetscScalar **array) 19148572280aSBarry Smith { 19158572280aSBarry Smith PetscErrorCode ierr; 19168572280aSBarry Smith 19178572280aSBarry Smith PetscFunctionBegin; 19188572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19198572280aSBarry Smith if (array) *array = NULL; 19208572280aSBarry Smith ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 19218572280aSBarry Smith PetscFunctionReturn(0); 19228572280aSBarry Smith } 19238572280aSBarry Smith 19248572280aSBarry Smith /*@C 19258572280aSBarry Smith MatDenseGetArrayRead - gives access to the array where the data for a SeqDense matrix is stored 19268572280aSBarry Smith 19278572280aSBarry Smith Not Collective 19288572280aSBarry Smith 19298572280aSBarry Smith Input Parameter: 19308572280aSBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 19318572280aSBarry Smith 19328572280aSBarry Smith Output Parameter: 19338572280aSBarry Smith . array - pointer to the data 19348572280aSBarry Smith 19358572280aSBarry Smith Level: intermediate 19368572280aSBarry Smith 19378572280aSBarry Smith .seealso: MatDenseRestoreArray(), MatDenseGetArray(), MatDenseRestoreArrayRead() 19388572280aSBarry Smith @*/ 19398572280aSBarry Smith PetscErrorCode MatDenseGetArrayRead(Mat A,const PetscScalar **array) 19408572280aSBarry Smith { 19418572280aSBarry Smith PetscErrorCode ierr; 19428572280aSBarry Smith 19438572280aSBarry Smith PetscFunctionBegin; 19448572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 19458572280aSBarry Smith PetscFunctionReturn(0); 19468572280aSBarry Smith } 19478572280aSBarry Smith 19488572280aSBarry Smith /*@C 19498572280aSBarry Smith MatDenseRestoreArrayRead - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArray() 19508572280aSBarry Smith 195173a71a0fSBarry Smith Not Collective 195273a71a0fSBarry Smith 195373a71a0fSBarry Smith Input Parameters: 1954a2b725a8SWilliam Gropp + mat - a MATSEQDENSE or MATMPIDENSE matrix 1955a2b725a8SWilliam Gropp - array - pointer to the data 195673a71a0fSBarry Smith 195773a71a0fSBarry Smith Level: intermediate 195873a71a0fSBarry Smith 19598572280aSBarry Smith .seealso: MatDenseGetArray(), MatDenseGetArrayRead(), MatDenseRestoreArray() 196073a71a0fSBarry Smith @*/ 19618572280aSBarry Smith PetscErrorCode MatDenseRestoreArrayRead(Mat A,const PetscScalar **array) 196273a71a0fSBarry Smith { 196373a71a0fSBarry Smith PetscErrorCode ierr; 196473a71a0fSBarry Smith 196573a71a0fSBarry Smith PetscFunctionBegin; 19668572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 19678572280aSBarry Smith if (array) *array = NULL; 196873a71a0fSBarry Smith PetscFunctionReturn(0); 196973a71a0fSBarry Smith } 197073a71a0fSBarry Smith 19717dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 19720754003eSLois Curfman McInnes { 1973c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 19746849ba73SBarry Smith PetscErrorCode ierr; 1975ca15aa20SStefano Zampini PetscInt i,j,nrows,ncols,blda; 19765d0c19d7SBarry Smith const PetscInt *irow,*icol; 197787828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 19780754003eSLois Curfman McInnes Mat newmat; 19790754003eSLois Curfman McInnes 19803a40ed3dSBarry Smith PetscFunctionBegin; 198178b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 198278b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 1983e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 1984e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 19850754003eSLois Curfman McInnes 1986182d2002SSatish Balay /* Check submatrixcall */ 1987182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 198813f74950SBarry Smith PetscInt n_cols,n_rows; 1989182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 199021a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 1991f746d493SDmitry Karpeev /* resize the result matrix to match number of requested rows/columns */ 1992c61587bbSBarry Smith ierr = MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 199321a2c019SBarry Smith } 1994182d2002SSatish Balay newmat = *B; 1995182d2002SSatish Balay } else { 19960754003eSLois Curfman McInnes /* Create and fill new matrix */ 1997ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&newmat);CHKERRQ(ierr); 1998f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 19997adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 20000298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newmat,NULL);CHKERRQ(ierr); 2001182d2002SSatish Balay } 2002182d2002SSatish Balay 2003182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 2004ca15aa20SStefano Zampini ierr = MatDenseGetArray(newmat,&bv);CHKERRQ(ierr); 2005ca15aa20SStefano Zampini ierr = MatDenseGetLDA(newmat,&blda);CHKERRQ(ierr); 2006182d2002SSatish Balay for (i=0; i<ncols; i++) { 20076de62eeeSBarry Smith av = v + mat->lda*icol[i]; 2008ca15aa20SStefano Zampini for (j=0; j<nrows; j++) bv[j] = av[irow[j]]; 2009ca15aa20SStefano Zampini bv += blda; 20100754003eSLois Curfman McInnes } 2011ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newmat,&bv);CHKERRQ(ierr); 2012182d2002SSatish Balay 2013182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 20146d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20156d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20160754003eSLois Curfman McInnes 20170754003eSLois Curfman McInnes /* Free work space */ 201878b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 201978b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2020182d2002SSatish Balay *B = newmat; 20213a40ed3dSBarry Smith PetscFunctionReturn(0); 20220754003eSLois Curfman McInnes } 20230754003eSLois Curfman McInnes 20247dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2025905e6a2fSBarry Smith { 20266849ba73SBarry Smith PetscErrorCode ierr; 202713f74950SBarry Smith PetscInt i; 2028905e6a2fSBarry Smith 20293a40ed3dSBarry Smith PetscFunctionBegin; 2030905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2031df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2032905e6a2fSBarry Smith } 2033905e6a2fSBarry Smith 2034905e6a2fSBarry Smith for (i=0; i<n; i++) { 20357dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2036905e6a2fSBarry Smith } 20373a40ed3dSBarry Smith PetscFunctionReturn(0); 2038905e6a2fSBarry Smith } 2039905e6a2fSBarry Smith 2040e0877f53SBarry Smith static PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 2041c0aa2d19SHong Zhang { 2042c0aa2d19SHong Zhang PetscFunctionBegin; 2043c0aa2d19SHong Zhang PetscFunctionReturn(0); 2044c0aa2d19SHong Zhang } 2045c0aa2d19SHong Zhang 2046e0877f53SBarry Smith static PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 2047c0aa2d19SHong Zhang { 2048c0aa2d19SHong Zhang PetscFunctionBegin; 2049c0aa2d19SHong Zhang PetscFunctionReturn(0); 2050c0aa2d19SHong Zhang } 2051c0aa2d19SHong Zhang 2052e0877f53SBarry Smith static PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 20534b0e389bSBarry Smith { 20544b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense*)B->data; 20556849ba73SBarry Smith PetscErrorCode ierr; 2056ca15aa20SStefano Zampini const PetscScalar *va; 2057ca15aa20SStefano Zampini PetscScalar *vb; 2058d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 20593a40ed3dSBarry Smith 20603a40ed3dSBarry Smith PetscFunctionBegin; 206133f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. */ 206233f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 2063cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 20643a40ed3dSBarry Smith PetscFunctionReturn(0); 20653a40ed3dSBarry Smith } 2066e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 2067ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&va);CHKERRQ(ierr); 2068ca15aa20SStefano Zampini ierr = MatDenseGetArray(B,&vb);CHKERRQ(ierr); 2069a5ce6ee0Svictorle if (lda1>m || lda2>m) { 20700dbb7854Svictorle for (j=0; j<n; j++) { 2071ca15aa20SStefano Zampini ierr = PetscArraycpy(vb+j*lda2,va+j*lda1,m);CHKERRQ(ierr); 2072a5ce6ee0Svictorle } 2073a5ce6ee0Svictorle } else { 2074ca15aa20SStefano Zampini ierr = PetscArraycpy(vb,va,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 2075a5ce6ee0Svictorle } 2076ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(B,&vb);CHKERRQ(ierr); 2077ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&va);CHKERRQ(ierr); 2078ca15aa20SStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2079ca15aa20SStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2080273d9f13SBarry Smith PetscFunctionReturn(0); 2081273d9f13SBarry Smith } 2082273d9f13SBarry Smith 2083e0877f53SBarry Smith static PetscErrorCode MatSetUp_SeqDense(Mat A) 2084273d9f13SBarry Smith { 2085dfbe8321SBarry Smith PetscErrorCode ierr; 2086273d9f13SBarry Smith 2087273d9f13SBarry Smith PetscFunctionBegin; 2088273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 20893a40ed3dSBarry Smith PetscFunctionReturn(0); 20904b0e389bSBarry Smith } 20914b0e389bSBarry Smith 2092ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 2093ba337c44SJed Brown { 2094ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2095ca15aa20SStefano Zampini PetscScalar *aa; 2096ca15aa20SStefano Zampini PetscErrorCode ierr; 2097ba337c44SJed Brown 2098ba337c44SJed Brown PetscFunctionBegin; 2099ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2100ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 2101ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2102ba337c44SJed Brown PetscFunctionReturn(0); 2103ba337c44SJed Brown } 2104ba337c44SJed Brown 2105ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 2106ba337c44SJed Brown { 2107ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2108ca15aa20SStefano Zampini PetscScalar *aa; 2109ca15aa20SStefano Zampini PetscErrorCode ierr; 2110ba337c44SJed Brown 2111ba337c44SJed Brown PetscFunctionBegin; 2112ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2113ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 2114ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2115ba337c44SJed Brown PetscFunctionReturn(0); 2116ba337c44SJed Brown } 2117ba337c44SJed Brown 2118ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 2119ba337c44SJed Brown { 2120ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2121ca15aa20SStefano Zampini PetscScalar *aa; 2122ca15aa20SStefano Zampini PetscErrorCode ierr; 2123ba337c44SJed Brown 2124ba337c44SJed Brown PetscFunctionBegin; 2125ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2126ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 2127ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2128ba337c44SJed Brown PetscFunctionReturn(0); 2129ba337c44SJed Brown } 2130284134d9SBarry Smith 2131a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 2132150d2497SBarry Smith PETSC_INTERN PetscErrorCode MatMatMult_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 2133a9fe9ddaSSatish Balay { 2134a9fe9ddaSSatish Balay PetscErrorCode ierr; 2135a9fe9ddaSSatish Balay 2136a9fe9ddaSSatish Balay PetscFunctionBegin; 2137a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX) { 21383ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 2139a9fe9ddaSSatish Balay ierr = MatMatMultSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 21403ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 2141a9fe9ddaSSatish Balay } 21423ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 2143ca15aa20SStefano Zampini if ((*C)->ops->matmultnumeric) { 2144ca15aa20SStefano Zampini ierr = (*(*C)->ops->matmultnumeric)(A,B,*C);CHKERRQ(ierr); 2145ca15aa20SStefano Zampini } else { 2146a9fe9ddaSSatish Balay ierr = MatMatMultNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 2147ca15aa20SStefano Zampini } 21483ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 2149a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2150a9fe9ddaSSatish Balay } 2151a9fe9ddaSSatish Balay 2152a9fe9ddaSSatish Balay PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 2153a9fe9ddaSSatish Balay { 2154ee16a9a1SHong Zhang PetscErrorCode ierr; 2155d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 2156ee16a9a1SHong Zhang Mat Cmat; 2157ca15aa20SStefano Zampini PetscBool flg; 2158a9fe9ddaSSatish Balay 2159ee16a9a1SHong Zhang PetscFunctionBegin; 2160ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 2161ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 2162ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 2163ca15aa20SStefano Zampini ierr = MatSetType(Cmat,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 21640298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,NULL);CHKERRQ(ierr); 2165ee16a9a1SHong Zhang *C = Cmat; 2166ee16a9a1SHong Zhang PetscFunctionReturn(0); 2167ee16a9a1SHong Zhang } 2168a9fe9ddaSSatish Balay 2169a9fe9ddaSSatish Balay PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2170a9fe9ddaSSatish Balay { 217152c5f739Sprj- Mat_SeqDense *a,*b=(Mat_SeqDense*)B->data,*c=(Mat_SeqDense*)C->data; 21720805154bSBarry Smith PetscBLASInt m,n,k; 2173ca15aa20SStefano Zampini const PetscScalar *av,*bv; 2174ca15aa20SStefano Zampini PetscScalar *cv; 2175a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2176fd4e9aacSBarry Smith PetscBool flg; 2177*c2916339SPierre Jolivet PetscErrorCode (*numeric)(Mat,Mat,Mat)=NULL; 2178*c2916339SPierre Jolivet PetscErrorCode ierr; 2179a9fe9ddaSSatish Balay 2180a9fe9ddaSSatish Balay PetscFunctionBegin; 2181fd4e9aacSBarry Smith /* Handle case where where user provided the final C matrix rather than calling MatMatMult() with MAT_INITIAL_MATRIX*/ 2182fd4e9aacSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&flg);CHKERRQ(ierr); 2183*c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqAIJ_SeqDense; 2184a001520aSPierre Jolivet ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&flg);CHKERRQ(ierr); 2185*c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqBAIJ_SeqDense; 2186*c2916339SPierre Jolivet ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&flg);CHKERRQ(ierr); 2187*c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqSBAIJ_SeqDense; 218852c5f739Sprj- ierr = PetscObjectTypeCompare((PetscObject)A,MATNEST,&flg);CHKERRQ(ierr); 2189*c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_Nest_Dense; 2190*c2916339SPierre Jolivet if (numeric) { 2191*c2916339SPierre Jolivet C->ops->matmultnumeric = numeric; 2192*c2916339SPierre Jolivet ierr = (*numeric)(A,B,C);CHKERRQ(ierr); 219352c5f739Sprj- PetscFunctionReturn(0); 219452c5f739Sprj- } 219552c5f739Sprj- a = (Mat_SeqDense*)A->data; 21968208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 21978208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2198c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 219949d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 2200ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 2201ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(B,&bv);CHKERRQ(ierr); 2202ca15aa20SStefano Zampini ierr = MatDenseGetArray(C,&cv);CHKERRQ(ierr); 2203ca15aa20SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&m,&n,&k,&_DOne,av,&a->lda,bv,&b->lda,&_DZero,cv,&c->lda)); 2204ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2205ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 2206ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(B,&bv);CHKERRQ(ierr); 2207ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(C,&cv);CHKERRQ(ierr); 2208a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2209a9fe9ddaSSatish Balay } 2210a9fe9ddaSSatish Balay 221169f65d41SStefano Zampini PetscErrorCode MatMatTransposeMult_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 221269f65d41SStefano Zampini { 221369f65d41SStefano Zampini PetscErrorCode ierr; 221469f65d41SStefano Zampini 221569f65d41SStefano Zampini PetscFunctionBegin; 221669f65d41SStefano Zampini if (scall == MAT_INITIAL_MATRIX) { 221769f65d41SStefano Zampini ierr = PetscLogEventBegin(MAT_MatTransposeMultSymbolic,A,B,0,0);CHKERRQ(ierr); 221869f65d41SStefano Zampini ierr = MatMatTransposeMultSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 221969f65d41SStefano Zampini ierr = PetscLogEventEnd(MAT_MatTransposeMultSymbolic,A,B,0,0);CHKERRQ(ierr); 222069f65d41SStefano Zampini } 222169f65d41SStefano Zampini ierr = PetscLogEventBegin(MAT_MatTransposeMultNumeric,A,B,0,0);CHKERRQ(ierr); 222269f65d41SStefano Zampini ierr = MatMatTransposeMultNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 222369f65d41SStefano Zampini ierr = PetscLogEventEnd(MAT_MatTransposeMultNumeric,A,B,0,0);CHKERRQ(ierr); 222469f65d41SStefano Zampini PetscFunctionReturn(0); 222569f65d41SStefano Zampini } 222669f65d41SStefano Zampini 222769f65d41SStefano Zampini PetscErrorCode MatMatTransposeMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 222869f65d41SStefano Zampini { 222969f65d41SStefano Zampini PetscErrorCode ierr; 223069f65d41SStefano Zampini PetscInt m=A->rmap->n,n=B->rmap->n; 223169f65d41SStefano Zampini Mat Cmat; 2232ca15aa20SStefano Zampini PetscBool flg; 223369f65d41SStefano Zampini 223469f65d41SStefano Zampini PetscFunctionBegin; 223569f65d41SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 223669f65d41SStefano Zampini ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 2237ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 2238ca15aa20SStefano Zampini ierr = MatSetType(Cmat,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 223969f65d41SStefano Zampini ierr = MatSeqDenseSetPreallocation(Cmat,NULL);CHKERRQ(ierr); 224069f65d41SStefano Zampini *C = Cmat; 224169f65d41SStefano Zampini PetscFunctionReturn(0); 224269f65d41SStefano Zampini } 224369f65d41SStefano Zampini 224469f65d41SStefano Zampini PetscErrorCode MatMatTransposeMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 224569f65d41SStefano Zampini { 224669f65d41SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 224769f65d41SStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 224869f65d41SStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)C->data; 224969f65d41SStefano Zampini PetscBLASInt m,n,k; 225069f65d41SStefano Zampini PetscScalar _DOne=1.0,_DZero=0.0; 225169f65d41SStefano Zampini PetscErrorCode ierr; 225269f65d41SStefano Zampini 225369f65d41SStefano Zampini PetscFunctionBegin; 225449d0e964SStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 225549d0e964SStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 225669f65d41SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 225749d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 225869f65d41SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","T",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2259ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 226069f65d41SStefano Zampini PetscFunctionReturn(0); 226169f65d41SStefano Zampini } 226269f65d41SStefano Zampini 226375648e8dSHong Zhang PetscErrorCode MatTransposeMatMult_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 2264a9fe9ddaSSatish Balay { 2265a9fe9ddaSSatish Balay PetscErrorCode ierr; 2266a9fe9ddaSSatish Balay 2267a9fe9ddaSSatish Balay PetscFunctionBegin; 2268a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX) { 22693ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_TransposeMatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 227075648e8dSHong Zhang ierr = MatTransposeMatMultSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 22713ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_TransposeMatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 2272a9fe9ddaSSatish Balay } 22733ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_TransposeMatMultNumeric,A,B,0,0);CHKERRQ(ierr); 227475648e8dSHong Zhang ierr = MatTransposeMatMultNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 22753ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_TransposeMatMultNumeric,A,B,0,0);CHKERRQ(ierr); 2276a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2277a9fe9ddaSSatish Balay } 2278a9fe9ddaSSatish Balay 227975648e8dSHong Zhang PetscErrorCode MatTransposeMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 2280a9fe9ddaSSatish Balay { 2281ee16a9a1SHong Zhang PetscErrorCode ierr; 2282d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 2283ee16a9a1SHong Zhang Mat Cmat; 2284ca15aa20SStefano Zampini PetscBool flg; 2285a9fe9ddaSSatish Balay 2286ee16a9a1SHong Zhang PetscFunctionBegin; 2287ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 2288ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 2289ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 2290ca15aa20SStefano Zampini ierr = MatSetType(Cmat,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22910298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,NULL);CHKERRQ(ierr); 2292ee16a9a1SHong Zhang *C = Cmat; 2293ee16a9a1SHong Zhang PetscFunctionReturn(0); 2294ee16a9a1SHong Zhang } 2295a9fe9ddaSSatish Balay 229675648e8dSHong Zhang PetscErrorCode MatTransposeMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2297a9fe9ddaSSatish Balay { 2298a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2299a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2300a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 23010805154bSBarry Smith PetscBLASInt m,n,k; 2302a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2303c5df96a5SBarry Smith PetscErrorCode ierr; 2304a9fe9ddaSSatish Balay 2305a9fe9ddaSSatish Balay PetscFunctionBegin; 23068208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 23078208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2308c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&k);CHKERRQ(ierr); 230949d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 23105ca1cc5dSStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2311ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2312a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2313a9fe9ddaSSatish Balay } 2314985db425SBarry Smith 2315e0877f53SBarry Smith static PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 2316985db425SBarry Smith { 2317985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2318985db425SBarry Smith PetscErrorCode ierr; 2319d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2320985db425SBarry Smith PetscScalar *x; 2321ca15aa20SStefano Zampini const PetscScalar *aa; 2322985db425SBarry Smith 2323985db425SBarry Smith PetscFunctionBegin; 2324e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2325985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2326985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2327ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2328e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2329985db425SBarry Smith for (i=0; i<m; i++) { 2330985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2331985db425SBarry Smith for (j=1; j<n; j++) { 2332ca15aa20SStefano Zampini if (PetscRealPart(x[i]) < PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2333985db425SBarry Smith } 2334985db425SBarry Smith } 2335ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2336985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2337985db425SBarry Smith PetscFunctionReturn(0); 2338985db425SBarry Smith } 2339985db425SBarry Smith 2340e0877f53SBarry Smith static PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 2341985db425SBarry Smith { 2342985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2343985db425SBarry Smith PetscErrorCode ierr; 2344d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2345985db425SBarry Smith PetscScalar *x; 2346985db425SBarry Smith PetscReal atmp; 2347ca15aa20SStefano Zampini const PetscScalar *aa; 2348985db425SBarry Smith 2349985db425SBarry Smith PetscFunctionBegin; 2350e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2351985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2352985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2353ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2354e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2355985db425SBarry Smith for (i=0; i<m; i++) { 23569189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 2357985db425SBarry Smith for (j=1; j<n; j++) { 2358ca15aa20SStefano Zampini atmp = PetscAbsScalar(aa[i+a->lda*j]); 2359985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 2360985db425SBarry Smith } 2361985db425SBarry Smith } 2362ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2363985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2364985db425SBarry Smith PetscFunctionReturn(0); 2365985db425SBarry Smith } 2366985db425SBarry Smith 2367e0877f53SBarry Smith static PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 2368985db425SBarry Smith { 2369985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2370985db425SBarry Smith PetscErrorCode ierr; 2371d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2372985db425SBarry Smith PetscScalar *x; 2373ca15aa20SStefano Zampini const PetscScalar *aa; 2374985db425SBarry Smith 2375985db425SBarry Smith PetscFunctionBegin; 2376e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2377ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2378985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2379985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2380e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2381985db425SBarry Smith for (i=0; i<m; i++) { 2382985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2383985db425SBarry Smith for (j=1; j<n; j++) { 2384ca15aa20SStefano Zampini if (PetscRealPart(x[i]) > PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2385985db425SBarry Smith } 2386985db425SBarry Smith } 2387985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2388ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2389985db425SBarry Smith PetscFunctionReturn(0); 2390985db425SBarry Smith } 2391985db425SBarry Smith 2392e0877f53SBarry Smith static PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 23938d0534beSBarry Smith { 23948d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 23958d0534beSBarry Smith PetscErrorCode ierr; 23968d0534beSBarry Smith PetscScalar *x; 2397ca15aa20SStefano Zampini const PetscScalar *aa; 23988d0534beSBarry Smith 23998d0534beSBarry Smith PetscFunctionBegin; 2400e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2401ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 24028d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2403ca15aa20SStefano Zampini ierr = PetscArraycpy(x,aa+col*a->lda,A->rmap->n);CHKERRQ(ierr); 24048d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2405ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 24068d0534beSBarry Smith PetscFunctionReturn(0); 24078d0534beSBarry Smith } 24088d0534beSBarry Smith 240952c5f739Sprj- PETSC_INTERN PetscErrorCode MatGetColumnNorms_SeqDense(Mat A,NormType type,PetscReal *norms) 24100716a85fSBarry Smith { 24110716a85fSBarry Smith PetscErrorCode ierr; 24120716a85fSBarry Smith PetscInt i,j,m,n; 24131683a169SBarry Smith const PetscScalar *a; 24140716a85fSBarry Smith 24150716a85fSBarry Smith PetscFunctionBegin; 24160716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 2417580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 24181683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&a);CHKERRQ(ierr); 24190716a85fSBarry Smith if (type == NORM_2) { 24200716a85fSBarry Smith for (i=0; i<n; i++) { 24210716a85fSBarry Smith for (j=0; j<m; j++) { 24220716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]*a[j]); 24230716a85fSBarry Smith } 24240716a85fSBarry Smith a += m; 24250716a85fSBarry Smith } 24260716a85fSBarry Smith } else if (type == NORM_1) { 24270716a85fSBarry Smith for (i=0; i<n; i++) { 24280716a85fSBarry Smith for (j=0; j<m; j++) { 24290716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]); 24300716a85fSBarry Smith } 24310716a85fSBarry Smith a += m; 24320716a85fSBarry Smith } 24330716a85fSBarry Smith } else if (type == NORM_INFINITY) { 24340716a85fSBarry Smith for (i=0; i<n; i++) { 24350716a85fSBarry Smith for (j=0; j<m; j++) { 24360716a85fSBarry Smith norms[i] = PetscMax(PetscAbsScalar(a[j]),norms[i]); 24370716a85fSBarry Smith } 24380716a85fSBarry Smith a += m; 24390716a85fSBarry Smith } 2440ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Unknown NormType"); 24411683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&a);CHKERRQ(ierr); 24420716a85fSBarry Smith if (type == NORM_2) { 24438f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 24440716a85fSBarry Smith } 24450716a85fSBarry Smith PetscFunctionReturn(0); 24460716a85fSBarry Smith } 24470716a85fSBarry Smith 244873a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqDense(Mat x,PetscRandom rctx) 244973a71a0fSBarry Smith { 245073a71a0fSBarry Smith PetscErrorCode ierr; 245173a71a0fSBarry Smith PetscScalar *a; 245273a71a0fSBarry Smith PetscInt m,n,i; 245373a71a0fSBarry Smith 245473a71a0fSBarry Smith PetscFunctionBegin; 245573a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 24568c778c55SBarry Smith ierr = MatDenseGetArray(x,&a);CHKERRQ(ierr); 245773a71a0fSBarry Smith for (i=0; i<m*n; i++) { 245873a71a0fSBarry Smith ierr = PetscRandomGetValue(rctx,a+i);CHKERRQ(ierr); 245973a71a0fSBarry Smith } 24608c778c55SBarry Smith ierr = MatDenseRestoreArray(x,&a);CHKERRQ(ierr); 246173a71a0fSBarry Smith PetscFunctionReturn(0); 246273a71a0fSBarry Smith } 246373a71a0fSBarry Smith 24643b49f96aSBarry Smith static PetscErrorCode MatMissingDiagonal_SeqDense(Mat A,PetscBool *missing,PetscInt *d) 24653b49f96aSBarry Smith { 24663b49f96aSBarry Smith PetscFunctionBegin; 24673b49f96aSBarry Smith *missing = PETSC_FALSE; 24683b49f96aSBarry Smith PetscFunctionReturn(0); 24693b49f96aSBarry Smith } 247073a71a0fSBarry Smith 2471ca15aa20SStefano Zampini /* vals is not const */ 2472af53bab2SHong Zhang static PetscErrorCode MatDenseGetColumn_SeqDense(Mat A,PetscInt col,PetscScalar **vals) 247386aefd0dSHong Zhang { 2474ca15aa20SStefano Zampini PetscErrorCode ierr; 247586aefd0dSHong Zhang Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2476ca15aa20SStefano Zampini PetscScalar *v; 247786aefd0dSHong Zhang 247886aefd0dSHong Zhang PetscFunctionBegin; 247986aefd0dSHong Zhang if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2480ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 2481ca15aa20SStefano Zampini *vals = v+col*a->lda; 2482ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 248386aefd0dSHong Zhang PetscFunctionReturn(0); 248486aefd0dSHong Zhang } 248586aefd0dSHong Zhang 2486af53bab2SHong Zhang static PetscErrorCode MatDenseRestoreColumn_SeqDense(Mat A,PetscScalar **vals) 248786aefd0dSHong Zhang { 248886aefd0dSHong Zhang PetscFunctionBegin; 248986aefd0dSHong Zhang *vals = 0; /* user cannot accidently use the array later */ 249086aefd0dSHong Zhang PetscFunctionReturn(0); 249186aefd0dSHong Zhang } 2492abc3b08eSStefano Zampini 2493289bc588SBarry Smith /* -------------------------------------------------------------------*/ 2494a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqDense, 2495905e6a2fSBarry Smith MatGetRow_SeqDense, 2496905e6a2fSBarry Smith MatRestoreRow_SeqDense, 2497905e6a2fSBarry Smith MatMult_SeqDense, 249897304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 24997c922b88SBarry Smith MatMultTranspose_SeqDense, 25007c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 2501db4efbfdSBarry Smith 0, 2502db4efbfdSBarry Smith 0, 2503db4efbfdSBarry Smith 0, 2504db4efbfdSBarry Smith /* 10*/ 0, 2505905e6a2fSBarry Smith MatLUFactor_SeqDense, 2506905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 250741f059aeSBarry Smith MatSOR_SeqDense, 2508ec8511deSBarry Smith MatTranspose_SeqDense, 250997304618SKris Buschelman /* 15*/ MatGetInfo_SeqDense, 2510905e6a2fSBarry Smith MatEqual_SeqDense, 2511905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 2512905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 2513905e6a2fSBarry Smith MatNorm_SeqDense, 2514c0aa2d19SHong Zhang /* 20*/ MatAssemblyBegin_SeqDense, 2515c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 2516905e6a2fSBarry Smith MatSetOption_SeqDense, 2517905e6a2fSBarry Smith MatZeroEntries_SeqDense, 2518d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqDense, 2519db4efbfdSBarry Smith 0, 2520db4efbfdSBarry Smith 0, 2521db4efbfdSBarry Smith 0, 2522db4efbfdSBarry Smith 0, 25234994cf47SJed Brown /* 29*/ MatSetUp_SeqDense, 2524273d9f13SBarry Smith 0, 2525905e6a2fSBarry Smith 0, 252673a71a0fSBarry Smith 0, 252773a71a0fSBarry Smith 0, 2528d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqDense, 2529a5ae1ecdSBarry Smith 0, 2530a5ae1ecdSBarry Smith 0, 2531a5ae1ecdSBarry Smith 0, 2532a5ae1ecdSBarry Smith 0, 2533d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqDense, 25347dae84e0SHong Zhang MatCreateSubMatrices_SeqDense, 2535a5ae1ecdSBarry Smith 0, 25364b0e389bSBarry Smith MatGetValues_SeqDense, 2537a5ae1ecdSBarry Smith MatCopy_SeqDense, 2538d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqDense, 2539a5ae1ecdSBarry Smith MatScale_SeqDense, 25407d68702bSBarry Smith MatShift_Basic, 2541a5ae1ecdSBarry Smith 0, 25423f49a652SStefano Zampini MatZeroRowsColumns_SeqDense, 254373a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqDense, 2544a5ae1ecdSBarry Smith 0, 2545a5ae1ecdSBarry Smith 0, 2546a5ae1ecdSBarry Smith 0, 2547a5ae1ecdSBarry Smith 0, 2548d519adbfSMatthew Knepley /* 54*/ 0, 2549a5ae1ecdSBarry Smith 0, 2550a5ae1ecdSBarry Smith 0, 2551a5ae1ecdSBarry Smith 0, 2552a5ae1ecdSBarry Smith 0, 2553d519adbfSMatthew Knepley /* 59*/ 0, 2554e03a110bSBarry Smith MatDestroy_SeqDense, 2555e03a110bSBarry Smith MatView_SeqDense, 2556357abbc8SBarry Smith 0, 255797304618SKris Buschelman 0, 2558d519adbfSMatthew Knepley /* 64*/ 0, 255997304618SKris Buschelman 0, 256097304618SKris Buschelman 0, 256197304618SKris Buschelman 0, 256297304618SKris Buschelman 0, 2563d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqDense, 256497304618SKris Buschelman 0, 256597304618SKris Buschelman 0, 256697304618SKris Buschelman 0, 256797304618SKris Buschelman 0, 2568d519adbfSMatthew Knepley /* 74*/ 0, 256997304618SKris Buschelman 0, 257097304618SKris Buschelman 0, 257197304618SKris Buschelman 0, 257297304618SKris Buschelman 0, 2573d519adbfSMatthew Knepley /* 79*/ 0, 257497304618SKris Buschelman 0, 257597304618SKris Buschelman 0, 257697304618SKris Buschelman 0, 25775bba2384SShri Abhyankar /* 83*/ MatLoad_SeqDense, 2578865e5f61SKris Buschelman 0, 25791cbb95d3SBarry Smith MatIsHermitian_SeqDense, 2580865e5f61SKris Buschelman 0, 2581865e5f61SKris Buschelman 0, 2582865e5f61SKris Buschelman 0, 2583d519adbfSMatthew Knepley /* 89*/ MatMatMult_SeqDense_SeqDense, 2584a9fe9ddaSSatish Balay MatMatMultSymbolic_SeqDense_SeqDense, 2585a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 2586abc3b08eSStefano Zampini MatPtAP_SeqDense_SeqDense, 2587abc3b08eSStefano Zampini MatPtAPSymbolic_SeqDense_SeqDense, 2588abc3b08eSStefano Zampini /* 94*/ MatPtAPNumeric_SeqDense_SeqDense, 258969f65d41SStefano Zampini MatMatTransposeMult_SeqDense_SeqDense, 259069f65d41SStefano Zampini MatMatTransposeMultSymbolic_SeqDense_SeqDense, 259169f65d41SStefano Zampini MatMatTransposeMultNumeric_SeqDense_SeqDense, 2592284134d9SBarry Smith 0, 2593d519adbfSMatthew Knepley /* 99*/ 0, 2594284134d9SBarry Smith 0, 2595284134d9SBarry Smith 0, 2596ba337c44SJed Brown MatConjugate_SeqDense, 2597f73d5cc4SBarry Smith 0, 2598ba337c44SJed Brown /*104*/ 0, 2599ba337c44SJed Brown MatRealPart_SeqDense, 2600ba337c44SJed Brown MatImaginaryPart_SeqDense, 2601985db425SBarry Smith 0, 2602985db425SBarry Smith 0, 26038208b9aeSStefano Zampini /*109*/ 0, 2604985db425SBarry Smith 0, 26058d0534beSBarry Smith MatGetRowMin_SeqDense, 2606aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 26073b49f96aSBarry Smith MatMissingDiagonal_SeqDense, 2608aabbc4fbSShri Abhyankar /*114*/ 0, 2609aabbc4fbSShri Abhyankar 0, 2610aabbc4fbSShri Abhyankar 0, 2611aabbc4fbSShri Abhyankar 0, 2612aabbc4fbSShri Abhyankar 0, 2613aabbc4fbSShri Abhyankar /*119*/ 0, 2614aabbc4fbSShri Abhyankar 0, 2615aabbc4fbSShri Abhyankar 0, 26160716a85fSBarry Smith 0, 26170716a85fSBarry Smith 0, 26180716a85fSBarry Smith /*124*/ 0, 26195df89d91SHong Zhang MatGetColumnNorms_SeqDense, 26205df89d91SHong Zhang 0, 26215df89d91SHong Zhang 0, 26225df89d91SHong Zhang 0, 26235df89d91SHong Zhang /*129*/ 0, 262475648e8dSHong Zhang MatTransposeMatMult_SeqDense_SeqDense, 262575648e8dSHong Zhang MatTransposeMatMultSymbolic_SeqDense_SeqDense, 262675648e8dSHong Zhang MatTransposeMatMultNumeric_SeqDense_SeqDense, 26273964eb88SJed Brown 0, 26283964eb88SJed Brown /*134*/ 0, 26293964eb88SJed Brown 0, 26303964eb88SJed Brown 0, 26313964eb88SJed Brown 0, 26323964eb88SJed Brown 0, 26333964eb88SJed Brown /*139*/ 0, 2634f9426fe0SMark Adams 0, 2635d528f656SJakub Kruzik 0, 2636d528f656SJakub Kruzik 0, 2637d528f656SJakub Kruzik 0, 2638d528f656SJakub Kruzik /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqDense 2639985db425SBarry Smith }; 264090ace30eSBarry Smith 26414b828684SBarry Smith /*@C 2642fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 2643d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 2644d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 2645289bc588SBarry Smith 2646d083f849SBarry Smith Collective 2647db81eaa0SLois Curfman McInnes 264820563c6bSBarry Smith Input Parameters: 2649db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 26500c775827SLois Curfman McInnes . m - number of rows 265118f449edSLois Curfman McInnes . n - number of columns 26520298fd71SBarry Smith - data - optional location of matrix data in column major order. Set data=NULL for PETSc 2653dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 265420563c6bSBarry Smith 265520563c6bSBarry Smith Output Parameter: 265644cd7ae7SLois Curfman McInnes . A - the matrix 265720563c6bSBarry Smith 2658b259b22eSLois Curfman McInnes Notes: 265918f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 266018f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 26610298fd71SBarry Smith set data=NULL. 266218f449edSLois Curfman McInnes 2663027ccd11SLois Curfman McInnes Level: intermediate 2664027ccd11SLois Curfman McInnes 266569b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues() 266620563c6bSBarry Smith @*/ 26677087cfbeSBarry Smith PetscErrorCode MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 2668289bc588SBarry Smith { 2669dfbe8321SBarry Smith PetscErrorCode ierr; 26703b2fbd54SBarry Smith 26713a40ed3dSBarry Smith PetscFunctionBegin; 2672f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 2673f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 2674273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 2675273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 2676273d9f13SBarry Smith PetscFunctionReturn(0); 2677273d9f13SBarry Smith } 2678273d9f13SBarry Smith 2679273d9f13SBarry Smith /*@C 2680273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 2681273d9f13SBarry Smith 2682d083f849SBarry Smith Collective 2683273d9f13SBarry Smith 2684273d9f13SBarry Smith Input Parameters: 26851c4f3114SJed Brown + B - the matrix 26860298fd71SBarry Smith - data - the array (or NULL) 2687273d9f13SBarry Smith 2688273d9f13SBarry Smith Notes: 2689273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 2690273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 2691284134d9SBarry Smith need not call this routine. 2692273d9f13SBarry Smith 2693273d9f13SBarry Smith Level: intermediate 2694273d9f13SBarry Smith 269569b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues(), MatSeqDenseSetLDA() 2696867c911aSBarry Smith 2697273d9f13SBarry Smith @*/ 26987087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 2699273d9f13SBarry Smith { 27004ac538c5SBarry Smith PetscErrorCode ierr; 2701a23d5eceSKris Buschelman 2702a23d5eceSKris Buschelman PetscFunctionBegin; 27034ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 2704a23d5eceSKris Buschelman PetscFunctionReturn(0); 2705a23d5eceSKris Buschelman } 2706a23d5eceSKris Buschelman 27077087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 2708a23d5eceSKris Buschelman { 2709273d9f13SBarry Smith Mat_SeqDense *b; 2710dfbe8321SBarry Smith PetscErrorCode ierr; 2711273d9f13SBarry Smith 2712273d9f13SBarry Smith PetscFunctionBegin; 2713273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 2714a868139aSShri Abhyankar 271534ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 271634ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 271734ef9618SShri Abhyankar 2718273d9f13SBarry Smith b = (Mat_SeqDense*)B->data; 271986d161a7SShri Abhyankar b->Mmax = B->rmap->n; 272086d161a7SShri Abhyankar b->Nmax = B->cmap->n; 272186d161a7SShri Abhyankar if (b->lda <= 0 || b->changelda) b->lda = B->rmap->n; 272286d161a7SShri Abhyankar 2723220afb94SBarry Smith ierr = PetscIntMultError(b->lda,b->Nmax,NULL);CHKERRQ(ierr); 27249e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 27259e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2726e92229d0SSatish Balay ierr = PetscCalloc1((size_t)b->lda*b->Nmax,&b->v);CHKERRQ(ierr); 27273bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 27282205254eSKarl Rupp 27299e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 2730273d9f13SBarry Smith } else { /* user-allocated storage */ 27319e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2732273d9f13SBarry Smith b->v = data; 2733273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2734273d9f13SBarry Smith } 27350450473dSBarry Smith B->assembled = PETSC_TRUE; 2736273d9f13SBarry Smith PetscFunctionReturn(0); 2737273d9f13SBarry Smith } 2738273d9f13SBarry Smith 273965b80a83SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2740cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_Elemental(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 27418baccfbdSHong Zhang { 2742d77f618aSHong Zhang Mat mat_elemental; 2743d77f618aSHong Zhang PetscErrorCode ierr; 27441683a169SBarry Smith const PetscScalar *array; 27451683a169SBarry Smith PetscScalar *v_colwise; 2746d77f618aSHong Zhang PetscInt M=A->rmap->N,N=A->cmap->N,i,j,k,*rows,*cols; 2747d77f618aSHong Zhang 27488baccfbdSHong Zhang PetscFunctionBegin; 2749d77f618aSHong Zhang ierr = PetscMalloc3(M*N,&v_colwise,M,&rows,N,&cols);CHKERRQ(ierr); 27501683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&array);CHKERRQ(ierr); 2751d77f618aSHong Zhang /* convert column-wise array into row-wise v_colwise, see MatSetValues_Elemental() */ 2752d77f618aSHong Zhang k = 0; 2753d77f618aSHong Zhang for (j=0; j<N; j++) { 2754d77f618aSHong Zhang cols[j] = j; 2755d77f618aSHong Zhang for (i=0; i<M; i++) { 2756d77f618aSHong Zhang v_colwise[j*M+i] = array[k++]; 2757d77f618aSHong Zhang } 2758d77f618aSHong Zhang } 2759d77f618aSHong Zhang for (i=0; i<M; i++) { 2760d77f618aSHong Zhang rows[i] = i; 2761d77f618aSHong Zhang } 27621683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&array);CHKERRQ(ierr); 2763d77f618aSHong Zhang 2764d77f618aSHong Zhang ierr = MatCreate(PetscObjectComm((PetscObject)A), &mat_elemental);CHKERRQ(ierr); 2765d77f618aSHong Zhang ierr = MatSetSizes(mat_elemental,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2766d77f618aSHong Zhang ierr = MatSetType(mat_elemental,MATELEMENTAL);CHKERRQ(ierr); 2767d77f618aSHong Zhang ierr = MatSetUp(mat_elemental);CHKERRQ(ierr); 2768d77f618aSHong Zhang 2769d77f618aSHong Zhang /* PETSc-Elemental interaface uses axpy for setting off-processor entries, only ADD_VALUES is allowed */ 2770d77f618aSHong Zhang ierr = MatSetValues(mat_elemental,M,rows,N,cols,v_colwise,ADD_VALUES);CHKERRQ(ierr); 2771d77f618aSHong Zhang ierr = MatAssemblyBegin(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2772d77f618aSHong Zhang ierr = MatAssemblyEnd(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2773d77f618aSHong Zhang ierr = PetscFree3(v_colwise,rows,cols);CHKERRQ(ierr); 2774d77f618aSHong Zhang 2775511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 277628be2f97SBarry Smith ierr = MatHeaderReplace(A,&mat_elemental);CHKERRQ(ierr); 2777d77f618aSHong Zhang } else { 2778d77f618aSHong Zhang *newmat = mat_elemental; 2779d77f618aSHong Zhang } 27808baccfbdSHong Zhang PetscFunctionReturn(0); 27818baccfbdSHong Zhang } 278265b80a83SHong Zhang #endif 27838baccfbdSHong Zhang 27841b807ce4Svictorle /*@C 27851b807ce4Svictorle MatSeqDenseSetLDA - Declare the leading dimension of the user-provided array 27861b807ce4Svictorle 27871b807ce4Svictorle Input parameter: 27881b807ce4Svictorle + A - the matrix 27891b807ce4Svictorle - lda - the leading dimension 27901b807ce4Svictorle 27911b807ce4Svictorle Notes: 2792867c911aSBarry Smith This routine is to be used in conjunction with MatSeqDenseSetPreallocation(); 27931b807ce4Svictorle it asserts that the preallocation has a leading dimension (the LDA parameter 27941b807ce4Svictorle of Blas and Lapack fame) larger than M, the first dimension of the matrix. 27951b807ce4Svictorle 27961b807ce4Svictorle Level: intermediate 27971b807ce4Svictorle 2798284134d9SBarry Smith .seealso: MatCreate(), MatCreateSeqDense(), MatSeqDenseSetPreallocation(), MatSetMaximumSize() 2799867c911aSBarry Smith 28001b807ce4Svictorle @*/ 28017087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetLDA(Mat B,PetscInt lda) 28021b807ce4Svictorle { 28031b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 280421a2c019SBarry Smith 28051b807ce4Svictorle PetscFunctionBegin; 2806e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 28071b807ce4Svictorle b->lda = lda; 280821a2c019SBarry Smith b->changelda = PETSC_FALSE; 280921a2c019SBarry Smith b->Mmax = PetscMax(b->Mmax,lda); 28101b807ce4Svictorle PetscFunctionReturn(0); 28111b807ce4Svictorle } 28121b807ce4Svictorle 2813d528f656SJakub Kruzik PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqDense(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 2814d528f656SJakub Kruzik { 2815d528f656SJakub Kruzik PetscErrorCode ierr; 2816d528f656SJakub Kruzik PetscMPIInt size; 2817d528f656SJakub Kruzik 2818d528f656SJakub Kruzik PetscFunctionBegin; 2819d528f656SJakub Kruzik ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 2820d528f656SJakub Kruzik if (size == 1) { 2821d528f656SJakub Kruzik if (scall == MAT_INITIAL_MATRIX) { 2822d528f656SJakub Kruzik ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 2823d528f656SJakub Kruzik } else { 2824d528f656SJakub Kruzik ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2825d528f656SJakub Kruzik } 2826d528f656SJakub Kruzik } else { 2827d528f656SJakub Kruzik ierr = MatCreateMPIMatConcatenateSeqMat_MPIDense(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 2828d528f656SJakub Kruzik } 2829d528f656SJakub Kruzik PetscFunctionReturn(0); 2830d528f656SJakub Kruzik } 2831d528f656SJakub Kruzik 28320bad9183SKris Buschelman /*MC 2833fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 28340bad9183SKris Buschelman 28350bad9183SKris Buschelman Options Database Keys: 28360bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 28370bad9183SKris Buschelman 28380bad9183SKris Buschelman Level: beginner 28390bad9183SKris Buschelman 284089665df3SBarry Smith .seealso: MatCreateSeqDense() 284189665df3SBarry Smith 28420bad9183SKris Buschelman M*/ 2843ca15aa20SStefano Zampini PetscErrorCode MatCreate_SeqDense(Mat B) 2844273d9f13SBarry Smith { 2845273d9f13SBarry Smith Mat_SeqDense *b; 2846dfbe8321SBarry Smith PetscErrorCode ierr; 28477c334f02SBarry Smith PetscMPIInt size; 2848273d9f13SBarry Smith 2849273d9f13SBarry Smith PetscFunctionBegin; 2850ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 2851e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 285255659b69SBarry Smith 2853b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 2854549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 285544cd7ae7SLois Curfman McInnes B->data = (void*)b; 285618f449edSLois Curfman McInnes 2857273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 28584e220ebcSLois Curfman McInnes 285949a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetLDA_C",MatDenseGetLDA_SeqDense);CHKERRQ(ierr); 2860bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArray_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 28618572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArray_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 2862d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDensePlaceArray_C",MatDensePlaceArray_SeqDense);CHKERRQ(ierr); 2863d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseResetArray_C",MatDenseResetArray_SeqDense);CHKERRQ(ierr); 28648572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayRead_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 2865715b7558SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayRead_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 2866bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqaij_C",MatConvert_SeqDense_SeqAIJ);CHKERRQ(ierr); 28678baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 28688baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_elemental_C",MatConvert_SeqDense_Elemental);CHKERRQ(ierr); 28698baccfbdSHong Zhang #endif 28702bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 28712bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqdensecuda_C",MatConvert_SeqDense_SeqDenseCUDA);CHKERRQ(ierr); 2872a4af7ca8SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaijcusparse_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 28732bf066beSStefano Zampini #endif 2874bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqDenseSetPreallocation_C",MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 2875bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaij_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 2876a4af7ca8SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) 2877a4af7ca8SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaijviennacl_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 2878a4af7ca8SStefano Zampini #endif 2879bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaij_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 2880bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaij_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 2881a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqbaij_seqdense_C",MatMatMult_SeqBAIJ_SeqDense);CHKERRQ(ierr); 2882a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqbaij_seqdense_C",MatMatMultSymbolic_SeqBAIJ_SeqDense);CHKERRQ(ierr); 2883a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqbaij_seqdense_C",MatMatMultNumeric_SeqBAIJ_SeqDense);CHKERRQ(ierr); 2884*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqsbaij_seqdense_C",MatMatMult_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 2885*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqsbaij_seqdense_C",MatMatMultSymbolic_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 2886*c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqsbaij_seqdense_C",MatMatMultNumeric_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 2887abc3b08eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_seqaij_seqdense_C",MatPtAP_SeqDense_SeqDense);CHKERRQ(ierr); 28884099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaijperm_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 28894099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijperm_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 28904099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijperm_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 28914099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_seqaijperm_seqdense_C",MatPtAP_SeqDense_SeqDense);CHKERRQ(ierr); 2892e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaijsell_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 2893e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijsell_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 2894e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijsell_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 2895e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_seqaijsell_seqdense_C",MatPtAP_SeqDense_SeqDense);CHKERRQ(ierr); 289696e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqaijmkl_seqdense_C",MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 289796e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijmkl_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 289896e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijmkl_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 289952c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_nest_seqdense_C",MatMatMult_Nest_Dense);CHKERRQ(ierr); 290052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_nest_seqdense_C",MatMatMultSymbolic_Nest_Dense);CHKERRQ(ierr); 290152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_nest_seqdense_C",MatMatMultNumeric_Nest_Dense);CHKERRQ(ierr); 290296e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_seqaijmkl_seqdense_C",MatPtAP_SeqDense_SeqDense);CHKERRQ(ierr); 290396e6d5c4SRichard Tran Mills 29043bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMult_seqaij_seqdense_C",MatTransposeMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 29053bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 29063bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaij_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 29074099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMult_seqaijperm_seqdense_C",MatTransposeMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 29084099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 29094099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 2910e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMult_seqaijsell_seqdense_C",MatTransposeMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 2911e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 2912e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 291396e6d5c4SRichard Tran Mills 291496e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMult_seqaijmkl_seqdense_C",MatTransposeMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 291596e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 291696e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 2917af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumn_C",MatDenseGetColumn_SeqDense);CHKERRQ(ierr); 2918af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumn_C",MatDenseRestoreColumn_SeqDense);CHKERRQ(ierr); 291917667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 29203a40ed3dSBarry Smith PetscFunctionReturn(0); 2921289bc588SBarry Smith } 292286aefd0dSHong Zhang 292386aefd0dSHong Zhang /*@C 2924af53bab2SHong Zhang MatDenseGetColumn - gives access to a column of a dense matrix. This is only the local part of the column. You MUST call MatDenseRestoreColumn() to avoid memory bleeding. 292586aefd0dSHong Zhang 292686aefd0dSHong Zhang Not Collective 292786aefd0dSHong Zhang 292886aefd0dSHong Zhang Input Parameter: 292986aefd0dSHong Zhang + mat - a MATSEQDENSE or MATMPIDENSE matrix 293086aefd0dSHong Zhang - col - column index 293186aefd0dSHong Zhang 293286aefd0dSHong Zhang Output Parameter: 293386aefd0dSHong Zhang . vals - pointer to the data 293486aefd0dSHong Zhang 293586aefd0dSHong Zhang Level: intermediate 293686aefd0dSHong Zhang 293786aefd0dSHong Zhang .seealso: MatDenseRestoreColumn() 293886aefd0dSHong Zhang @*/ 293986aefd0dSHong Zhang PetscErrorCode MatDenseGetColumn(Mat A,PetscInt col,PetscScalar **vals) 294086aefd0dSHong Zhang { 294186aefd0dSHong Zhang PetscErrorCode ierr; 294286aefd0dSHong Zhang 294386aefd0dSHong Zhang PetscFunctionBegin; 294486aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseGetColumn_C",(Mat,PetscInt,PetscScalar**),(A,col,vals));CHKERRQ(ierr); 294586aefd0dSHong Zhang PetscFunctionReturn(0); 294686aefd0dSHong Zhang } 294786aefd0dSHong Zhang 294886aefd0dSHong Zhang /*@C 294986aefd0dSHong Zhang MatDenseRestoreColumn - returns access to a column of a dense matrix which is returned by MatDenseGetColumn(). 295086aefd0dSHong Zhang 295186aefd0dSHong Zhang Not Collective 295286aefd0dSHong Zhang 295386aefd0dSHong Zhang Input Parameter: 295486aefd0dSHong Zhang . mat - a MATSEQDENSE or MATMPIDENSE matrix 295586aefd0dSHong Zhang 295686aefd0dSHong Zhang Output Parameter: 295786aefd0dSHong Zhang . vals - pointer to the data 295886aefd0dSHong Zhang 295986aefd0dSHong Zhang Level: intermediate 296086aefd0dSHong Zhang 296186aefd0dSHong Zhang .seealso: MatDenseGetColumn() 296286aefd0dSHong Zhang @*/ 296386aefd0dSHong Zhang PetscErrorCode MatDenseRestoreColumn(Mat A,PetscScalar **vals) 296486aefd0dSHong Zhang { 296586aefd0dSHong Zhang PetscErrorCode ierr; 296686aefd0dSHong Zhang 296786aefd0dSHong Zhang PetscFunctionBegin; 296886aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseRestoreColumn_C",(Mat,PetscScalar**),(A,vals));CHKERRQ(ierr); 296986aefd0dSHong Zhang PetscFunctionReturn(0); 297086aefd0dSHong Zhang } 2971