1 2 #include <petsc-private/matimpl.h> /*I "petscmat.h" I*/ 3 4 #undef __FUNCT__ 5 #define __FUNCT__ "MatAXPY" 6 /*@ 7 MatAXPY - Computes Y = a*X + Y. 8 9 Logically Collective on Mat 10 11 Input Parameters: 12 + a - the scalar multiplier 13 . X - the first matrix 14 . Y - the second matrix 15 - str - either SAME_NONZERO_PATTERN, DIFFERENT_NONZERO_PATTERN 16 or SUBSET_NONZERO_PATTERN (nonzeros of X is a subset of Y's) 17 18 Level: intermediate 19 20 .keywords: matrix, add 21 22 .seealso: MatAYPX() 23 @*/ 24 PetscErrorCode MatAXPY(Mat Y,PetscScalar a,Mat X,MatStructure str) 25 { 26 PetscErrorCode ierr; 27 PetscInt m1,m2,n1,n2; 28 29 PetscFunctionBegin; 30 PetscValidHeaderSpecific(X,MAT_CLASSID,3); 31 PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 32 PetscValidLogicalCollectiveScalar(Y,a,2); 33 ierr = MatGetSize(X,&m1,&n1);CHKERRQ(ierr); 34 ierr = MatGetSize(Y,&m2,&n2);CHKERRQ(ierr); 35 if (m1 != m2 || n1 != n2) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Non conforming matrix add: %D %D %D %D",m1,m2,n1,n2); 36 37 ierr = PetscLogEventBegin(MAT_AXPY,Y,0,0,0);CHKERRQ(ierr); 38 if (Y->ops->axpy) { 39 ierr = (*Y->ops->axpy)(Y,a,X,str);CHKERRQ(ierr); 40 } else { 41 ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 42 } 43 ierr = PetscLogEventEnd(MAT_AXPY,Y,0,0,0);CHKERRQ(ierr); 44 #if defined(PETSC_HAVE_CUSP) 45 if (Y->valid_GPU_matrix != PETSC_CUSP_UNALLOCATED) { 46 Y->valid_GPU_matrix = PETSC_CUSP_CPU; 47 } 48 #endif 49 #if defined(PETSC_HAVE_VIENNACL) 50 if (Y->valid_GPU_matrix != PETSC_VIENNACL_UNALLOCATED) { 51 Y->valid_GPU_matrix = PETSC_VIENNACL_CPU; 52 } 53 #endif 54 PetscFunctionReturn(0); 55 } 56 57 #undef __FUNCT__ 58 #define __FUNCT__ "MatAXPY_Basic" 59 PetscErrorCode MatAXPY_Basic(Mat Y,PetscScalar a,Mat X,MatStructure str) 60 { 61 PetscInt i,start,end,j,ncols,m,n; 62 PetscErrorCode ierr; 63 const PetscInt *row; 64 PetscScalar *val; 65 const PetscScalar *vals; 66 67 PetscFunctionBegin; 68 ierr = MatGetSize(X,&m,&n);CHKERRQ(ierr); 69 ierr = MatGetOwnershipRange(X,&start,&end);CHKERRQ(ierr); 70 if (a == 1.0) { 71 for (i = start; i < end; i++) { 72 ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 73 ierr = MatSetValues(Y,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 74 ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 75 } 76 } else { 77 ierr = PetscMalloc((n+1)*sizeof(PetscScalar),&val);CHKERRQ(ierr); 78 for (i=start; i<end; i++) { 79 ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 80 for (j=0; j<ncols; j++) { 81 val[j] = a*vals[j]; 82 } 83 ierr = MatSetValues(Y,1,&i,ncols,row,val,ADD_VALUES);CHKERRQ(ierr); 84 ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 85 } 86 ierr = PetscFree(val);CHKERRQ(ierr); 87 } 88 ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 89 ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 90 PetscFunctionReturn(0); 91 } 92 93 #undef __FUNCT__ 94 #define __FUNCT__ "MatAXPY_BasicWithPreallocation" 95 PetscErrorCode MatAXPY_BasicWithPreallocation(Mat B,Mat Y,PetscScalar a,Mat X,MatStructure str) 96 { 97 PetscInt i,start,end,j,ncols,m,n; 98 PetscErrorCode ierr; 99 const PetscInt *row; 100 PetscScalar *val; 101 const PetscScalar *vals; 102 103 PetscFunctionBegin; 104 ierr = MatGetSize(X,&m,&n);CHKERRQ(ierr); 105 ierr = MatGetOwnershipRange(X,&start,&end);CHKERRQ(ierr); 106 if (a == 1.0) { 107 for (i = start; i < end; i++) { 108 ierr = MatGetRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 109 ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 110 ierr = MatRestoreRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 111 112 ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 113 ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 114 ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 115 } 116 } else { 117 ierr = PetscMalloc((n+1)*sizeof(PetscScalar),&val);CHKERRQ(ierr); 118 for (i=start; i<end; i++) { 119 ierr = MatGetRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 120 ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 121 ierr = MatRestoreRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 122 123 ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 124 for (j=0; j<ncols; j++) { 125 val[j] = a*vals[j]; 126 } 127 ierr = MatSetValues(B,1,&i,ncols,row,val,ADD_VALUES);CHKERRQ(ierr); 128 ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 129 } 130 ierr = PetscFree(val);CHKERRQ(ierr); 131 } 132 ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 133 ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 134 PetscFunctionReturn(0); 135 } 136 137 #undef __FUNCT__ 138 #define __FUNCT__ "MatShift" 139 /*@ 140 MatShift - Computes Y = Y + a I, where a is a PetscScalar and I is the identity matrix. 141 142 Neighbor-wise Collective on Mat 143 144 Input Parameters: 145 + Y - the matrices 146 - a - the PetscScalar 147 148 Level: intermediate 149 150 .keywords: matrix, add, shift 151 152 .seealso: MatDiagonalSet() 153 @*/ 154 PetscErrorCode MatShift(Mat Y,PetscScalar a) 155 { 156 PetscErrorCode ierr; 157 PetscInt i,start,end; 158 159 PetscFunctionBegin; 160 PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 161 if (!Y->assembled) SETERRQ(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 162 if (Y->factortype) SETERRQ(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 163 MatCheckPreallocated(Y,1); 164 165 if (Y->ops->shift) { 166 ierr = (*Y->ops->shift)(Y,a);CHKERRQ(ierr); 167 } else { 168 PetscScalar alpha = a; 169 ierr = MatGetOwnershipRange(Y,&start,&end);CHKERRQ(ierr); 170 for (i=start; i<end; i++) { 171 ierr = MatSetValues(Y,1,&i,1,&i,&alpha,ADD_VALUES);CHKERRQ(ierr); 172 } 173 ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 174 ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 175 } 176 #if defined(PETSC_HAVE_CUSP) 177 if (Y->valid_GPU_matrix != PETSC_CUSP_UNALLOCATED) { 178 Y->valid_GPU_matrix = PETSC_CUSP_CPU; 179 } 180 #endif 181 #if defined(PETSC_HAVE_VIENNACL) 182 if (Y->valid_GPU_matrix != PETSC_VIENNACL_UNALLOCATED) { 183 Y->valid_GPU_matrix = PETSC_VIENNACL_CPU; 184 } 185 #endif 186 PetscFunctionReturn(0); 187 } 188 189 #undef __FUNCT__ 190 #define __FUNCT__ "MatDiagonalSet_Default" 191 PetscErrorCode MatDiagonalSet_Default(Mat Y,Vec D,InsertMode is) 192 { 193 PetscErrorCode ierr; 194 PetscInt i,start,end,vstart,vend; 195 PetscScalar *v; 196 197 PetscFunctionBegin; 198 ierr = VecGetOwnershipRange(D,&vstart,&vend);CHKERRQ(ierr); 199 ierr = MatGetOwnershipRange(Y,&start,&end);CHKERRQ(ierr); 200 if (vstart != start || vend != end) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Vector ownership range not compatible with matrix: %D %D vec %D %D mat",vstart,vend,start,end); 201 ierr = VecGetArray(D,&v);CHKERRQ(ierr); 202 for (i=start; i<end; i++) { 203 ierr = MatSetValues(Y,1,&i,1,&i,v+i-start,is);CHKERRQ(ierr); 204 } 205 ierr = VecRestoreArray(D,&v);CHKERRQ(ierr); 206 ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 207 ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 208 PetscFunctionReturn(0); 209 } 210 211 #undef __FUNCT__ 212 #define __FUNCT__ "MatDiagonalSet" 213 /*@ 214 MatDiagonalSet - Computes Y = Y + D, where D is a diagonal matrix 215 that is represented as a vector. Or Y[i,i] = D[i] if InsertMode is 216 INSERT_VALUES. 217 218 Input Parameters: 219 + Y - the input matrix 220 . D - the diagonal matrix, represented as a vector 221 - i - INSERT_VALUES or ADD_VALUES 222 223 Neighbor-wise Collective on Mat and Vec 224 225 Level: intermediate 226 227 .keywords: matrix, add, shift, diagonal 228 229 .seealso: MatShift() 230 @*/ 231 PetscErrorCode MatDiagonalSet(Mat Y,Vec D,InsertMode is) 232 { 233 PetscErrorCode ierr; 234 235 PetscFunctionBegin; 236 PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 237 PetscValidHeaderSpecific(D,VEC_CLASSID,2); 238 if (Y->ops->diagonalset) { 239 ierr = (*Y->ops->diagonalset)(Y,D,is);CHKERRQ(ierr); 240 } else { 241 ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 242 } 243 PetscFunctionReturn(0); 244 } 245 246 #undef __FUNCT__ 247 #define __FUNCT__ "MatAYPX" 248 /*@ 249 MatAYPX - Computes Y = a*Y + X. 250 251 Logically on Mat 252 253 Input Parameters: 254 + a - the PetscScalar multiplier 255 . Y - the first matrix 256 . X - the second matrix 257 - str - either SAME_NONZERO_PATTERN, DIFFERENT_NONZERO_PATTERN or SUBSET_NONZERO_PATTERN 258 259 Level: intermediate 260 261 .keywords: matrix, add 262 263 .seealso: MatAXPY() 264 @*/ 265 PetscErrorCode MatAYPX(Mat Y,PetscScalar a,Mat X,MatStructure str) 266 { 267 PetscScalar one = 1.0; 268 PetscErrorCode ierr; 269 PetscInt mX,mY,nX,nY; 270 271 PetscFunctionBegin; 272 PetscValidHeaderSpecific(X,MAT_CLASSID,3); 273 PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 274 PetscValidLogicalCollectiveScalar(Y,a,2); 275 ierr = MatGetSize(X,&mX,&nX);CHKERRQ(ierr); 276 ierr = MatGetSize(X,&mY,&nY);CHKERRQ(ierr); 277 if (mX != mY || nX != nY) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Non conforming matrices: %D %D first %D %D second",mX,mY,nX,nY); 278 279 ierr = MatScale(Y,a);CHKERRQ(ierr); 280 ierr = MatAXPY(Y,one,X,str);CHKERRQ(ierr); 281 PetscFunctionReturn(0); 282 } 283 284 #undef __FUNCT__ 285 #define __FUNCT__ "MatComputeExplicitOperator" 286 /*@ 287 MatComputeExplicitOperator - Computes the explicit matrix 288 289 Collective on Mat 290 291 Input Parameter: 292 . inmat - the matrix 293 294 Output Parameter: 295 . mat - the explict preconditioned operator 296 297 Notes: 298 This computation is done by applying the operators to columns of the 299 identity matrix. 300 301 Currently, this routine uses a dense matrix format when 1 processor 302 is used and a sparse format otherwise. This routine is costly in general, 303 and is recommended for use only with relatively small systems. 304 305 Level: advanced 306 307 .keywords: Mat, compute, explicit, operator 308 @*/ 309 PetscErrorCode MatComputeExplicitOperator(Mat inmat,Mat *mat) 310 { 311 Vec in,out; 312 PetscErrorCode ierr; 313 PetscInt i,m,n,M,N,*rows,start,end; 314 MPI_Comm comm; 315 PetscScalar *array,zero = 0.0,one = 1.0; 316 PetscMPIInt size; 317 318 PetscFunctionBegin; 319 PetscValidHeaderSpecific(inmat,MAT_CLASSID,1); 320 PetscValidPointer(mat,2); 321 322 ierr = PetscObjectGetComm((PetscObject)inmat,&comm);CHKERRQ(ierr); 323 ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 324 325 ierr = MatGetLocalSize(inmat,&m,&n);CHKERRQ(ierr); 326 ierr = MatGetSize(inmat,&M,&N);CHKERRQ(ierr); 327 ierr = MatGetVecs(inmat,&in,&out);CHKERRQ(ierr); 328 ierr = VecSetOption(in,VEC_IGNORE_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 329 ierr = VecGetOwnershipRange(out,&start,&end);CHKERRQ(ierr); 330 ierr = PetscMalloc(m*sizeof(PetscInt),&rows);CHKERRQ(ierr); 331 for (i=0; i<m; i++) rows[i] = start + i; 332 333 ierr = MatCreate(comm,mat);CHKERRQ(ierr); 334 ierr = MatSetSizes(*mat,m,n,M,N);CHKERRQ(ierr); 335 if (size == 1) { 336 ierr = MatSetType(*mat,MATSEQDENSE);CHKERRQ(ierr); 337 ierr = MatSeqDenseSetPreallocation(*mat,NULL);CHKERRQ(ierr); 338 } else { 339 ierr = MatSetType(*mat,MATMPIAIJ);CHKERRQ(ierr); 340 ierr = MatMPIAIJSetPreallocation(*mat,n,NULL,N-n,NULL);CHKERRQ(ierr); 341 } 342 343 for (i=0; i<N; i++) { 344 345 ierr = VecSet(in,zero);CHKERRQ(ierr); 346 ierr = VecSetValues(in,1,&i,&one,INSERT_VALUES);CHKERRQ(ierr); 347 ierr = VecAssemblyBegin(in);CHKERRQ(ierr); 348 ierr = VecAssemblyEnd(in);CHKERRQ(ierr); 349 350 ierr = MatMult(inmat,in,out);CHKERRQ(ierr); 351 352 ierr = VecGetArray(out,&array);CHKERRQ(ierr); 353 ierr = MatSetValues(*mat,m,rows,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 354 ierr = VecRestoreArray(out,&array);CHKERRQ(ierr); 355 356 } 357 ierr = PetscFree(rows);CHKERRQ(ierr); 358 ierr = VecDestroy(&out);CHKERRQ(ierr); 359 ierr = VecDestroy(&in);CHKERRQ(ierr); 360 ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 361 ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 362 PetscFunctionReturn(0); 363 } 364 365 /* Get the map xtoy which is used by MatAXPY() in the case of SUBSET_NONZERO_PATTERN */ 366 #undef __FUNCT__ 367 #define __FUNCT__ "MatAXPYGetxtoy_Private" 368 PetscErrorCode MatAXPYGetxtoy_Private(PetscInt m,PetscInt *xi,PetscInt *xj,PetscInt *xgarray, PetscInt *yi,PetscInt *yj,PetscInt *ygarray, PetscInt **xtoy) 369 { 370 PetscErrorCode ierr; 371 PetscInt row,i,nz,xcol,ycol,jx,jy,*x2y; 372 373 PetscFunctionBegin; 374 ierr = PetscMalloc(xi[m]*sizeof(PetscInt),&x2y);CHKERRQ(ierr); 375 i = 0; 376 for (row=0; row<m; row++) { 377 nz = xi[1] - xi[0]; 378 jy = 0; 379 for (jx=0; jx<nz; jx++,jy++) { 380 if (xgarray && ygarray) { 381 xcol = xgarray[xj[*xi + jx]]; 382 ycol = ygarray[yj[*yi + jy]]; 383 } else { 384 xcol = xj[*xi + jx]; 385 ycol = yj[*yi + jy]; /* col index for y */ 386 } 387 while (ycol < xcol) { 388 jy++; 389 if (ygarray) { 390 ycol = ygarray[yj[*yi + jy]]; 391 } else { 392 ycol = yj[*yi + jy]; 393 } 394 } 395 if (xcol != ycol) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"X matrix entry (%D,%D) is not in Y matrix",row,ycol); 396 x2y[i++] = *yi + jy; 397 } 398 xi++; yi++; 399 } 400 *xtoy = x2y; 401 PetscFunctionReturn(0); 402 } 403 404 #undef __FUNCT__ 405 #define __FUNCT__ "MatChop" 406 /*@ 407 MatChop - Set all values in the matrix less than the tolerance to zero 408 409 Input Parameters: 410 + A - The matrix 411 - tol - The zero tolerance 412 413 Output Parameters: 414 . A - The chopped matrix 415 416 Level: intermediate 417 418 .seealso: MatCreate(), MatZeroEntries() 419 @*/ 420 PetscErrorCode MatChop(Mat A, PetscReal tol) 421 { 422 PetscScalar *newVals; 423 PetscInt *newCols; 424 PetscInt rStart, rEnd, numRows, maxRows, r, colMax = 0; 425 PetscErrorCode ierr; 426 427 PetscFunctionBegin; 428 ierr = MatGetOwnershipRange(A, &rStart, &rEnd);CHKERRQ(ierr); 429 for (r = rStart; r < rEnd; ++r) { 430 PetscInt ncols; 431 432 ierr = MatGetRow(A, r, &ncols, NULL, NULL);CHKERRQ(ierr); 433 colMax = PetscMax(colMax, ncols);CHKERRQ(ierr); 434 ierr = MatRestoreRow(A, r, &ncols, NULL, NULL);CHKERRQ(ierr); 435 } 436 numRows = rEnd - rStart; 437 ierr = MPI_Allreduce(&numRows, &maxRows, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)A));CHKERRQ(ierr); 438 ierr = PetscMalloc2(colMax,PetscInt,&newCols,colMax,PetscScalar,&newVals);CHKERRQ(ierr); 439 for (r = rStart; r < rStart+maxRows; ++r) { 440 const PetscScalar *vals; 441 const PetscInt *cols; 442 PetscInt ncols, newcols, c; 443 444 if (r < rEnd) { 445 ierr = MatGetRow(A, r, &ncols, &cols, &vals);CHKERRQ(ierr); 446 for (c = 0; c < ncols; ++c) { 447 newCols[c] = cols[c]; 448 newVals[c] = PetscAbsScalar(vals[c]) < tol ? 0.0 : vals[c]; 449 } 450 newcols = ncols; 451 ierr = MatRestoreRow(A, r, &ncols, &cols, &vals);CHKERRQ(ierr); 452 ierr = MatSetValues(A, 1, &r, newcols, newCols, newVals, INSERT_VALUES);CHKERRQ(ierr); 453 } 454 ierr = MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 455 ierr = MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 456 } 457 ierr = PetscFree2(newCols,newVals);CHKERRQ(ierr); 458 PetscFunctionReturn(0); 459 } 460