xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 4e8208cbcbc709572b8abe32f33c78b69c819375)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19421480d9SBarry Smith MatGetDiagonalMarkers(SeqAIJ, 1)
20421480d9SBarry Smith 
MatSeqAIJSetTypeFromOptions(Mat A)21ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
22d71ae5a4SJacob Faibussowitsch {
234099cc6bSBarry Smith   PetscBool flg;
244099cc6bSBarry Smith   char      type[256];
254099cc6bSBarry Smith 
264099cc6bSBarry Smith   PetscFunctionBegin;
27d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
289566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
299566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
30d0609cedSBarry Smith   PetscOptionsEnd();
313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
324099cc6bSBarry Smith }
334099cc6bSBarry Smith 
MatGetColumnReductions_SeqAIJ(Mat A,PetscInt type,PetscReal * reductions)34ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
35d71ae5a4SJacob Faibussowitsch {
360716a85fSBarry Smith   PetscInt    i, m, n;
370716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
380716a85fSBarry Smith 
390716a85fSBarry Smith   PetscFunctionBegin;
409566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
419566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
420716a85fSBarry Smith   if (type == NORM_2) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_1) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
460716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
50857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
51ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
526adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
530716a85fSBarry Smith 
540716a85fSBarry Smith   if (type == NORM_2) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
56857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
57a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
580716a85fSBarry Smith   }
593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
600716a85fSBarry Smith }
610716a85fSBarry Smith 
MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS * is)62ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
63d71ae5a4SJacob Faibussowitsch {
643a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
653a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
663a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
673a062f41SBarry Smith   PetscInt       *rows;
683a062f41SBarry Smith 
693a062f41SBarry Smith   PetscFunctionBegin;
703a062f41SBarry Smith   for (i = 0; i < m; i++) {
71ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
723a062f41SBarry Smith   }
739566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
743a062f41SBarry Smith   cnt = 0;
753a062f41SBarry Smith   for (i = 0; i < m; i++) {
763a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
773a062f41SBarry Smith       rows[cnt] = i;
783a062f41SBarry Smith       cnt++;
793a062f41SBarry Smith     }
803a062f41SBarry Smith   }
819566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
833a062f41SBarry Smith }
843a062f41SBarry Smith 
MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt * nrows,PetscInt ** zrows)85d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
86d71ae5a4SJacob Faibussowitsch {
876ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
88fff043a9SJunchao Zhang   const MatScalar *aa;
896ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
90b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
916ce1633cSBarry Smith   PetscInt        *rows;
926ce1633cSBarry Smith 
936ce1633cSBarry Smith   PetscFunctionBegin;
949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
95421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL));
966ce1633cSBarry Smith   for (i = 0; i < m; i++) {
97ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
986ce1633cSBarry Smith   }
999566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
1006ce1633cSBarry Smith   cnt = 0;
1016ce1633cSBarry Smith   for (i = 0; i < m; i++) {
102ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1036ce1633cSBarry Smith   }
104f1f41ecbSJed Brown   *nrows = cnt;
105f1f41ecbSJed Brown   *zrows = rows;
1069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
108f1f41ecbSJed Brown }
109f1f41ecbSJed Brown 
MatFindZeroDiagonals_SeqAIJ(Mat A,IS * zrows)110ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
111d71ae5a4SJacob Faibussowitsch {
112f1f41ecbSJed Brown   PetscInt nrows, *rows;
113f1f41ecbSJed Brown 
114f1f41ecbSJed Brown   PetscFunctionBegin;
1150298fd71SBarry Smith   *zrows = NULL;
1169566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1179566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1196ce1633cSBarry Smith }
1206ce1633cSBarry Smith 
MatFindNonzeroRows_SeqAIJ(Mat A,IS * keptrows)121ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
122d71ae5a4SJacob Faibussowitsch {
123b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
124b3a44c85SBarry Smith   const MatScalar *aa;
125b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
126b3a44c85SBarry Smith   const PetscInt  *ii;
127b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
128b3a44c85SBarry Smith 
129b3a44c85SBarry Smith   PetscFunctionBegin;
1309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
131f4259b30SLisandro Dalcin   *keptrows = NULL;
132b3a44c85SBarry Smith   ii        = a->i;
133b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
134b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
135b3a44c85SBarry Smith     if (!n) {
136b3a44c85SBarry Smith       cnt++;
137b3a44c85SBarry Smith       goto ok1;
138b3a44c85SBarry Smith     }
1392e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
140b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
141b3a44c85SBarry Smith     }
142b3a44c85SBarry Smith     cnt++;
143b3a44c85SBarry Smith   ok1:;
144b3a44c85SBarry Smith   }
1452e5835c6SStefano Zampini   if (!cnt) {
1469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1473ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1482e5835c6SStefano Zampini   }
1499566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
150b3a44c85SBarry Smith   cnt = 0;
151b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
152b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
153b3a44c85SBarry Smith     if (!n) continue;
1542e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
155b3a44c85SBarry Smith       if (aa[j] != 0.0) {
156b3a44c85SBarry Smith         rows[cnt++] = i;
157b3a44c85SBarry Smith         break;
158b3a44c85SBarry Smith       }
159b3a44c85SBarry Smith     }
160b3a44c85SBarry Smith   }
1619566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1629566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
164b3a44c85SBarry Smith }
165b3a44c85SBarry Smith 
MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is)166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
167d71ae5a4SJacob Faibussowitsch {
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172421480d9SBarry Smith   PetscBool          diagDense;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
176421480d9SBarry Smith     PetscCall(MatGetDiagonalMarkers_SeqAIJ(Y, &diag, &diagDense));
177421480d9SBarry Smith     if (diagDense) {
1789566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1799566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18079299369SBarry Smith       if (is == INSERT_VALUES) {
181ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18279299369SBarry Smith       } else {
183ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18479299369SBarry Smith       }
1859566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1869566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1873ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18879299369SBarry Smith     }
18909f38230SBarry Smith   }
1909566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19209f38230SBarry Smith }
19379299369SBarry Smith 
MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * m,const PetscInt * ia[],const PetscInt * ja[],PetscBool * done)194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
195d71ae5a4SJacob Faibussowitsch {
196416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19797f1f81fSBarry Smith   PetscInt    i, ishift;
19817ab2063SBarry Smith 
1993a40ed3dSBarry Smith   PetscFunctionBegin;
200f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2013ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
202bfeeae90SHong Zhang   ishift = 0;
203b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2049566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
205bfeeae90SHong Zhang   } else if (oshift == 1) {
2061a83f524SJed Brown     PetscInt *tia;
207d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2089234b629SBarry Smith 
2093b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2109566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2111a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2121a83f524SJed Brown     *ia = tia;
213ecc77c7aSBarry Smith     if (ja) {
2141a83f524SJed Brown       PetscInt *tja;
2159234b629SBarry Smith 
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * n,const PetscInt * ia[],const PetscInt * ja[],PetscBool * done)227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * nn,const PetscInt * ia[],const PetscInt * ja[],PetscBool * done)238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * n,const PetscInt * ia[],const PetscInt * ja[],PetscBool * done)274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * nn,const PetscInt * ia[],const PetscInt * ja[],PetscInt * spidx[],PetscBool * done)289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt * n,const PetscInt * ia[],const PetscInt * ja[],PetscInt * spidx[],PetscBool * done)327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[])335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
497418fb43bSPierre Jolivet     PetscCall(PetscArraycpy(rp, in, n));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
500418fb43bSPierre Jolivet         PetscCall(PetscArraycpy(ap, v, n));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
MatSeqAIJSetTotalPreallocation(Mat A,PetscInt nztotal)531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5393a7d0413SPierre Jolivet   if (!a->imax) PetscCall(PetscMalloc1(A->rmap->n, &a->imax));
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
5479f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
5489f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
5499f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
55019b08ed1SBarry Smith   if (A->structure_only) {
55119b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55219b08ed1SBarry Smith   } else {
5539f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55419b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55519b08ed1SBarry Smith   }
5569f0612e4SBarry Smith   a->i[0]           = 0;
55719b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55819b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56019b08ed1SBarry Smith }
56119b08ed1SBarry Smith 
MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
563d71ae5a4SJacob Faibussowitsch {
564071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
565071fcb05SBarry Smith   PetscInt   *rp, k, row;
566071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
567071fcb05SBarry Smith   PetscInt   *aj = a->j;
568fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
569071fcb05SBarry Smith 
570071fcb05SBarry Smith   PetscFunctionBegin;
5719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
572071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
573071fcb05SBarry Smith     row = im[k];
5746bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
575071fcb05SBarry Smith     rp = aj + ai[row];
576071fcb05SBarry Smith     ap = aa + ai[row];
577418fb43bSPierre Jolivet     if (!A->was_assembled) PetscCall(PetscArraycpy(rp, in, n));
578071fcb05SBarry Smith     if (!A->structure_only) {
579071fcb05SBarry Smith       if (v) {
580418fb43bSPierre Jolivet         PetscCall(PetscArraycpy(ap, v, n));
581071fcb05SBarry Smith         v += n;
582071fcb05SBarry Smith       } else {
5839566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
584071fcb05SBarry Smith       }
585071fcb05SBarry Smith     }
586071fcb05SBarry Smith     ailen[row] = n;
587071fcb05SBarry Smith     a->nz += n;
588071fcb05SBarry Smith   }
5899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
591071fcb05SBarry Smith }
592071fcb05SBarry Smith 
MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[])593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
594d71ae5a4SJacob Faibussowitsch {
5957eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59697f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59797f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5984e208921SJed Brown   const MatScalar *ap, *aa;
5997eb43aa7SLois Curfman McInnes 
6003a40ed3dSBarry Smith   PetscFunctionBegin;
6014e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6027eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6037eb43aa7SLois Curfman McInnes     row = im[k];
6049371c9d4SSatish Balay     if (row < 0) {
6059371c9d4SSatish Balay       v += n;
6069371c9d4SSatish Balay       continue;
6079371c9d4SSatish Balay     } /* negative row */
60854c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6098e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6108e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6117eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6127eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6139371c9d4SSatish Balay       if (in[l] < 0) {
6149371c9d4SSatish Balay         v++;
6159371c9d4SSatish Balay         continue;
6169371c9d4SSatish Balay       } /* negative column */
61754c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
618bfeeae90SHong Zhang       col  = in[l];
6199371c9d4SSatish Balay       high = nrow;
6209371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6217eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6227eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6237eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6247eb43aa7SLois Curfman McInnes         else low = t;
6257eb43aa7SLois Curfman McInnes       }
6267eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6277eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6287eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
629b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6307eb43aa7SLois Curfman McInnes           goto finished;
6317eb43aa7SLois Curfman McInnes         }
6327eb43aa7SLois Curfman McInnes       }
63397e567efSBarry Smith       *v++ = 0.0;
6347eb43aa7SLois Curfman McInnes     finished:;
6357eb43aa7SLois Curfman McInnes     }
6367eb43aa7SLois Curfman McInnes   }
6374e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6397eb43aa7SLois Curfman McInnes }
6407eb43aa7SLois Curfman McInnes 
MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer)641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
642d71ae5a4SJacob Faibussowitsch {
6433ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
644c898d852SStefano Zampini   const PetscScalar *av;
6453ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6463ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64717ab2063SBarry Smith 
6483a40ed3dSBarry Smith   PetscFunctionBegin;
6499566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6502205254eSKarl Rupp 
6513ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6523ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6533ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6543ea6fe3dSLisandro Dalcin   nz = A->nz;
655416022c9SBarry Smith 
6563ea6fe3dSLisandro Dalcin   /* write matrix header */
6573ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6589371c9d4SSatish Balay   header[1] = M;
6599371c9d4SSatish Balay   header[2] = N;
6609371c9d4SSatish Balay   header[3] = nz;
6619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6649566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6653ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
666e457bb90SBarry Smith   if (PetscDefined(USE_DEBUG)) {
667e457bb90SBarry Smith     PetscInt mnz = 0;
668e457bb90SBarry Smith 
669e457bb90SBarry Smith     for (i = 0; i < m; i++) mnz += rowlens[i];
670e457bb90SBarry Smith     PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz);
671e457bb90SBarry Smith   }
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6743ea6fe3dSLisandro Dalcin   /* store column indices */
6759566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
676416022c9SBarry Smith   /* store nonzero values */
6779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6789566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
680b37d52dbSMark F. Adams 
6813ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6829566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68417ab2063SBarry Smith }
685416022c9SBarry Smith 
MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer)686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
687d71ae5a4SJacob Faibussowitsch {
6887dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6897dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6907dc0baabSHong Zhang 
6917dc0baabSHong Zhang   PetscFunctionBegin;
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6937dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6949566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69548a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6969566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6977dc0baabSHong Zhang   }
6989566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7007dc0baabSHong Zhang }
7017dc0baabSHong Zhang 
MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer)702ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
703d71ae5a4SJacob Faibussowitsch {
704416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
705c898d852SStefano Zampini   const PetscScalar *av;
70660e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
707e060cb09SBarry Smith   const char        *name;
708f3ef73ceSBarry Smith   PetscViewerFormat  format;
70917ab2063SBarry Smith 
7103a40ed3dSBarry Smith   PetscFunctionBegin;
7117dc0baabSHong Zhang   if (A->structure_only) {
7129566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7133ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7147dc0baabSHong Zhang   }
71543e49210SHong Zhang 
7169566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
717bd6a2ce3SJunchao Zhang   // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries
7183ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7192e5835c6SStefano Zampini 
720c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
72371c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72497f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
72560e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
726c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
727d00d2cf4SBarry Smith       nofinalvalue = 1;
728d00d2cf4SBarry Smith     }
7299566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7309566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
732fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
734fbfe6fa7SJed Brown #else
7359566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
736fbfe6fa7SJed Brown #endif
7379566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73817ab2063SBarry Smith 
73917ab2063SBarry Smith     for (i = 0; i < m; i++) {
74060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
741aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7429566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74317ab2063SBarry Smith #else
7449566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74517ab2063SBarry Smith #endif
74617ab2063SBarry Smith       }
74717ab2063SBarry Smith     }
748d00d2cf4SBarry Smith     if (nofinalvalue) {
749c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7509566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
751c337ccceSJed Brown #else
7529566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
753c337ccceSJed Brown #endif
754d00d2cf4SBarry Smith     }
7559566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7569566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7579566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
758fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76044cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7619566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
763aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76436db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7659566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76636db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7679566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76836db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7699566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7706831982aSBarry Smith         }
77144cd7ae7SLois Curfman McInnes #else
7729566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77344cd7ae7SLois Curfman McInnes #endif
77444cd7ae7SLois Curfman McInnes       }
7759566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77644cd7ae7SLois Curfman McInnes     }
7779566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
778fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
77997f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7809566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
782496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
783496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
785496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
786aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78736db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
788496be53dSLois Curfman McInnes #else
789496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
790496be53dSLois Curfman McInnes #endif
791496be53dSLois Curfman McInnes         }
792496be53dSLois Curfman McInnes       }
793496be53dSLois Curfman McInnes     }
7942e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7959566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7962e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7972205254eSKarl Rupp       if (i + 4 < m) {
7989566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7992205254eSKarl Rupp       } else if (i + 3 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8012205254eSKarl Rupp       } else if (i + 2 < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8032205254eSKarl Rupp       } else if (i + 1 < m) {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8052205254eSKarl Rupp       } else if (i < m) {
8069566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8072205254eSKarl Rupp       } else {
8089566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8092205254eSKarl Rupp       }
810496be53dSLois Curfman McInnes     }
8119566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8129566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
813496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8159566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
816496be53dSLois Curfman McInnes       }
8179566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
818496be53dSLois Curfman McInnes     }
8199566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
820496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82160e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
822496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
823aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82448a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
825496be53dSLois Curfman McInnes #else
8269566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
827496be53dSLois Curfman McInnes #endif
828496be53dSLois Curfman McInnes         }
829496be53dSLois Curfman McInnes       }
8309566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
831496be53dSLois Curfman McInnes     }
8329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
833fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
83497f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83587828ca2SBarry Smith     PetscScalar value;
83668f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83768f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83868f1ed48SBarry Smith 
83968f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84068f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84168f1ed48SBarry Smith         realonly = PETSC_FALSE;
84268f1ed48SBarry Smith         break;
84368f1ed48SBarry Smith       }
84468f1ed48SBarry Smith     }
84568f1ed48SBarry Smith #endif
84602594712SBarry Smith 
8479566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84802594712SBarry Smith     for (i = 0; i < m; i++) {
84902594712SBarry Smith       jcnt = 0;
850d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
851e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85202594712SBarry Smith           value = a->a[cnt++];
853e24b481bSBarry Smith           jcnt++;
85402594712SBarry Smith         } else {
85502594712SBarry Smith           value = 0.0;
85602594712SBarry Smith         }
857aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85868f1ed48SBarry Smith         if (realonly) {
8599566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86068f1ed48SBarry Smith         } else {
8619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86268f1ed48SBarry Smith         }
86302594712SBarry Smith #else
8649566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86502594712SBarry Smith #endif
86602594712SBarry Smith       }
8679566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86802594712SBarry Smith     }
8699566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8703c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
871150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8729566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8733c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8753c215bfdSMatthew Knepley #else
8769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8773c215bfdSMatthew Knepley #endif
8789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8793c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8813c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8829566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8833c215bfdSMatthew Knepley #else
8849566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8853c215bfdSMatthew Knepley #endif
8863c215bfdSMatthew Knepley       }
8873c215bfdSMatthew Knepley     }
8889566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8893a40ed3dSBarry Smith   } else {
8909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
891d5f3da31SBarry Smith     if (A->factortype) {
892421480d9SBarry Smith       const PetscInt *adiag;
893421480d9SBarry Smith 
894421480d9SBarry Smith       PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &adiag, NULL));
89516cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8969566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89716cd7e1dSShri Abhyankar         /* L part */
89860e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89916cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
90016cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9019566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
90216cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9039566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90416cd7e1dSShri Abhyankar           } else {
9059566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90616cd7e1dSShri Abhyankar           }
90716cd7e1dSShri Abhyankar #else
9089566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90916cd7e1dSShri Abhyankar #endif
91016cd7e1dSShri Abhyankar         }
91116cd7e1dSShri Abhyankar         /* diagonal */
912421480d9SBarry Smith         j = adiag[i];
91316cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91416cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
915835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j])));
91616cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
917835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j]))));
91816cd7e1dSShri Abhyankar         } else {
919835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j])));
92016cd7e1dSShri Abhyankar         }
92116cd7e1dSShri Abhyankar #else
922835f2295SStefano Zampini         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j])));
92316cd7e1dSShri Abhyankar #endif
92416cd7e1dSShri Abhyankar 
92516cd7e1dSShri Abhyankar         /* U part */
926421480d9SBarry Smith         for (j = adiag[i + 1] + 1; j < adiag[i]; j++) {
92716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92816cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9299566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
93016cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9319566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
93216cd7e1dSShri Abhyankar           } else {
9339566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93416cd7e1dSShri Abhyankar           }
93516cd7e1dSShri Abhyankar #else
9369566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93716cd7e1dSShri Abhyankar #endif
93816cd7e1dSShri Abhyankar         }
9399566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
94016cd7e1dSShri Abhyankar       }
94116cd7e1dSShri Abhyankar     } else {
94217ab2063SBarry Smith       for (i = 0; i < m; i++) {
9439566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94460e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
945aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94636db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9479566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94836db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9499566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9503a40ed3dSBarry Smith           } else {
9519566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
95217ab2063SBarry Smith           }
95317ab2063SBarry Smith #else
9549566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95517ab2063SBarry Smith #endif
95617ab2063SBarry Smith         }
9579566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95817ab2063SBarry Smith       }
95916cd7e1dSShri Abhyankar     }
9609566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
96117ab2063SBarry Smith   }
9629566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
964416022c9SBarry Smith }
965416022c9SBarry Smith 
9669804daf3SBarry Smith #include <petscdraw.h>
MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void * Aa)967ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
968d71ae5a4SJacob Faibussowitsch {
969480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
970416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
971383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
972383922c3SLisandro Dalcin   int                color;
973b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
974b0a32e0cSBarry Smith   PetscViewer        viewer;
975f3ef73ceSBarry Smith   PetscViewerFormat  format;
976fff043a9SJunchao Zhang   const PetscScalar *aa;
977cddf8d76SBarry Smith 
9783a40ed3dSBarry Smith   PetscFunctionBegin;
9799566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9809566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9819566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
982383922c3SLisandro Dalcin 
983416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
985fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
986d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9870513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
988b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
989416022c9SBarry Smith     for (i = 0; i < m; i++) {
9909371c9d4SSatish Balay       y_l = m - i - 1.0;
9919371c9d4SSatish Balay       y_r = y_l + 1.0;
992bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9939371c9d4SSatish Balay         x_l = a->j[j];
9949371c9d4SSatish Balay         x_r = x_l + 1.0;
995fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9969566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
997cddf8d76SBarry Smith       }
998cddf8d76SBarry Smith     }
999b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
1000cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10019371c9d4SSatish Balay       y_l = m - i - 1.0;
10029371c9d4SSatish Balay       y_r = y_l + 1.0;
1003bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10049371c9d4SSatish Balay         x_l = a->j[j];
10059371c9d4SSatish Balay         x_r = x_l + 1.0;
1006fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10079566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1008cddf8d76SBarry Smith       }
1009cddf8d76SBarry Smith     }
1010b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1011cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10129371c9d4SSatish Balay       y_l = m - i - 1.0;
10139371c9d4SSatish Balay       y_r = y_l + 1.0;
1014bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10159371c9d4SSatish Balay         x_l = a->j[j];
10169371c9d4SSatish Balay         x_r = x_l + 1.0;
1017fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10189566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1019416022c9SBarry Smith       }
1020416022c9SBarry Smith     }
1021d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10220513a670SBarry Smith   } else {
10230513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10240513a670SBarry Smith     /* first determine max of all nonzero values */
1025b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1026383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1027b0a32e0cSBarry Smith     PetscDraw popup;
10280513a670SBarry Smith 
10290513a670SBarry Smith     for (i = 0; i < nz; i++) {
1030fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10310513a670SBarry Smith     }
1032383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10339566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10349566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1035383922c3SLisandro Dalcin 
1036d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10370513a670SBarry Smith     for (i = 0; i < m; i++) {
1038383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1039383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1040bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1041383922c3SLisandro Dalcin         x_l   = a->j[j];
1042383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1043fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10449566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10450513a670SBarry Smith         count++;
10460513a670SBarry Smith       }
10470513a670SBarry Smith     }
1048d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10490513a670SBarry Smith   }
10509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1052480ef9eaSBarry Smith }
1053cddf8d76SBarry Smith 
10549804daf3SBarry Smith #include <petscdraw.h>
MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer)1055ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1056d71ae5a4SJacob Faibussowitsch {
1057b0a32e0cSBarry Smith   PetscDraw draw;
105836db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1059ace3abfcSBarry Smith   PetscBool isnull;
1060480ef9eaSBarry Smith 
1061480ef9eaSBarry Smith   PetscFunctionBegin;
10629566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10639566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10643ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1065480ef9eaSBarry Smith 
10669371c9d4SSatish Balay   xr = A->cmap->n;
10679371c9d4SSatish Balay   yr = A->rmap->n;
10689371c9d4SSatish Balay   h  = yr / 10.0;
10699371c9d4SSatish Balay   w  = xr / 10.0;
10709371c9d4SSatish Balay   xr += w;
10719371c9d4SSatish Balay   yr += h;
10729371c9d4SSatish Balay   xl = -w;
10739371c9d4SSatish Balay   yl = -h;
10749566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10759566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10769566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10779566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10789566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1080416022c9SBarry Smith }
1081416022c9SBarry Smith 
MatView_SeqAIJ(Mat A,PetscViewer viewer)1082d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1083d71ae5a4SJacob Faibussowitsch {
10849f196a02SMartin Diehl   PetscBool isascii, isbinary, isdraw;
1085416022c9SBarry Smith 
10863a40ed3dSBarry Smith   PetscFunctionBegin;
10879f196a02SMartin Diehl   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii));
10889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10899566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10909f196a02SMartin Diehl   if (isascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10911baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10921baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10939566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109517ab2063SBarry Smith }
109619bcc07fSBarry Smith 
MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode)1097d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1098d71ae5a4SJacob Faibussowitsch {
1099416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1100580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
110107425a8dSBarry Smith   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0;
110254f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11033447b6efSHong Zhang   PetscReal   ratio = 0.6;
110417ab2063SBarry Smith 
11053a40ed3dSBarry Smith   PetscFunctionBegin;
11063ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
1107b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
110855a7f34eSJunchao Zhang     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies, e.g., via MatSetOption(A, MAT_USE_INODES, val) */
110955a7f34eSJunchao Zhang     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); /* read the sparsity pattern */
11103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1111b215bc84SStefano Zampini   }
111217ab2063SBarry Smith 
111343ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111417ab2063SBarry Smith   for (i = 1; i < m; i++) {
1115416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111617ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111794a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111817ab2063SBarry Smith     if (fshift) {
1119bfeeae90SHong Zhang       ip = aj + ai[i];
1120bfeeae90SHong Zhang       ap = aa + ai[i];
112117ab2063SBarry Smith       N  = ailen[i];
11229566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112348a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112417ab2063SBarry Smith     }
112517ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112617ab2063SBarry Smith   }
112717ab2063SBarry Smith   if (m) {
112817ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112917ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
113017ab2063SBarry Smith   }
113117ab2063SBarry Smith   /* reset ilen and imax for each row */
11327b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1133396832f4SHong Zhang   if (A->structure_only) {
11349566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11359566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1136396832f4SHong Zhang   } else { /* !A->structure_only */
113717ab2063SBarry Smith     for (i = 0; i < m; i++) {
113817ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11397b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
114017ab2063SBarry Smith     }
1141396832f4SHong Zhang   }
1142bfeeae90SHong Zhang   a->nz = ai[m];
1143aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
11449566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11459566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11469566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11472205254eSKarl Rupp 
11488e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1149dd5f02e7SSatish Balay   a->reallocs         = 0;
11506712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115136db0b34SBarry Smith   a->rmax             = rmax;
11524e220ebcSLois Curfman McInnes 
115348a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11549566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115617ab2063SBarry Smith }
115717ab2063SBarry Smith 
MatRealPart_SeqAIJ(Mat A)1158ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1159d71ae5a4SJacob Faibussowitsch {
116099cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116199cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11622e5835c6SStefano Zampini   MatScalar  *aa;
116399cafbc1SBarry Smith 
116499cafbc1SBarry Smith   PetscFunctionBegin;
11659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116699cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
116999cafbc1SBarry Smith }
117099cafbc1SBarry Smith 
MatImaginaryPart_SeqAIJ(Mat A)1171ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1172d71ae5a4SJacob Faibussowitsch {
117399cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117499cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11752e5835c6SStefano Zampini   MatScalar  *aa;
117699cafbc1SBarry Smith 
117799cafbc1SBarry Smith   PetscFunctionBegin;
11789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117999cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
118299cafbc1SBarry Smith }
118399cafbc1SBarry Smith 
MatZeroEntries_SeqAIJ(Mat A)1184d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1185d71ae5a4SJacob Faibussowitsch {
1186fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1187fff043a9SJunchao Zhang   MatScalar  *aa;
11883a40ed3dSBarry Smith 
11893a40ed3dSBarry Smith   PetscFunctionBegin;
11909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11919566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119417ab2063SBarry Smith }
1195416022c9SBarry Smith 
MatReset_SeqAIJ(Mat A)1196674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A)
1197d71ae5a4SJacob Faibussowitsch {
1198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1199d5d45c9bSBarry Smith 
12003a40ed3dSBarry Smith   PetscFunctionBegin;
1201b4e2f619SBarry Smith   if (A->hash_active) {
1202e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1203b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1204b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1205b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1206b4e2f619SBarry Smith   }
1207b4e2f619SBarry Smith 
12083ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12099566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12109566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12119566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12129566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12139566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12149566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12159566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12169566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12179566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12189566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12199566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
1221820d003aSStefano Zampini   a->compressedrow.use = PETSC_FALSE;
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12239566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
1224674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1225674b392bSAlexander }
1226674b392bSAlexander 
MatResetHash_SeqAIJ(Mat A)1227674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A)
1228674b392bSAlexander {
1229674b392bSAlexander   PetscFunctionBegin;
1230674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
1231674b392bSAlexander   PetscCall(MatCreate_SeqAIJ_Inode(A));
1232674b392bSAlexander   PetscCall(MatSetUp_Seq_Hash(A));
1233674b392bSAlexander   A->nonzerostate++;
1234674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1235674b392bSAlexander }
1236674b392bSAlexander 
MatDestroy_SeqAIJ(Mat A)1237674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1238674b392bSAlexander {
1239674b392bSAlexander   PetscFunctionBegin;
1240674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
12419566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1242901853e0SKris Buschelman 
12436718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12446718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12456718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12466718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12476718818eSStefano Zampini      due to different matrix sizes */
12489566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12496718818eSStefano Zampini 
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12512e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12522e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12592e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12602e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12612e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12622e956fe4SStefano Zampini #endif
12634222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12674222ddf1SHong Zhang #endif
1268d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1269d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1270d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1271d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1272d5e393b6SSuyash Tandon #endif
12733d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12753d0639e7SStefano Zampini #endif
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1277af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1279af8000cdSHong Zhang #endif
1280d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1282d24d4204SJose E. Roman #endif
128363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
128663c07aadSStefano Zampini #endif
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12912e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
1294674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL));
12959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12979566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
13009566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
13019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
13029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
13032e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
13042e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
13052e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
13062e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
13072e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
13082e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
13092e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
13103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
131117ab2063SBarry Smith }
131217ab2063SBarry Smith 
MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg)1313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1314d71ae5a4SJacob Faibussowitsch {
1315416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13163a40ed3dSBarry Smith 
13173a40ed3dSBarry Smith   PetscFunctionBegin;
1318a65d3064SKris Buschelman   switch (op) {
1319d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1320d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1321d71ae5a4SJacob Faibussowitsch     break;
1322d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1323d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1324d71ae5a4SJacob Faibussowitsch     break;
1325d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1326d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1327d71ae5a4SJacob Faibussowitsch     break;
1328d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1329d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1330d71ae5a4SJacob Faibussowitsch     break;
1331d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1332d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1333d71ae5a4SJacob Faibussowitsch     break;
1334d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1335d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1336d71ae5a4SJacob Faibussowitsch     break;
1337d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1338d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1339d71ae5a4SJacob Faibussowitsch     break;
1340d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1341d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1342d71ae5a4SJacob Faibussowitsch     break;
1343d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1344d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1345d71ae5a4SJacob Faibussowitsch     break;
1346071fcb05SBarry Smith   case MAT_SORTED_FULL:
1347071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1348071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1349071fcb05SBarry Smith     break;
1350d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1351d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1352d71ae5a4SJacob Faibussowitsch     break;
1353d71ae5a4SJacob Faibussowitsch   default:
1354888c827cSStefano Zampini     break;
1355a65d3064SKris Buschelman   }
13563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
135717ab2063SBarry Smith }
135817ab2063SBarry Smith 
MatGetDiagonal_SeqAIJ(Mat A,Vec v)13599ee18893SBarry Smith PETSC_INTERN PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1360d71ae5a4SJacob Faibussowitsch {
1361416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1362421480d9SBarry Smith   PetscInt           n, *ai = a->i;
1363c898d852SStefano Zampini   PetscScalar       *x;
1364c898d852SStefano Zampini   const PetscScalar *aa;
1365421480d9SBarry Smith   const PetscInt    *diag;
1366421480d9SBarry Smith   PetscBool          diagDense;
136717ab2063SBarry Smith 
13683a40ed3dSBarry Smith   PetscFunctionBegin;
13699566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1372d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1373421480d9SBarry Smith     PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL));
13749566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
1375421480d9SBarry Smith     for (PetscInt i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13769566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13779566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13783ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
137935e7444dSHong Zhang   }
138035e7444dSHong Zhang 
1381421480d9SBarry Smith   PetscCheck(A->factortype == MAT_FACTOR_NONE, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Not for factor matrices that are not ILU or LU");
1382421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense));
13839566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
1384421480d9SBarry Smith   if (diagDense) {
1385421480d9SBarry Smith     for (PetscInt i = 0; i < n; i++) x[i] = aa[diag[i]];
1386421480d9SBarry Smith   } else {
1387421480d9SBarry Smith     for (PetscInt i = 0; i < n; i++) x[i] = (diag[i] == ai[i + 1]) ? 0.0 : aa[diag[i]];
138817ab2063SBarry Smith   }
13899566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139217ab2063SBarry Smith }
139317ab2063SBarry Smith 
1394c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy)1395d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1396d71ae5a4SJacob Faibussowitsch {
1397416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
13985f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1399d9ca1df4SBarry Smith   PetscScalar       *y;
1400d9ca1df4SBarry Smith   const PetscScalar *x;
1401d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14025c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14035f22a7b3SSebastian Grimberg   const MatScalar  *v;
1404a77337e4SBarry Smith   PetscScalar       alpha;
1405d9ca1df4SBarry Smith   PetscInt          n, i, j;
1406d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14073447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1408ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14095c897100SBarry Smith #endif
141017ab2063SBarry Smith 
14113a40ed3dSBarry Smith   PetscFunctionBegin;
14129566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14139566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14149566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14165c897100SBarry Smith 
14175c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1418fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14195c897100SBarry Smith #else
14203447b6efSHong Zhang   if (usecprow) {
14213447b6efSHong Zhang     m    = cprow.nrows;
14223447b6efSHong Zhang     ii   = cprow.i;
14237b2bb3b9SHong Zhang     ridx = cprow.rindex;
14243447b6efSHong Zhang   } else {
14253447b6efSHong Zhang     ii = a->i;
14263447b6efSHong Zhang   }
142717ab2063SBarry Smith   for (i = 0; i < m; i++) {
14283447b6efSHong Zhang     idx = a->j + ii[i];
1429fff043a9SJunchao Zhang     v   = aa + ii[i];
14303447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14313447b6efSHong Zhang     if (usecprow) {
14327b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14333447b6efSHong Zhang     } else {
143417ab2063SBarry Smith       alpha = x[i];
14353447b6efSHong Zhang     }
143604fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143717ab2063SBarry Smith   }
14385c897100SBarry Smith #endif
14399566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14409566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14419566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144417ab2063SBarry Smith }
144517ab2063SBarry Smith 
MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy)1446d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1447d71ae5a4SJacob Faibussowitsch {
14485c897100SBarry Smith   PetscFunctionBegin;
14499566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14509566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14525c897100SBarry Smith }
14535c897100SBarry Smith 
1454c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145578b84d54SShri Abhyankar 
MatMult_SeqAIJ(Mat A,Vec xx,Vec yy)1456d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1457d71ae5a4SJacob Faibussowitsch {
1458416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1459d9fead3dSBarry Smith   PetscScalar       *y;
146054f21887SBarry Smith   const PetscScalar *x;
14615914357eSBarry Smith   const MatScalar   *a_a;
1462003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14635914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1464ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146517ab2063SBarry Smith 
1466b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146797952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1468fee21e36SBarry Smith #endif
1469fee21e36SBarry Smith 
14703a40ed3dSBarry Smith   PetscFunctionBegin;
1471b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14729566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14733ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1474b215bc84SStefano Zampini   }
14759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14769566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14779566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1478416022c9SBarry Smith   ii = a->i;
14794eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14809566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148197952fefSHong Zhang     m    = a->compressedrow.nrows;
148297952fefSHong Zhang     ii   = a->compressedrow.i;
148397952fefSHong Zhang     ridx = a->compressedrow.rindex;
14845914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14855914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14865914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14875914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14885914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
14895914357eSBarry Smith       PetscScalar        sum = 0.0;
1490003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1491003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1492c9a1b032SJunchao Zhang       y[ridx[i]] = sum;
149397952fefSHong Zhang     }
149497952fefSHong Zhang   } else { /* do not use compressed row format */
1495b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14965914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1497b05257ddSBarry Smith #else
14985914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14995914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
15005914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
15015914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
15025914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15035914357eSBarry Smith       PetscScalar        sum = 0.0;
1504003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150517ab2063SBarry Smith       y[i] = sum;
150617ab2063SBarry Smith     }
15078d195f9aSBarry Smith #endif
1508b05257ddSBarry Smith   }
15099566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15109566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15119566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151417ab2063SBarry Smith }
151517ab2063SBarry Smith 
1516ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy)1517ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1518d71ae5a4SJacob Faibussowitsch {
1519b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1520b434eb95SMatthew G. Knepley   PetscScalar       *y;
1521b434eb95SMatthew G. Knepley   const PetscScalar *x;
1522fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1523b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1524b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1525b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1526b434eb95SMatthew G. Knepley   PetscScalar        sum;
1527b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1528b434eb95SMatthew G. Knepley 
1529b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1530b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1531b434eb95SMatthew G. Knepley #endif
1532b434eb95SMatthew G. Knepley 
1533b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15359566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15369566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1537b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1538b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1539b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1540b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1541b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1542b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1543b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1544fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1545b434eb95SMatthew G. Knepley       sum = 0.0;
1546b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1547b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1548b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1549b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1550b434eb95SMatthew G. Knepley     }
1551b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15523d3eaba7SBarry Smith     ii = a->i;
1553b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1554b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1555b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1556fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1557b434eb95SMatthew G. Knepley       sum = 0.0;
1558b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1559b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1560b434eb95SMatthew G. Knepley       y[i] = sum;
1561b434eb95SMatthew G. Knepley     }
1562b434eb95SMatthew G. Knepley   }
15639566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15649566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15659566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1568b434eb95SMatthew G. Knepley }
1569b434eb95SMatthew G. Knepley 
1570ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz)1571ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1572d71ae5a4SJacob Faibussowitsch {
1573b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1574b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1575b434eb95SMatthew G. Knepley   const PetscScalar *x;
1576fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1577b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1578b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1579b434eb95SMatthew G. Knepley   PetscScalar        sum;
1580b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1581b434eb95SMatthew G. Knepley 
1582b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15849566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15859566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1586b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158748a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1588b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1589b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1590b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1591b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1592b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1593b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1594fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1595b434eb95SMatthew G. Knepley       sum = y[*ridx];
1596b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1597b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1598b434eb95SMatthew G. Knepley     }
1599b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16003d3eaba7SBarry Smith     ii = a->i;
1601b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1602b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1603b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1604fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1605b434eb95SMatthew G. Knepley       sum = y[i];
1606b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1607b434eb95SMatthew G. Knepley       z[i] = sum;
1608b434eb95SMatthew G. Knepley     }
1609b434eb95SMatthew G. Knepley   }
16109566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16119566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1615b434eb95SMatthew G. Knepley }
1616b434eb95SMatthew G. Knepley 
1617c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz)1618d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1619d71ae5a4SJacob Faibussowitsch {
1620416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1621f15663dcSBarry Smith   PetscScalar       *y, *z;
1622f15663dcSBarry Smith   const PetscScalar *x;
16235914357eSBarry Smith   const MatScalar   *a_a;
16245914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16255914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1626ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16279ea0dfa2SSatish Balay 
16283a40ed3dSBarry Smith   PetscFunctionBegin;
1629b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16309566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16313ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1632b215bc84SStefano Zampini   }
16339566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16349566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16359566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16364eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
163748a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
163897952fefSHong Zhang     m    = a->compressedrow.nrows;
163997952fefSHong Zhang     ii   = a->compressedrow.i;
164097952fefSHong Zhang     ridx = a->compressedrow.rindex;
16415914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16425914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16435914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16445914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16455914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1646f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
164797952fefSHong Zhang       z[*ridx++] = sum;
164897952fefSHong Zhang     }
164997952fefSHong Zhang   } else { /* do not use compressed row format */
16503d3eaba7SBarry Smith     ii = a->i;
1651f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16525914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1653f15663dcSBarry Smith #else
16545914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16555914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16565914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16575914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16585914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16595914357eSBarry Smith       PetscScalar        sum = y[i];
1660f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166117ab2063SBarry Smith       z[i] = sum;
166217ab2063SBarry Smith     }
166302ab625aSSatish Balay #endif
1664f15663dcSBarry Smith   }
16659566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16669566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16679566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167017ab2063SBarry Smith }
167117ab2063SBarry Smith 
MatShift_SeqAIJ(Mat A,PetscScalar v)1672ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1673d71ae5a4SJacob Faibussowitsch {
167461ecd0c6SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
1675421480d9SBarry Smith   const PetscInt *diag;
167661ecd0c6SBarry Smith   const PetscInt *ii = (const PetscInt *)a->i;
1677421480d9SBarry Smith   PetscBool       diagDense;
167861ecd0c6SBarry Smith 
167961ecd0c6SBarry Smith   PetscFunctionBegin;
168061ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
16819566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
16829566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
16833ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
168461ecd0c6SBarry Smith   }
168561ecd0c6SBarry Smith 
1686421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense));
1687421480d9SBarry Smith   if (diagDense) {
16889234b629SBarry Smith     PetscScalar *Aa;
16899234b629SBarry Smith 
16909234b629SBarry Smith     PetscCall(MatSeqAIJGetArray(A, &Aa));
16919234b629SBarry Smith     for (PetscInt i = 0; i < A->rmap->n; i++) Aa[diag[i]] += v;
16929234b629SBarry Smith     PetscCall(MatSeqAIJRestoreArray(A, &Aa));
169361ecd0c6SBarry Smith   } else {
1694b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1695b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
16969f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
16976ea2a7edSJunchao Zhang     const PetscScalar *Aa;
169807425a8dSBarry Smith     PetscInt          *mdiag = NULL;
16996ea2a7edSJunchao Zhang 
170007425a8dSBarry Smith     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
170107425a8dSBarry Smith     for (PetscInt i = 0; i < A->rmap->n; i++) {
170207425a8dSBarry Smith       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
170307425a8dSBarry Smith         mdiag[i] = 1;
170407425a8dSBarry Smith       }
170507425a8dSBarry Smith     }
17066ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17076ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
170861ecd0c6SBarry Smith 
170961ecd0c6SBarry Smith     a->a = NULL;
171061ecd0c6SBarry Smith     a->j = NULL;
171161ecd0c6SBarry Smith     a->i = NULL;
171261ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
171307425a8dSBarry Smith     for (PetscInt i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17149566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
171561ecd0c6SBarry Smith 
171661ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
171707425a8dSBarry Smith     for (PetscInt i = 0; i < A->rmap->n; i++) {
17189566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
171948a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1720447d62f5SStefano Zampini     }
17219566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17229566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
17239f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
17249f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
17259f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
17269566063dSJacob Faibussowitsch     PetscCall(PetscFree(mdiag));
1727be5855fcSBarry Smith   }
17283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1729be5855fcSBarry Smith }
1730be5855fcSBarry Smith 
17310da83c2eSBarry Smith #include <petscblaslapack.h>
17320da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17330da83c2eSBarry Smith 
17340da83c2eSBarry Smith /*
17350da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
17360da83c2eSBarry Smith */
MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt * bsizes,PetscScalar * diag)1737ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1738d71ae5a4SJacob Faibussowitsch {
17390da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
17400da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
17410da83c2eSBarry Smith   const PetscReal shift = 0.0;
17420da83c2eSBarry Smith   PetscInt        ipvt[5];
17434e208921SJed Brown   PetscCount      flops = 0;
17440da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
17450da83c2eSBarry Smith 
17460da83c2eSBarry Smith   PetscFunctionBegin;
17470da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
17480da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
174908401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1750ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
17519566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
175248a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
17530da83c2eSBarry Smith   ncnt = 0;
17540da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
17550da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
17569566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
17570da83c2eSBarry Smith     switch (bsizes[i]) {
1758d71ae5a4SJacob Faibussowitsch     case 1:
1759d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1760d71ae5a4SJacob Faibussowitsch       break;
17610da83c2eSBarry Smith     case 2:
17629566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
17630da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17649566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
17650da83c2eSBarry Smith       break;
17660da83c2eSBarry Smith     case 3:
17679566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
17680da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17699566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
17700da83c2eSBarry Smith       break;
17710da83c2eSBarry Smith     case 4:
17729566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
17730da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17749566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
17750da83c2eSBarry Smith       break;
17760da83c2eSBarry Smith     case 5:
17779566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
17780da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17799566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
17800da83c2eSBarry Smith       break;
17810da83c2eSBarry Smith     case 6:
17829566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
17830da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17849566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
17850da83c2eSBarry Smith       break;
17860da83c2eSBarry Smith     case 7:
17879566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
17880da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17899566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
17900da83c2eSBarry Smith       break;
17910da83c2eSBarry Smith     default:
17929566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
17930da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17949566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
17950da83c2eSBarry Smith     }
17960da83c2eSBarry Smith     ncnt += bsizes[i];
17970da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1798baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
17990da83c2eSBarry Smith   }
18003ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
180148a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18029566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18040da83c2eSBarry Smith }
18050da83c2eSBarry Smith 
1806422a814eSBarry Smith /*
1807422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1808422a814eSBarry Smith */
MatInvertDiagonalForSOR_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift)180907425a8dSBarry Smith static PetscErrorCode MatInvertDiagonalForSOR_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1810d71ae5a4SJacob Faibussowitsch {
181171f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1812421480d9SBarry Smith   PetscInt         i, m = A->rmap->n;
18132e5835c6SStefano Zampini   const MatScalar *v;
181454f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
1815421480d9SBarry Smith   PetscBool        diagDense;
1816421480d9SBarry Smith   const PetscInt  *diag;
181771f1c65dSBarry Smith 
181871f1c65dSBarry Smith   PetscFunctionBegin;
181907425a8dSBarry Smith   if (a->idiagState == ((PetscObject)A)->state && a->omega == omega && a->fshift == fshift) PetscFunctionReturn(PETSC_SUCCESS);
1820421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense));
1821421480d9SBarry Smith   PetscCheck(diagDense, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix must have all diagonal locations to invert them");
18223a7d0413SPierre Jolivet   if (!a->idiag) PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work));
18232e5835c6SStefano Zampini 
182471f1c65dSBarry Smith   mdiag = a->mdiag;
182571f1c65dSBarry Smith   idiag = a->idiag;
18269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1827422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
182871f1c65dSBarry Smith     for (i = 0; i < m; i++) {
182971f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1830899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1831966bd95aSPierre Jolivet         PetscCheck(PetscRealPart(fshift), PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
18329566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18337b6c816cSBarry Smith         A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18347b6c816cSBarry Smith         A->factorerror_zeropivot_value = 0.0;
18357b6c816cSBarry Smith         A->factorerror_zeropivot_row   = i;
1836899639b0SHong Zhang       }
183771f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
183871f1c65dSBarry Smith     }
18399566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
184071f1c65dSBarry Smith   } else {
184171f1c65dSBarry Smith     for (i = 0; i < m; i++) {
184271f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
184371f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
184471f1c65dSBarry Smith     }
18459566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
184671f1c65dSBarry Smith   }
18479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
184807425a8dSBarry Smith   a->idiagState = ((PetscObject)A)->state;
184907425a8dSBarry Smith   a->omega      = omega;
185007425a8dSBarry Smith   a->fshift     = fshift;
18513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
185271f1c65dSBarry Smith }
185371f1c65dSBarry Smith 
MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx)1854d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1855d71ae5a4SJacob Faibussowitsch {
1856416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1857e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
18582e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
185954f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
18603d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
186197f1f81fSBarry Smith   const PetscInt    *idx, *diag;
186217ab2063SBarry Smith 
18633a40ed3dSBarry Smith   PetscFunctionBegin;
1864b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
18659566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
18663ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1867b215bc84SStefano Zampini   }
1868b965ef7fSBarry Smith   its = its * lits;
186907425a8dSBarry Smith   PetscCall(MatInvertDiagonalForSOR_SeqAIJ(A, omega, fshift));
1870421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL));
187171f1c65dSBarry Smith   t     = a->ssor_work;
1872ed480e8bSBarry Smith   idiag = a->idiag;
187371f1c65dSBarry Smith   mdiag = a->mdiag;
1874ed480e8bSBarry Smith 
18759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
18769566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
18779566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1878ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
187917ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
188017ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1881ed480e8bSBarry Smith     bs = b;
188217ab2063SBarry Smith     for (i = 0; i < m; i++) {
188371f1c65dSBarry Smith       d   = fshift + mdiag[i];
1884416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1885ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
18862e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
188717ab2063SBarry Smith       sum = b[i] * d / omega;
1888003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
188917ab2063SBarry Smith       x[i] = sum;
189017ab2063SBarry Smith     }
18919566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
18929566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
18939566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
18949566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
18953ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
189617ab2063SBarry Smith   }
1897c783ea89SBarry Smith 
189808401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1899f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19004c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1901887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
190217ab2063SBarry Smith 
190317ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
190417ab2063SBarry Smith 
1905887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
190617ab2063SBarry Smith     */
190717ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
190817ab2063SBarry Smith 
190917ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
191017ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1911416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1912ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19132e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
191417ab2063SBarry Smith       sum = b[i];
1915e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1916ed480e8bSBarry Smith       x[i] = sum * idiag[i];
191717ab2063SBarry Smith     }
191817ab2063SBarry Smith 
191917ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19202e5835c6SStefano Zampini     v = aa;
19212205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
192217ab2063SBarry Smith 
192317ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1924ed480e8bSBarry Smith     ts   = t;
1925416022c9SBarry Smith     diag = a->diag;
192617ab2063SBarry Smith     for (i = 0; i < m; i++) {
1927416022c9SBarry Smith       n   = diag[i] - a->i[i];
1928ed480e8bSBarry Smith       idx = a->j + a->i[i];
19292e5835c6SStefano Zampini       v   = aa + a->i[i];
193017ab2063SBarry Smith       sum = t[i];
1931003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
1932ed480e8bSBarry Smith       t[i] = sum * idiag[i];
1933733d66baSBarry Smith       /*  x = x + t */
1934733d66baSBarry Smith       x[i] += t[i];
193517ab2063SBarry Smith     }
193617ab2063SBarry Smith 
19379566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
19389566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19399566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19403ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
194117ab2063SBarry Smith   }
194217ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
194317ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
194417ab2063SBarry Smith       for (i = 0; i < m; i++) {
1945416022c9SBarry Smith         n   = diag[i] - a->i[i];
1946ed480e8bSBarry Smith         idx = a->j + a->i[i];
19472e5835c6SStefano Zampini         v   = aa + a->i[i];
194817ab2063SBarry Smith         sum = b[i];
1949e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
19505c99c7daSBarry Smith         t[i] = sum;
1951ed480e8bSBarry Smith         x[i] = sum * idiag[i];
195217ab2063SBarry Smith       }
19535c99c7daSBarry Smith       xb = t;
19549566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
19553a40ed3dSBarry Smith     } else xb = b;
195617ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
195717ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
1958416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
1959ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
19602e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
196117ab2063SBarry Smith         sum = xb[i];
1962e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
19635c99c7daSBarry Smith         if (xb == b) {
1964ed480e8bSBarry Smith           x[i] = sum * idiag[i];
19655c99c7daSBarry Smith         } else {
1966b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
196717ab2063SBarry Smith         }
19685c99c7daSBarry Smith       }
19699566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
197017ab2063SBarry Smith     }
197117ab2063SBarry Smith     its--;
197217ab2063SBarry Smith   }
197317ab2063SBarry Smith   while (its--) {
197417ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
197517ab2063SBarry Smith       for (i = 0; i < m; i++) {
1976b19a5dc2SMark Adams         /* lower */
1977b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
1978ed480e8bSBarry Smith         idx = a->j + a->i[i];
19792e5835c6SStefano Zampini         v   = aa + a->i[i];
198017ab2063SBarry Smith         sum = b[i];
1981e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
1982b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
1983b19a5dc2SMark Adams         /* upper */
1984b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
1985b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
19862e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
1987b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
1988b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
198917ab2063SBarry Smith       }
1990b19a5dc2SMark Adams       xb = t;
19919566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
1992b19a5dc2SMark Adams     } else xb = b;
199317ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
199417ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
1995b19a5dc2SMark Adams         sum = xb[i];
1996b19a5dc2SMark Adams         if (xb == b) {
1997b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
1998416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
1999ed480e8bSBarry Smith           idx = a->j + a->i[i];
20002e5835c6SStefano Zampini           v   = aa + a->i[i];
2001e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2002ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2003b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2004b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2005b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20062e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2007b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2008b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
200917ab2063SBarry Smith         }
2010b19a5dc2SMark Adams       }
2011b19a5dc2SMark Adams       if (xb == b) {
20129566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2013b19a5dc2SMark Adams       } else {
20149566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2015b19a5dc2SMark Adams       }
201617ab2063SBarry Smith     }
201717ab2063SBarry Smith   }
20189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20199566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20209566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
202217ab2063SBarry Smith }
202317ab2063SBarry Smith 
MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo * info)2024ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2025d71ae5a4SJacob Faibussowitsch {
2026416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20274e220ebcSLois Curfman McInnes 
20283a40ed3dSBarry Smith   PetscFunctionBegin;
20294e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20303966268fSBarry Smith   info->nz_allocated = a->maxnz;
20313966268fSBarry Smith   info->nz_used      = a->nz;
20323966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
20333966268fSBarry Smith   info->assemblies   = A->num_ass;
20343966268fSBarry Smith   info->mallocs      = A->info.mallocs;
20354dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2036d5f3da31SBarry Smith   if (A->factortype) {
20374e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
20384e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
20394e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
20404e220ebcSLois Curfman McInnes   } else {
20414e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
20424e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
20434e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
20444e220ebcSLois Curfman McInnes   }
20453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
204617ab2063SBarry Smith }
204717ab2063SBarry Smith 
MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diagv,Vec x,Vec b)2048421480d9SBarry Smith static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diagv, Vec x, Vec b)
2049d71ae5a4SJacob Faibussowitsch {
2050416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2051c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
205297b48c8fSBarry Smith   const PetscScalar *xx;
20532e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2054c7da8527SEric Chamberland   PetscInt           d = 0;
2055421480d9SBarry Smith   const PetscInt    *diag;
205617ab2063SBarry Smith 
20573a40ed3dSBarry Smith   PetscFunctionBegin;
205897b48c8fSBarry Smith   if (x && b) {
20599566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
20609566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
206197b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2062aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2063447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
2064421480d9SBarry Smith       bb[rows[i]] = diagv * xx[rows[i]];
206597b48c8fSBarry Smith     }
20669566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
20679566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
206897b48c8fSBarry Smith   }
206997b48c8fSBarry Smith 
2070421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, NULL));
20719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2072a9817697SBarry Smith   if (a->keepnonzeropattern) {
2073f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2074aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
20759566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2076f1e2ffcdSBarry Smith     }
2077421480d9SBarry Smith     if (diagv != 0.0) {
2078c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2079c7da8527SEric Chamberland         d = rows[i];
2080421480d9SBarry Smith         if (d >= A->cmap->n) continue;
2081421480d9SBarry Smith         PetscCheck(diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
20829234b629SBarry Smith         aa[diag[d]] = diagv;
2083f1e2ffcdSBarry Smith       }
2084f1e2ffcdSBarry Smith     }
2085f1e2ffcdSBarry Smith   } else {
2086421480d9SBarry Smith     if (diagv != 0.0) {
208717ab2063SBarry Smith       for (i = 0; i < N; i++) {
2088aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
20897ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2090447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2091447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2092447d62f5SStefano Zampini           } else {
2093416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
2094421480d9SBarry Smith             aa[a->i[rows[i]]]   = diagv;
2095bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2096447d62f5SStefano Zampini           }
2097447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
2098421480d9SBarry Smith           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diagv, INSERT_VALUES));
209917ab2063SBarry Smith         }
210017ab2063SBarry Smith       }
21013a40ed3dSBarry Smith     } else {
210217ab2063SBarry Smith       for (i = 0; i < N; i++) {
2103aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2104416022c9SBarry Smith         a->ilen[rows[i]] = 0;
210517ab2063SBarry Smith       }
210617ab2063SBarry Smith     }
2107e56f5c9eSBarry Smith     A->nonzerostate++;
2108f1e2ffcdSBarry Smith   }
21099566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2110dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211217ab2063SBarry Smith }
211317ab2063SBarry Smith 
MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diagv,Vec x,Vec b)2114421480d9SBarry Smith static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diagv, Vec x, Vec b)
2115d71ae5a4SJacob Faibussowitsch {
21166e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21176e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
2118421480d9SBarry Smith   PetscBool         *zeroed, vecs = PETSC_FALSE;
21196e169961SBarry Smith   const PetscScalar *xx;
21202e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2121421480d9SBarry Smith   const PetscInt    *diag;
2122421480d9SBarry Smith   PetscBool          diagDense;
21236e169961SBarry Smith 
21246e169961SBarry Smith   PetscFunctionBegin;
21253ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
2126421480d9SBarry Smith   PetscCall(MatGetDiagonalMarkers_SeqAIJ(A, &diag, &diagDense));
21279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21286e169961SBarry Smith   if (x && b) {
21299566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21309566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21312b40b63fSBarry Smith     vecs = PETSC_TRUE;
21326e169961SBarry Smith   }
21339566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
21346e169961SBarry Smith   for (i = 0; i < N; i++) {
2135aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21368e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
21372205254eSKarl Rupp 
21386e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
21396e169961SBarry Smith   }
21406e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
21416e169961SBarry Smith     if (!zeroed[i]) {
21426e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
21434cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
21442e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
21452e5835c6SStefano Zampini           aa[j] = 0.0;
21466e169961SBarry Smith         }
21476e169961SBarry Smith       }
2148421480d9SBarry Smith     } else if (vecs && i < A->cmap->N) bb[i] = diagv * xx[i];
21496e169961SBarry Smith   }
21506e169961SBarry Smith   if (x && b) {
21519566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21529566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
21536e169961SBarry Smith   }
21549566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
2155421480d9SBarry Smith   if (diagv != 0.0) {
2156421480d9SBarry Smith     if (!diagDense) {
21571d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
21584cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2159aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
2160421480d9SBarry Smith         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diagv, INSERT_VALUES));
21611d5a398dSstefano_zampini       }
21621d5a398dSstefano_zampini     } else {
2163421480d9SBarry Smith       for (i = 0; i < N; i++) aa[diag[rows[i]]] = diagv;
21646e169961SBarry Smith     }
21651d5a398dSstefano_zampini   }
21669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
21679234b629SBarry Smith   if (!diagDense) PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
21696e169961SBarry Smith }
21706e169961SBarry Smith 
MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt * nz,PetscInt ** idx,PetscScalar ** v)2171d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2172d71ae5a4SJacob Faibussowitsch {
2173fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2174fff043a9SJunchao Zhang   const PetscScalar *aa;
217517ab2063SBarry Smith 
21763a40ed3dSBarry Smith   PetscFunctionBegin;
21779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2178416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
21798e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
218017ab2063SBarry Smith   if (idx) {
21815c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2182f4259b30SLisandro Dalcin     else *idx = NULL;
218317ab2063SBarry Smith   }
21849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
21853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218617ab2063SBarry Smith }
218717ab2063SBarry Smith 
MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt * nz,PetscInt ** idx,PetscScalar ** v)2188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2189d71ae5a4SJacob Faibussowitsch {
21903a40ed3dSBarry Smith   PetscFunctionBegin;
21913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
219217ab2063SBarry Smith }
219317ab2063SBarry Smith 
MatNorm_SeqAIJ(Mat A,NormType type,PetscReal * nrm)2194ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2195d71ae5a4SJacob Faibussowitsch {
2196416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
21972e5835c6SStefano Zampini   const MatScalar *v;
219836db0b34SBarry Smith   PetscReal        sum = 0.0;
219997f1f81fSBarry Smith   PetscInt         i, j;
220017ab2063SBarry Smith 
22013a40ed3dSBarry Smith   PetscFunctionBegin;
22029566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
220317ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2204570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2205570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2206792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2207570b7f6dSBarry Smith #else
2208416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22099371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22109371c9d4SSatish Balay       v++;
221117ab2063SBarry Smith     }
22128f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2213570b7f6dSBarry Smith #endif
22149566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22153a40ed3dSBarry Smith   } else if (type == NORM_1) {
221636db0b34SBarry Smith     PetscReal *tmp;
221797f1f81fSBarry Smith     PetscInt  *jj = a->j;
2218f1957bc3SPierre Jolivet     PetscCall(PetscCalloc1(A->cmap->n, &tmp));
2219064f8208SBarry Smith     *nrm = 0.0;
2220416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22219371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22229371c9d4SSatish Balay       v++;
222317ab2063SBarry Smith     }
2224d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2225064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
222617ab2063SBarry Smith     }
22279566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
2228f1957bc3SPierre Jolivet     PetscCall(PetscLogFlops(a->nz));
22293a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2230064f8208SBarry Smith     *nrm = 0.0;
2231d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
22328e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
223317ab2063SBarry Smith       sum                   = 0.0;
2234416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
22359371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
22369371c9d4SSatish Balay         v2++;
223717ab2063SBarry Smith       }
2238064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
223917ab2063SBarry Smith     }
2240f1957bc3SPierre Jolivet     PetscCall(PetscLogFlops(a->nz));
2241f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
22429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
22433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
224417ab2063SBarry Smith }
224517ab2063SBarry Smith 
MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool * f)2246ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2247d71ae5a4SJacob Faibussowitsch {
22483d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
224954f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
22502e5835c6SStefano Zampini   const MatScalar *va, *vb;
225197f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2252cd0d46ebSvictorle 
2253cd0d46ebSvictorle   PetscFunctionBegin;
22549566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
22559566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
22565485867bSBarry Smith   if (ma != nb || na != mb) {
22575485867bSBarry Smith     *f = PETSC_FALSE;
22583ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
22595485867bSBarry Smith   }
22609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
22619566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
22629371c9d4SSatish Balay   aii = aij->i;
22639371c9d4SSatish Balay   bii = bij->i;
22649371c9d4SSatish Balay   adx = aij->j;
22659371c9d4SSatish Balay   bdx = bij->j;
22669566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
22679566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2268cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2269cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2270cd0d46ebSvictorle 
2271cd0d46ebSvictorle   *f = PETSC_TRUE;
2272cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2273cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
227497f1f81fSBarry Smith       PetscInt    idc, idr;
22755485867bSBarry Smith       PetscScalar vc, vr;
2276cd0d46ebSvictorle       /* column/row index/value */
22775485867bSBarry Smith       idc = adx[aptr[i]];
22785485867bSBarry Smith       idr = bdx[bptr[idc]];
22795485867bSBarry Smith       vc  = va[aptr[i]];
22805485867bSBarry Smith       vr  = vb[bptr[idc]];
22815485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
22825485867bSBarry Smith         *f = PETSC_FALSE;
22835485867bSBarry Smith         goto done;
2284cd0d46ebSvictorle       } else {
22855485867bSBarry Smith         aptr[i]++;
22865485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2287cd0d46ebSvictorle       }
2288cd0d46ebSvictorle     }
2289cd0d46ebSvictorle   }
2290cd0d46ebSvictorle done:
22919566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
22929566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
22939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
22949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
22953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2296cd0d46ebSvictorle }
2297cd0d46ebSvictorle 
MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool * f)2298ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2299d71ae5a4SJacob Faibussowitsch {
23003d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
230154f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
230254f21887SBarry Smith   MatScalar  *va, *vb;
23031cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23041cbb95d3SBarry Smith 
23051cbb95d3SBarry Smith   PetscFunctionBegin;
23069566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23079566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23081cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23091cbb95d3SBarry Smith     *f = PETSC_FALSE;
23103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23111cbb95d3SBarry Smith   }
23129371c9d4SSatish Balay   aii = aij->i;
23139371c9d4SSatish Balay   bii = bij->i;
23149371c9d4SSatish Balay   adx = aij->j;
23159371c9d4SSatish Balay   bdx = bij->j;
23169371c9d4SSatish Balay   va  = aij->a;
23179371c9d4SSatish Balay   vb  = bij->a;
23189566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23199566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23201cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23211cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23221cbb95d3SBarry Smith 
23231cbb95d3SBarry Smith   *f = PETSC_TRUE;
23241cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23251cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23261cbb95d3SBarry Smith       PetscInt    idc, idr;
23271cbb95d3SBarry Smith       PetscScalar vc, vr;
23281cbb95d3SBarry Smith       /* column/row index/value */
23291cbb95d3SBarry Smith       idc = adx[aptr[i]];
23301cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23311cbb95d3SBarry Smith       vc  = va[aptr[i]];
23321cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23331cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
23341cbb95d3SBarry Smith         *f = PETSC_FALSE;
23351cbb95d3SBarry Smith         goto done;
23361cbb95d3SBarry Smith       } else {
23371cbb95d3SBarry Smith         aptr[i]++;
23381cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
23391cbb95d3SBarry Smith       }
23401cbb95d3SBarry Smith     }
23411cbb95d3SBarry Smith   }
23421cbb95d3SBarry Smith done:
23439566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23449566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23461cbb95d3SBarry Smith }
23471cbb95d3SBarry Smith 
MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr)2348d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2349d71ae5a4SJacob Faibussowitsch {
2350416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2351fff8e43fSBarry Smith   const PetscScalar *l, *r;
2352fff8e43fSBarry Smith   PetscScalar        x;
235354f21887SBarry Smith   MatScalar         *v;
2354fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2355fff8e43fSBarry Smith   const PetscInt    *jj;
235617ab2063SBarry Smith 
23573a40ed3dSBarry Smith   PetscFunctionBegin;
235817ab2063SBarry Smith   if (ll) {
23593ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
23603ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
23619566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
236208401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
23639566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
23649566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
236517ab2063SBarry Smith     for (i = 0; i < m; i++) {
236617ab2063SBarry Smith       x = l[i];
2367416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
23682205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
236917ab2063SBarry Smith     }
23709566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
23719566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
23729566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
237317ab2063SBarry Smith   }
237417ab2063SBarry Smith   if (rr) {
23759566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
237608401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
23779566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
23789566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
23792e5835c6SStefano Zampini     jj = a->j;
23802205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
23819566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
23829566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
23839566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
238417ab2063SBarry Smith   }
23853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
238617ab2063SBarry Smith }
238717ab2063SBarry Smith 
MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat * B)2388d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2389d71ae5a4SJacob Faibussowitsch {
2390db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2391d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
239297f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
23935d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
23942e5835c6SStefano Zampini   const PetscScalar *aa;
23955d0c19d7SBarry Smith   PetscInt           nrows, ncols;
239697f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2397fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2398416022c9SBarry Smith   Mat                C;
2399cdc6f3adSToby Isaac   PetscBool          stride;
240017ab2063SBarry Smith 
24013a40ed3dSBarry Smith   PetscFunctionBegin;
24029566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24039566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24049566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
240517ab2063SBarry Smith 
24069566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2407ff718158SBarry Smith   if (stride) {
24089566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2409ff718158SBarry Smith   } else {
2410ff718158SBarry Smith     first = 0;
2411ff718158SBarry Smith     step  = 0;
2412ff718158SBarry Smith   }
2413fee21e36SBarry Smith   if (stride && step == 1) {
241402834360SBarry Smith     /* special case of contiguous rows */
24159566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
241602834360SBarry Smith     /* loop over new rows determining lens and starting points */
241702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2418bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2419a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2420a91a9bebSLisandro Dalcin       starts[i] = kstart;
242102834360SBarry Smith       for (k = kstart; k < kend; k++) {
2422bfeeae90SHong Zhang         if (aj[k] >= first) {
242302834360SBarry Smith           starts[i] = k;
242402834360SBarry Smith           break;
242502834360SBarry Smith         }
242602834360SBarry Smith       }
2427a2744918SBarry Smith       sum = 0;
242802834360SBarry Smith       while (k < kend) {
2429bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2430a2744918SBarry Smith         sum++;
243102834360SBarry Smith       }
2432a2744918SBarry Smith       lens[i] = sum;
243302834360SBarry Smith     }
243402834360SBarry Smith     /* create submatrix */
2435cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
243697f1f81fSBarry Smith       PetscInt n_cols, n_rows;
24379566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2438aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
24399566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
244008480c60SBarry Smith       C = *B;
24413a40ed3dSBarry Smith     } else {
24423bef6203SJed Brown       PetscInt rbs, cbs;
24439566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
24449566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
24459566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
24469566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
24479566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
24489566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
24499566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
245008480c60SBarry Smith     }
2451db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2452db02288aSLois Curfman McInnes 
245302834360SBarry Smith     /* loop over rows inserting into submatrix */
2454fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2455db02288aSLois Curfman McInnes     j_new = c->j;
2456db02288aSLois Curfman McInnes     i_new = c->i;
24579566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
245802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2459a2744918SBarry Smith       ii    = starts[i];
2460a2744918SBarry Smith       lensi = lens[i];
2461810441c8SPierre Jolivet       if (lensi) {
2462ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
24639566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2464a2744918SBarry Smith         a_new += lensi;
2465810441c8SPierre Jolivet       }
2466a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2467a2744918SBarry Smith       c->ilen[i]   = lensi;
246802834360SBarry Smith     }
2469fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
24709566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
24719566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
24723a40ed3dSBarry Smith   } else {
24739566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
24749566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
24759566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
24764dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
24776bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
24784dcab191SBarry Smith       smap[icol[i]] = i + 1;
24794dcab191SBarry Smith     }
24804dcab191SBarry Smith 
248102834360SBarry Smith     /* determine lens of each row */
248202834360SBarry Smith     for (i = 0; i < nrows; i++) {
2483bfeeae90SHong Zhang       kstart  = ai[irow[i]];
248402834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
248502834360SBarry Smith       lens[i] = 0;
248602834360SBarry Smith       for (k = kstart; k < kend; k++) {
2487ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
248802834360SBarry Smith       }
248902834360SBarry Smith     }
249017ab2063SBarry Smith     /* Create and fill new matrix */
2491a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2492ace3abfcSBarry Smith       PetscBool equal;
24930f5bd95cSBarry Smith 
249499141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2495aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
24969566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2497fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
24989566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
249908480c60SBarry Smith       C = *B;
25003a40ed3dSBarry Smith     } else {
25013bef6203SJed Brown       PetscInt rbs, cbs;
25029566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25039566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25049566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25059566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
250637a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25079566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25089566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
250908480c60SBarry Smith     }
25109566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2511fb3c7e2dSJunchao Zhang 
2512f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2513fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
251417ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
251599141d43SSatish Balay       row      = irow[i];
2516bfeeae90SHong Zhang       kstart   = ai[row];
251799141d43SSatish Balay       kend     = kstart + a->ilen[row];
2518bfeeae90SHong Zhang       mat_i    = c->i[i];
25198e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25208e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
252199141d43SSatish Balay       mat_ilen = c->ilen + i;
252217ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2523bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2524ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25252e5835c6SStefano Zampini           *mat_a++ = aa[k];
252699141d43SSatish Balay           (*mat_ilen)++;
252717ab2063SBarry Smith         }
252817ab2063SBarry Smith       }
252917ab2063SBarry Smith     }
25309566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
253102834360SBarry Smith     /* Free work space */
25329566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
25339566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
25349566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2535cdc6f3adSToby Isaac     /* sort */
2536cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2537cdc6f3adSToby Isaac       PetscInt ilen;
2538cdc6f3adSToby Isaac 
2539cdc6f3adSToby Isaac       mat_i = c->i[i];
25408e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
25418e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2542cdc6f3adSToby Isaac       ilen  = c->ilen[i];
25439566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2544cdc6f3adSToby Isaac     }
2545fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
254602834360SBarry Smith   }
25478c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
25489566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2549305c6ccfSStefano Zampini #endif
25509566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
25519566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
255217ab2063SBarry Smith 
25539566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2554416022c9SBarry Smith   *B = C;
25553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
255617ab2063SBarry Smith }
255717ab2063SBarry Smith 
MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat * subMat)2558ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2559d71ae5a4SJacob Faibussowitsch {
256082d44351SHong Zhang   Mat B;
256182d44351SHong Zhang 
256282d44351SHong Zhang   PetscFunctionBegin;
2563c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
25649566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
25659566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
25669566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
25679566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
25689566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
256982d44351SHong Zhang     *subMat = B;
2570c2d650bdSHong Zhang   } else {
25719566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2572c2d650bdSHong Zhang   }
25733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
257482d44351SHong Zhang }
257582d44351SHong Zhang 
MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo * info)2576ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2577d71ae5a4SJacob Faibussowitsch {
257863b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
257963b91edcSBarry Smith   Mat         outA;
2580ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
258163b91edcSBarry Smith 
25823a40ed3dSBarry Smith   PetscFunctionBegin;
258308401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
25841df811f5SHong Zhang 
25859566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
25869566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2587a871dcd8SBarry Smith 
258863b91edcSBarry Smith   outA = inA;
25899566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
25909566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
25912205254eSKarl Rupp 
25929566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
25939566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
25942205254eSKarl Rupp 
2595c3122656SLisandro Dalcin   a->row = row;
25962205254eSKarl Rupp 
25979566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
25989566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
25992205254eSKarl Rupp 
2600c3122656SLisandro Dalcin   a->col = col;
260163b91edcSBarry Smith 
260236db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26039566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26049566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2605f0ec6fceSSatish Balay 
260694a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
260784648c2dSPierre Jolivet     PetscCall(PetscMalloc1(inA->rmap->n, &a->solve_work));
260894a9d846SBarry Smith   }
260963b91edcSBarry Smith 
2610137fb511SHong Zhang   if (row_identity && col_identity) {
26119566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2612137fb511SHong Zhang   } else {
26139566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2614137fb511SHong Zhang   }
2615421480d9SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2617a871dcd8SBarry Smith }
2618a871dcd8SBarry Smith 
MatScale_SeqAIJ(Mat inA,PetscScalar alpha)2619d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2620d71ae5a4SJacob Faibussowitsch {
2621f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2622dfa0f9e5SStefano Zampini   PetscScalar *v;
2623c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26243a40ed3dSBarry Smith 
26253a40ed3dSBarry Smith   PetscFunctionBegin;
26269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
26279566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2628792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
26299566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
26309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
26313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2632f0b747eeSBarry Smith }
2633f0b747eeSBarry Smith 
MatDestroySubMatrix_Private(Mat_SubSppt * submatj)2634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2635d71ae5a4SJacob Faibussowitsch {
263616b64355SHong Zhang   PetscInt i;
263716b64355SHong Zhang 
263816b64355SHong Zhang   PetscFunctionBegin;
263916b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
26409566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
264116b64355SHong Zhang 
264248a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
26439566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
264416b64355SHong Zhang 
264516b64355SHong Zhang     if (submatj->rbuf1) {
26469566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
26479566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
264816b64355SHong Zhang     }
264916b64355SHong Zhang 
265048a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
26519566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
26529566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
265316b64355SHong Zhang   }
265416b64355SHong Zhang 
265516b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2656eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
26579566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
26589566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
265916b64355SHong Zhang #else
26609566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
266116b64355SHong Zhang #endif
266216b64355SHong Zhang 
266316b64355SHong Zhang   if (!submatj->allcolumns) {
266416b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2665835f2295SStefano Zampini     PetscCall(PetscHMapIDestroy(&submatj->cmap));
266616b64355SHong Zhang #else
26679566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
266816b64355SHong Zhang #endif
266916b64355SHong Zhang   }
26709566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
267116b64355SHong Zhang 
26729566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
26733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
267416b64355SHong Zhang }
267516b64355SHong Zhang 
MatDestroySubMatrix_SeqAIJ(Mat C)2676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2677d71ae5a4SJacob Faibussowitsch {
267816b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
26795c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
268016b64355SHong Zhang 
268116b64355SHong Zhang   PetscFunctionBegin;
26829566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
26839566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
26843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
268516b64355SHong Zhang }
268616b64355SHong Zhang 
268789a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat * mat[])2688ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2689d71ae5a4SJacob Faibussowitsch {
26902d033e1fSHong Zhang   PetscInt     i;
26910fb991dcSHong Zhang   Mat          C;
26920fb991dcSHong Zhang   Mat_SeqAIJ  *c;
26930fb991dcSHong Zhang   Mat_SubSppt *submatj;
26942d033e1fSHong Zhang 
26952d033e1fSHong Zhang   PetscFunctionBegin;
26962d033e1fSHong Zhang   for (i = 0; i < n; i++) {
26970fb991dcSHong Zhang     C       = (*mat)[i];
26980fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
26990fb991dcSHong Zhang     submatj = c->submatis1;
27002d033e1fSHong Zhang     if (submatj) {
2701682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
270226cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27039566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27049566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27059566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27063faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27079566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27089566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27099566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2710682e4c99SStefano Zampini       }
27112d033e1fSHong Zhang     } else {
27129566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27132d033e1fSHong Zhang     }
27142d033e1fSHong Zhang   }
271586e85357SHong Zhang 
271663a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27179566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
271863a75b2aSHong Zhang 
27199566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27212d033e1fSHong Zhang }
27222d033e1fSHong Zhang 
MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat * B[])2723ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2724d71ae5a4SJacob Faibussowitsch {
272597f1f81fSBarry Smith   PetscInt i;
2726cddf8d76SBarry Smith 
27273a40ed3dSBarry Smith   PetscFunctionBegin;
272848a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2729cddf8d76SBarry Smith 
273048a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
27313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2732cddf8d76SBarry Smith }
2733cddf8d76SBarry Smith 
MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov)2734ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2735d71ae5a4SJacob Faibussowitsch {
2736e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
27379a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
27385d0c19d7SBarry Smith   const PetscInt *idx;
273958b7e2c1SStefano Zampini   PetscInt        start, end, *ai, *aj, bs = A->rmap->bs == A->cmap->bs ? A->rmap->bs : 1;
2740f1af5d2fSBarry Smith   PetscBT         table;
2741bbd702dbSSatish Balay 
27423a40ed3dSBarry Smith   PetscFunctionBegin;
27439a88ca10SBarry Smith   m  = A->rmap->n / bs;
2744e4d965acSSatish Balay   ai = a->i;
2745bfeeae90SHong Zhang   aj = a->j;
27468a047759SSatish Balay 
274708401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
274806763907SSatish Balay 
27499566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
27509566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
275106763907SSatish Balay 
2752e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2753b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2754e4d965acSSatish Balay     isz = 0;
27559566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2756e4d965acSSatish Balay 
2757e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
27589566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
27599566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2760e4d965acSSatish Balay 
27619a88ca10SBarry Smith     if (bs > 1) {
27629a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
27639a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
27649a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
27659a88ca10SBarry Smith       }
27669a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
27679a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
27689a88ca10SBarry Smith 
27699a88ca10SBarry Smith       k = 0;
27709a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
27719a88ca10SBarry Smith         n = isz;
27729a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
27739a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
27749a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
27759a88ca10SBarry Smith             start = ai[row];
27769a88ca10SBarry Smith             end   = ai[row + 1];
27779a88ca10SBarry Smith             for (l = start; l < end; l++) {
27789a88ca10SBarry Smith               val = aj[l] / bs;
27799a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
27809a88ca10SBarry Smith             }
27819a88ca10SBarry Smith           }
27829a88ca10SBarry Smith         }
27839a88ca10SBarry Smith       }
278457508eceSPierre Jolivet       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i));
27859a88ca10SBarry Smith     } else {
2786dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2787e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
27882205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
27894dcbc457SBarry Smith       }
27909566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
27919566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2792e4d965acSSatish Balay 
279304a348a9SBarry Smith       k = 0;
279404a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
279504a348a9SBarry Smith         n = isz;
279606763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2797e4d965acSSatish Balay           row   = nidx[k];
2798e4d965acSSatish Balay           start = ai[row];
2799e4d965acSSatish Balay           end   = ai[row + 1];
280004a348a9SBarry Smith           for (l = start; l < end; l++) {
2801efb16452SHong Zhang             val = aj[l];
28022205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2803e4d965acSSatish Balay           }
2804e4d965acSSatish Balay         }
2805e4d965acSSatish Balay       }
280657508eceSPierre Jolivet       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i));
2807e4d965acSSatish Balay     }
28089a88ca10SBarry Smith   }
28099566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28109566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28124dcbc457SBarry Smith }
281317ab2063SBarry Smith 
MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat * B)2814ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2815d71ae5a4SJacob Faibussowitsch {
28160513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28173b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28185d0c19d7SBarry Smith   const PetscInt *row, *col;
28195d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
282056cd22aeSBarry Smith   IS              icolp, irowp;
28210298fd71SBarry Smith   PetscInt       *cwork = NULL;
28220298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28230513a670SBarry Smith 
28243a40ed3dSBarry Smith   PetscFunctionBegin;
28259566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
28269566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
28279566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
28289566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
28290513a670SBarry Smith 
28300513a670SBarry Smith   /* determine lengths of permuted rows */
28319566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
28322205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
28339566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
28349566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
28359566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
28369566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
28379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
28389566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
28390513a670SBarry Smith 
28409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
28410513a670SBarry Smith   for (i = 0; i < m; i++) {
28429566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28432205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
28449566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
28459566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28460513a670SBarry Smith   }
28479566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
28482205254eSKarl Rupp 
28493c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
28502205254eSKarl Rupp 
28518c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
28529566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
28539fe5e383SStefano Zampini #endif
28549566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
28559566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
28569566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
28579566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
28589566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
28599566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
286048a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
28613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28620513a670SBarry Smith }
28630513a670SBarry Smith 
MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str)2864d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2865d71ae5a4SJacob Faibussowitsch {
2866cb5b572fSBarry Smith   PetscFunctionBegin;
286733f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
286833f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2869be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2870be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
28712e5835c6SStefano Zampini     const PetscScalar *aa;
28723ac85a22SJunchao Zhang     PetscScalar       *bb;
2873be6bf707SBarry Smith 
28749566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
28753ac85a22SJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(B, &bb));
28763ac85a22SJunchao Zhang 
287708401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
28783ac85a22SJunchao Zhang     PetscCall(PetscArraycpy(bb, aa, a->i[A->rmap->n]));
28799566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
28809566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
28813ac85a22SJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(B, &bb));
2882cb5b572fSBarry Smith   } else {
28839566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2884cb5b572fSBarry Smith   }
28853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2886cb5b572fSBarry Smith }
2887cb5b572fSBarry Smith 
MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar * array[])2888d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2889d71ae5a4SJacob Faibussowitsch {
28906c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
28916e111a19SKarl Rupp 
28926c0721eeSBarry Smith   PetscFunctionBegin;
28936c0721eeSBarry Smith   *array = a->a;
28943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28956c0721eeSBarry Smith }
28966c0721eeSBarry Smith 
MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar * array[])2897d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2898d71ae5a4SJacob Faibussowitsch {
28996c0721eeSBarry Smith   PetscFunctionBegin;
2900f38c1e66SStefano Zampini   *array = NULL;
29013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29026c0721eeSBarry Smith }
2903273d9f13SBarry Smith 
29048229c054SShri Abhyankar /*
29058229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29068229c054SShri Abhyankar    have different nonzero structure.
29078229c054SShri Abhyankar */
MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt * xi,const PetscInt * xj,const PetscInt * yi,const PetscInt * yj,PetscInt * nnz)2908d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2909d71ae5a4SJacob Faibussowitsch {
2910b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2911ec7775f6SShri Abhyankar 
2912ec7775f6SShri Abhyankar   PetscFunctionBegin;
2913ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2914ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29158e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2916b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2917b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29188af7cee1SJed Brown     nnz[i] = 0;
29198af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2920b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2921b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29228af7cee1SJed Brown       nnz[i]++;
29238af7cee1SJed Brown     }
29248af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2925ec7775f6SShri Abhyankar   }
29263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2927ec7775f6SShri Abhyankar }
2928ec7775f6SShri Abhyankar 
MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt * nnz)2929d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
2930d71ae5a4SJacob Faibussowitsch {
2931b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
2932b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
2933b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
2934b264fe52SHong Zhang 
2935b264fe52SHong Zhang   PetscFunctionBegin;
2936b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
29379566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
29383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2939b264fe52SHong Zhang }
2940b264fe52SHong Zhang 
MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str)2941d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
2942d71ae5a4SJacob Faibussowitsch {
2943ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
2944ac90fabeSBarry Smith 
2945ac90fabeSBarry Smith   PetscFunctionBegin;
2946134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
2947134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
2948134adf20SPierre Jolivet     if (e) {
29499566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
295081fa06acSBarry Smith       if (e) {
29519566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
2952134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
295381fa06acSBarry Smith       }
295481fa06acSBarry Smith     }
295554c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
295681fa06acSBarry Smith   }
2957ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
29582e5835c6SStefano Zampini     const PetscScalar *xa;
29592e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
296081fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
296181fa06acSBarry Smith 
29629566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
29639566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
29649566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
2965792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
29669566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
29679566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
29689566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
29699566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
2970ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
29719566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
2972ac90fabeSBarry Smith   } else {
29738229c054SShri Abhyankar     Mat       B;
29748229c054SShri Abhyankar     PetscInt *nnz;
29759566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
29769566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
29779566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
29789566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
29799566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
29809566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
29819566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
29829566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
29839566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
29849bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
29859566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
2986ac90fabeSBarry Smith   }
29873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2988ac90fabeSBarry Smith }
2989ac90fabeSBarry Smith 
MatConjugate_SeqAIJ(Mat mat)2990d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
2991d71ae5a4SJacob Faibussowitsch {
2992354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
299365d0d443SPierre Jolivet   PetscInt     i, nz = aij->nz;
2994354c94deSBarry Smith   PetscScalar *a;
2995354c94deSBarry Smith 
2996354c94deSBarry Smith   PetscFunctionBegin;
29979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
29982205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
29999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
30003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3001354c94deSBarry Smith }
3002354c94deSBarry Smith 
MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[])3003ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3004d71ae5a4SJacob Faibussowitsch {
3005e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3006d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3007e34fafa9SBarry Smith   PetscReal        atmp;
3008985db425SBarry Smith   PetscScalar     *x;
3009ce496241SStefano Zampini   const MatScalar *aa, *av;
3010e34fafa9SBarry Smith 
3011e34fafa9SBarry Smith   PetscFunctionBegin;
301228b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3014ce496241SStefano Zampini   aa = av;
3015e34fafa9SBarry Smith   ai = a->i;
3016e34fafa9SBarry Smith   aj = a->j;
3017e34fafa9SBarry Smith 
30189566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30199566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
302008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3021e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30229371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30239371c9d4SSatish Balay     ai++;
302462e5df07SMark Adams     x[i] = 0;
3025e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3026985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
30279371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
30289371c9d4SSatish Balay         x[i] = atmp;
30299371c9d4SSatish Balay         if (idx) idx[i] = *aj;
30309371c9d4SSatish Balay       }
30319371c9d4SSatish Balay       aa++;
30329371c9d4SSatish Balay       aj++;
3033985db425SBarry Smith     }
3034985db425SBarry Smith   }
30359566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
30369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
30373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3038985db425SBarry Smith }
3039985db425SBarry Smith 
MatGetRowSumAbs_SeqAIJ(Mat A,Vec v)3040eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3041eede4a3fSMark Adams {
3042eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3043eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3044eede4a3fSMark Adams   PetscScalar     *x;
3045eede4a3fSMark Adams   const MatScalar *aa, *av;
3046eede4a3fSMark Adams 
3047eede4a3fSMark Adams   PetscFunctionBegin;
3048eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3049eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3050eede4a3fSMark Adams   aa = av;
3051eede4a3fSMark Adams   ai = a->i;
3052eede4a3fSMark Adams 
3053eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3054eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3055eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3056eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3057eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3058eede4a3fSMark Adams     ai++;
305962e5df07SMark Adams     x[i] = 0;
3060eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3061eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3062eede4a3fSMark Adams       aa++;
3063eede4a3fSMark Adams     }
3064eede4a3fSMark Adams   }
3065eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3066eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3067eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3068eede4a3fSMark Adams }
3069eede4a3fSMark Adams 
MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[])3070ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3071d71ae5a4SJacob Faibussowitsch {
3072985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3073d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3074985db425SBarry Smith   PetscScalar     *x;
3075ce496241SStefano Zampini   const MatScalar *aa, *av;
3076985db425SBarry Smith 
3077985db425SBarry Smith   PetscFunctionBegin;
307828b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3080ce496241SStefano Zampini   aa = av;
3081985db425SBarry Smith   ai = a->i;
3082985db425SBarry Smith   aj = a->j;
3083985db425SBarry Smith 
30849566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30859566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
308608401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3087985db425SBarry Smith   for (i = 0; i < m; i++) {
30889371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30899371c9d4SSatish Balay     ai++;
3090d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
30919371c9d4SSatish Balay       x[i] = *aa;
30929371c9d4SSatish Balay       if (idx) idx[i] = 0;
3093985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3094985db425SBarry Smith       x[i] = 0.0;
3095985db425SBarry Smith       if (idx) {
3096985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3097985db425SBarry Smith           if (aj[j] > j) {
3098985db425SBarry Smith             idx[i] = j;
3099985db425SBarry Smith             break;
3100985db425SBarry Smith           }
3101985db425SBarry Smith         }
31021a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31031a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3104985db425SBarry Smith       }
3105985db425SBarry Smith     }
3106985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31079371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31089371c9d4SSatish Balay         x[i] = *aa;
31099371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31109371c9d4SSatish Balay       }
31119371c9d4SSatish Balay       aa++;
31129371c9d4SSatish Balay       aj++;
3113985db425SBarry Smith     }
3114985db425SBarry Smith   }
31159566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3118985db425SBarry Smith }
3119985db425SBarry Smith 
MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[])3120ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3121d71ae5a4SJacob Faibussowitsch {
3122c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3123c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3124ce496241SStefano Zampini   PetscScalar     *x;
3125ce496241SStefano Zampini   const MatScalar *aa, *av;
3126c87e5d42SMatthew Knepley 
3127c87e5d42SMatthew Knepley   PetscFunctionBegin;
31289566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3129ce496241SStefano Zampini   aa = av;
3130c87e5d42SMatthew Knepley   ai = a->i;
3131c87e5d42SMatthew Knepley   aj = a->j;
3132c87e5d42SMatthew Knepley 
31339566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31349566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
313508401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3136c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
31379371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31389371c9d4SSatish Balay     ai++;
3139f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
31409371c9d4SSatish Balay       x[i] = *aa;
31419371c9d4SSatish Balay       if (idx) idx[i] = 0;
3142f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3143f07e67edSHong Zhang       x[i] = 0.0;
3144f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3145289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3146f07e67edSHong Zhang           if (aj[j] > j) {
3147f07e67edSHong Zhang             idx[i] = j;
31482205254eSKarl Rupp             break;
31492205254eSKarl Rupp           }
3150289a08f5SMatthew Knepley         }
3151f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3152f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3153f07e67edSHong Zhang       }
3154289a08f5SMatthew Knepley     }
3155c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
31569371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
31579371c9d4SSatish Balay         x[i] = *aa;
31589371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31599371c9d4SSatish Balay       }
31609371c9d4SSatish Balay       aa++;
31619371c9d4SSatish Balay       aj++;
3162c87e5d42SMatthew Knepley     }
3163c87e5d42SMatthew Knepley   }
31649566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3167c87e5d42SMatthew Knepley }
3168c87e5d42SMatthew Knepley 
MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[])3169ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3170d71ae5a4SJacob Faibussowitsch {
3171985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3172d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3173d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3174985db425SBarry Smith   PetscScalar     *x;
3175ce496241SStefano Zampini   const MatScalar *aa, *av;
3176985db425SBarry Smith 
3177985db425SBarry Smith   PetscFunctionBegin;
317828b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3180ce496241SStefano Zampini   aa = av;
3181985db425SBarry Smith   ai = a->i;
3182985db425SBarry Smith   aj = a->j;
3183985db425SBarry Smith 
31849566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31859566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
318608401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3187985db425SBarry Smith   for (i = 0; i < m; i++) {
31889371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31899371c9d4SSatish Balay     ai++;
3190d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31919371c9d4SSatish Balay       x[i] = *aa;
31929371c9d4SSatish Balay       if (idx) idx[i] = 0;
3193985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3194985db425SBarry Smith       x[i] = 0.0;
3195985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3196985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3197985db425SBarry Smith           if (aj[j] > j) {
3198985db425SBarry Smith             idx[i] = j;
3199985db425SBarry Smith             break;
3200985db425SBarry Smith           }
3201985db425SBarry Smith         }
3202fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3203fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3204985db425SBarry Smith       }
3205985db425SBarry Smith     }
3206985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32079371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32089371c9d4SSatish Balay         x[i] = *aa;
32099371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32109371c9d4SSatish Balay       }
32119371c9d4SSatish Balay       aa++;
32129371c9d4SSatish Balay       aj++;
3213e34fafa9SBarry Smith     }
3214e34fafa9SBarry Smith   }
32159566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3218e34fafa9SBarry Smith }
3219bbead8a2SBarry Smith 
MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar ** values)3220ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3221d71ae5a4SJacob Faibussowitsch {
3222bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
322358b7e2c1SStefano Zampini   PetscInt        i, bs = A->rmap->bs, mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3224bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32250da83c2eSBarry Smith   const PetscReal shift = 0.0;
32261a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3227bbead8a2SBarry Smith 
3228bbead8a2SBarry Smith   PetscFunctionBegin;
3229a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32304a0d0026SBarry Smith   if (a->ibdiagvalid) {
32314a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32323ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
32334a0d0026SBarry Smith   }
32343a7d0413SPierre Jolivet   if (!a->ibdiag) PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag));
3235bbead8a2SBarry Smith   diag = a->ibdiag;
3236bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3237bbead8a2SBarry Smith   /* factor and invert each block */
3238bbead8a2SBarry Smith   switch (bs) {
3239bbead8a2SBarry Smith   case 1:
3240bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32419566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3242ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3243966bd95aSPierre Jolivet         PetscCheck(allowzeropivot, PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
32447b6c816cSBarry Smith         A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32457b6c816cSBarry Smith         A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
32467b6c816cSBarry Smith         A->factorerror_zeropivot_row   = i;
32479566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
3248ec1892c8SHong Zhang       }
3249bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3250bbead8a2SBarry Smith     }
3251bbead8a2SBarry Smith     break;
3252bbead8a2SBarry Smith   case 2:
3253bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32549371c9d4SSatish Balay       ij[0] = 2 * i;
32559371c9d4SSatish Balay       ij[1] = 2 * i + 1;
32569566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
32579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
32587b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32599566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3260bbead8a2SBarry Smith       diag += 4;
3261bbead8a2SBarry Smith     }
3262bbead8a2SBarry Smith     break;
3263bbead8a2SBarry Smith   case 3:
3264bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32659371c9d4SSatish Balay       ij[0] = 3 * i;
32669371c9d4SSatish Balay       ij[1] = 3 * i + 1;
32679371c9d4SSatish Balay       ij[2] = 3 * i + 2;
32689566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
32699566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
32707b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32719566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3272bbead8a2SBarry Smith       diag += 9;
3273bbead8a2SBarry Smith     }
3274bbead8a2SBarry Smith     break;
3275bbead8a2SBarry Smith   case 4:
3276bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32779371c9d4SSatish Balay       ij[0] = 4 * i;
32789371c9d4SSatish Balay       ij[1] = 4 * i + 1;
32799371c9d4SSatish Balay       ij[2] = 4 * i + 2;
32809371c9d4SSatish Balay       ij[3] = 4 * i + 3;
32819566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
32829566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
32837b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32849566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3285bbead8a2SBarry Smith       diag += 16;
3286bbead8a2SBarry Smith     }
3287bbead8a2SBarry Smith     break;
3288bbead8a2SBarry Smith   case 5:
3289bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32909371c9d4SSatish Balay       ij[0] = 5 * i;
32919371c9d4SSatish Balay       ij[1] = 5 * i + 1;
32929371c9d4SSatish Balay       ij[2] = 5 * i + 2;
32939371c9d4SSatish Balay       ij[3] = 5 * i + 3;
32949371c9d4SSatish Balay       ij[4] = 5 * i + 4;
32959566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
32969566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
32977b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32989566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3299bbead8a2SBarry Smith       diag += 25;
3300bbead8a2SBarry Smith     }
3301bbead8a2SBarry Smith     break;
3302bbead8a2SBarry Smith   case 6:
3303bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33049371c9d4SSatish Balay       ij[0] = 6 * i;
33059371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33069371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33079371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33089371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33099371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33109566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33119566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33127b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33139566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3314bbead8a2SBarry Smith       diag += 36;
3315bbead8a2SBarry Smith     }
3316bbead8a2SBarry Smith     break;
3317bbead8a2SBarry Smith   case 7:
3318bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33199371c9d4SSatish Balay       ij[0] = 7 * i;
33209371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33219371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33229371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33239371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33249371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3325cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
33269566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
33279566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
33287b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33299566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3330bbead8a2SBarry Smith       diag += 49;
3331bbead8a2SBarry Smith     }
3332bbead8a2SBarry Smith     break;
3333bbead8a2SBarry Smith   default:
33349566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3335bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3336ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
33379566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
33389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
33397b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33409566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3341bbead8a2SBarry Smith       diag += bs2;
3342bbead8a2SBarry Smith     }
33439566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3344bbead8a2SBarry Smith   }
3345bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
33463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3347bbead8a2SBarry Smith }
3348bbead8a2SBarry Smith 
MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx)3349d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3350d71ae5a4SJacob Faibussowitsch {
335173a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3352fff043a9SJunchao Zhang   PetscScalar a, *aa;
335373a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
335473a71a0fSBarry Smith 
335573a71a0fSBarry Smith   PetscFunctionBegin;
335673a71a0fSBarry Smith   if (!x->assembled) {
33579566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
335873a71a0fSBarry Smith     for (i = 0; i < m; i++) {
335973a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
33609566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
336173a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
33629566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
336373a71a0fSBarry Smith       }
336473a71a0fSBarry Smith     }
3365e2ce353bSJunchao Zhang   } else {
33669566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
33679566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
33689566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3369e2ce353bSJunchao Zhang   }
33709566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
33719566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
33723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
337373a71a0fSBarry Smith }
337473a71a0fSBarry Smith 
3375679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx)3376d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3377d71ae5a4SJacob Faibussowitsch {
3378679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3379679944adSJunchao Zhang   PetscScalar a;
3380679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3381679944adSJunchao Zhang 
3382679944adSJunchao Zhang   PetscFunctionBegin;
3383679944adSJunchao Zhang   nskip = high - low;
33849566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3385679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3386679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3387679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
33889566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3389679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3390679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
33919566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3392679944adSJunchao Zhang     }
3393e2ce353bSJunchao Zhang   }
33949566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
33959566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
33963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3397679944adSJunchao Zhang }
3398679944adSJunchao Zhang 
/*
  Operations table for the SeqAIJ matrix type.

  The initializer is positional: the k-th entry (counting from 0) fills the k-th member of
  struct _MatOps, which is declared elsewhere. The numeric comments give the slot index of the
  entry they precede. NULL marks a slot for which this table supplies no function.
*/
33990a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3400cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3401cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3402cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
340397304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34047c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34057c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3406f4259b30SLisandro Dalcin                                        NULL,
3407f4259b30SLisandro Dalcin                                        NULL,
3408f4259b30SLisandro Dalcin                                        NULL,
3409f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3410cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3411f4259b30SLisandro Dalcin                                        NULL,
341241f059aeSBarry Smith                                        MatSOR_SeqAIJ,
341391e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
341497304618SKris Buschelman                                        /* 15*/ MatGetInfo_SeqAIJ,
3415cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3416cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3417cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3418cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3419f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3420cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3421cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3422cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3423d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3424f4259b30SLisandro Dalcin                                        NULL,
3425f4259b30SLisandro Dalcin                                        NULL,
3426f4259b30SLisandro Dalcin                                        NULL,
3427f4259b30SLisandro Dalcin                                        NULL,
342826cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3429f4259b30SLisandro Dalcin                                        NULL,
3430f4259b30SLisandro Dalcin                                        NULL,
3431f4259b30SLisandro Dalcin                                        NULL,
3432f4259b30SLisandro Dalcin                                        NULL,
3433d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3434f4259b30SLisandro Dalcin                                        NULL,
3435f4259b30SLisandro Dalcin                                        NULL,
3436cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3437f4259b30SLisandro Dalcin                                        NULL,
3438d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
34397dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3440cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3441cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3442cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3443d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3444cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
34457d68702bSBarry Smith                                        MatShift_SeqAIJ,
344679299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
34476e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
344873a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
34493b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
34503b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
34513b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3452a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
345393dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3454f4259b30SLisandro Dalcin                                        NULL,
3455f4259b30SLisandro Dalcin                                        NULL,
3456cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3457f4259b30SLisandro Dalcin                                        NULL,
3458f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3459b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3460b9b97703SBarry Smith                                        MatView_SeqAIJ,
3461f4259b30SLisandro Dalcin                                        NULL,
3462f4259b30SLisandro Dalcin                                        NULL,
34638bb0f5c6SPierre Jolivet                                        /* 64*/ MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3464f4259b30SLisandro Dalcin                                        NULL,
3465f4259b30SLisandro Dalcin                                        NULL,
3466f4259b30SLisandro Dalcin                                        NULL,
34678bb0f5c6SPierre Jolivet                                        MatGetRowMaxAbs_SeqAIJ,
34688bb0f5c6SPierre Jolivet                                        /* 69*/ MatGetRowMinAbs_SeqAIJ,
3469f4259b30SLisandro Dalcin                                        NULL,
3470f4259b30SLisandro Dalcin                                        NULL,
34713acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3472f4259b30SLisandro Dalcin                                        NULL,
34738bb0f5c6SPierre Jolivet                                        /* 74*/ MatFindZeroDiagonals_SeqAIJ,
3474f4259b30SLisandro Dalcin                                        NULL,
3475f4259b30SLisandro Dalcin                                        NULL,
3476f4259b30SLisandro Dalcin                                        NULL,
3477bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
34788bb0f5c6SPierre Jolivet                                        /* 79*/ NULL,
34798bb0f5c6SPierre Jolivet                                        NULL,
34808bb0f5c6SPierre Jolivet                                        NULL,
34818bb0f5c6SPierre Jolivet                                        NULL,
34828bb0f5c6SPierre Jolivet                                        NULL,
34836cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
348426be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
34858bb0f5c6SPierre Jolivet                                        MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3486f4259b30SLisandro Dalcin                                        NULL,
34876fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
34888bb0f5c6SPierre Jolivet                                        /* 89*/ NULL,
34898bb0f5c6SPierre Jolivet                                        MatProductSetFromOptions_SeqAIJ,
3490f4259b30SLisandro Dalcin                                        NULL,
3491f4259b30SLisandro Dalcin                                        NULL,
349287d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
34938bb0f5c6SPierre Jolivet                                        /* 94*/ NULL,
34948bb0f5c6SPierre Jolivet                                        MatSetValuesRow_SeqAIJ,
349599cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3496f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3497f4259b30SLisandro Dalcin                                        NULL,
34988bb0f5c6SPierre Jolivet                                        /* 99*/ NULL,
34998bb0f5c6SPierre Jolivet                                        MatMatSolve_SeqAIJ,
3500f4259b30SLisandro Dalcin                                        NULL,
35012af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3502f4259b30SLisandro Dalcin                                        NULL,
3503421480d9SBarry Smith                                        /*104*/ NULL,
3504f4259b30SLisandro Dalcin                                        NULL,
3505f4259b30SLisandro Dalcin                                        NULL,
3506f4259b30SLisandro Dalcin                                        NULL,
3507f4259b30SLisandro Dalcin                                        NULL,
35088bb0f5c6SPierre Jolivet                                        /*109*/ NULL,
3509f4259b30SLisandro Dalcin                                        NULL,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
3512421480d9SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
3513421480d9SBarry Smith                                        /*114*/ MatFindNonzeroRows_SeqAIJ,
3514a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
351537868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
35160da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3517f4259b30SLisandro Dalcin                                        NULL,
3518421480d9SBarry Smith                                        /*119*/ NULL,
3519f4259b30SLisandro Dalcin                                        NULL,
352075648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3521b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3522421480d9SBarry Smith                                        MatTransColoringApplySpToDen_SeqAIJ,
3523421480d9SBarry Smith                                        /*124*/ MatTransColoringApplyDenToSp_SeqAIJ,
35243964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
35258bb0f5c6SPierre Jolivet                                        NULL,
35268bb0f5c6SPierre Jolivet                                        NULL,
3527421480d9SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
3528421480d9SBarry Smith                                        /*129*/ MatFindOffBlockDiagonalEntries_SeqAIJ,
35298bb0f5c6SPierre Jolivet                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
35308bb0f5c6SPierre Jolivet                                        MatDestroySubMatrices_SeqAIJ,
35318bb0f5c6SPierre Jolivet                                        NULL,
3532421480d9SBarry Smith                                        NULL,
3533421480d9SBarry Smith                                        /*134*/ MatCreateGraph_Simple_AIJ,
35348bb0f5c6SPierre Jolivet                                        MatTransposeSymbolic_SeqAIJ,
35358bb0f5c6SPierre Jolivet                                        MatEliminateZeros_SeqAIJ,
35368bb0f5c6SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
3537f4259b30SLisandro Dalcin                                        NULL,
3538421480d9SBarry Smith                                        /*139*/ NULL,
3539f4259b30SLisandro Dalcin                                        NULL,
354003db1824SAlex Lindsay                                        MatCopyHashToXAIJ_Seq_Hash,
3541c2be7ffeSStefano Zampini                                        NULL,
354203db1824SAlex Lindsay                                        NULL};
354317ab2063SBarry Smith 
MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt * indices)3544ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3545d71ae5a4SJacob Faibussowitsch {
3546bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
354797f1f81fSBarry Smith   PetscInt    i, nz, n;
3548bef8e0ddSBarry Smith 
3549bef8e0ddSBarry Smith   PetscFunctionBegin;
3550bef8e0ddSBarry Smith   nz = aij->maxnz;
3551d0f46423SBarry Smith   n  = mat->rmap->n;
3552ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3553bef8e0ddSBarry Smith   aij->nz = nz;
3554ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
35553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3556bef8e0ddSBarry Smith }
3557bef8e0ddSBarry Smith 
3558a3bb6f32SFande Kong /*
3559ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3560ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3561ddea5d60SJunchao Zhang  */
MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat,ISLocalToGlobalMapping * mapping)3562d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3563d71ae5a4SJacob Faibussowitsch {
3564a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3565eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3566eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
356725b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
356825b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3569a3bb6f32SFande Kong 
3570a3bb6f32SFande Kong   PetscFunctionBegin;
3571a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
35724f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3573a3bb6f32SFande Kong   /* use a table */
3574eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3575a3bb6f32SFande Kong   ec = 0;
357625b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
357725b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3578eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3579a3bb6f32SFande Kong     if (!data) {
3580a3bb6f32SFande Kong       /* one based table */
3581c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3582a3bb6f32SFande Kong     }
3583a3bb6f32SFande Kong   }
3584a3bb6f32SFande Kong   /* form array of columns we need */
35859566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3586eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3587eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3588eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3589eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3590eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3591a3bb6f32SFande Kong     gid--;
3592a3bb6f32SFande Kong     lid--;
3593a3bb6f32SFande Kong     garray[lid] = gid;
3594a3bb6f32SFande Kong   }
35959566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3596eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3597c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3598a3bb6f32SFande Kong   /* compact out the extra columns in B */
359925b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
360025b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3601eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3602a3bb6f32SFande Kong     lid--;
360325b670f0SStefano Zampini     jj[i] = lid;
3604a3bb6f32SFande Kong   }
36059566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3606eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36079566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36089566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36099566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3611a3bb6f32SFande Kong }
3612a3bb6f32SFande Kong 
3613bef8e0ddSBarry Smith /*@
3614bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3615bef8e0ddSBarry Smith   in the matrix.
3616bef8e0ddSBarry Smith 
3617bef8e0ddSBarry Smith   Input Parameters:
361811a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3619bef8e0ddSBarry Smith - indices - the column indices
3620bef8e0ddSBarry Smith 
362115091d37SBarry Smith   Level: advanced
362215091d37SBarry Smith 
3623bef8e0ddSBarry Smith   Notes:
3624bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3625bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
362611a5261eSBarry Smith   of the `MatSetValues()` operation.
3627bef8e0ddSBarry Smith 
3628bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
362911a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the column indices MUST be sorted.
3630bef8e0ddSBarry Smith 
363111a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3632bef8e0ddSBarry Smith 
3633b9617806SBarry Smith   The indices should start with zero, not one.
3634b9617806SBarry Smith 
36351cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3636bef8e0ddSBarry Smith @*/
MatSeqAIJSetColumnIndices(Mat mat,PetscInt * indices)3637d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3638d71ae5a4SJacob Faibussowitsch {
3639bef8e0ddSBarry Smith   PetscFunctionBegin;
  /* argument checks: mat must be a Mat object and indices a usable pointer */
36400700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36414f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
  /* forward to the function composed on mat under the name "MatSeqAIJSetColumnIndices_C";
     per the PETSc documentation PetscUseMethod() raises an error when no such function is attached */
3642cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
36433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3644bef8e0ddSBarry Smith }
3645bef8e0ddSBarry Smith 
MatStoreValues_SeqAIJ(Mat mat)3646ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3647d71ae5a4SJacob Faibussowitsch {
3648be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3649d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3650be6bf707SBarry Smith 
3651be6bf707SBarry Smith   PetscFunctionBegin;
365228b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3653be6bf707SBarry Smith 
3654be6bf707SBarry Smith   /* allocate space for values if not already there */
36553a7d0413SPierre Jolivet   if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values));
3656be6bf707SBarry Smith 
3657be6bf707SBarry Smith   /* copy values over */
36589566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
36593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3660be6bf707SBarry Smith }
3661be6bf707SBarry Smith 
3662be6bf707SBarry Smith /*@
366320f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3664be6bf707SBarry Smith   nonlinear portion.
3665be6bf707SBarry Smith 
3666c3339decSBarry Smith   Logically Collective
3667be6bf707SBarry Smith 
366827430b45SBarry Smith   Input Parameter:
366911a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3670be6bf707SBarry Smith 
367115091d37SBarry Smith   Level: advanced
367215091d37SBarry Smith 
36732920cce0SJacob Faibussowitsch   Example Usage:
367427430b45SBarry Smith .vb
36752ef1f0ffSBarry Smith     Using SNES
367627430b45SBarry Smith     Create Jacobian matrix
367727430b45SBarry Smith     Set linear terms into matrix
367827430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
367927430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
368027430b45SBarry Smith       boundary conditions again will not change the nonzero structure)
368127430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
368227430b45SBarry Smith     MatStoreValues(mat);
368327430b45SBarry Smith     Call SNESSetJacobian() with matrix
368427430b45SBarry Smith     In your Jacobian routine
368527430b45SBarry Smith       MatRetrieveValues(mat);
368627430b45SBarry Smith       Set nonlinear terms in matrix
3687be6bf707SBarry Smith 
368827430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
368927430b45SBarry Smith     // build linear portion of Jacobian
369027430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
369127430b45SBarry Smith     MatStoreValues(mat);
369227430b45SBarry Smith     loop over nonlinear iterations
369327430b45SBarry Smith        MatRetrieveValues(mat);
369427430b45SBarry Smith        // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
369527430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
369627430b45SBarry Smith        Solve linear system with Jacobian
369727430b45SBarry Smith     endloop
369827430b45SBarry Smith .ve
3699be6bf707SBarry Smith 
3700be6bf707SBarry Smith   Notes:
3701da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
370211a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3703be6bf707SBarry Smith   calling this routine.
3704be6bf707SBarry Smith 
37050c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37060c468ba9SBarry Smith   and does not allocate additional space.
37070c468ba9SBarry Smith 
3708fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3709be6bf707SBarry Smith @*/
MatStoreValues(Mat mat)3710d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3711d71ae5a4SJacob Faibussowitsch {
3712be6bf707SBarry Smith   PetscFunctionBegin;
37130700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only an assembled, unfactored matrix is accepted; anything else is PETSC_ERR_ARG_WRONGSTATE */
371428b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
371528b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* forward to the function composed on mat under the name "MatStoreValues_C";
     per the PETSc documentation PetscUseMethod() raises an error when no such function is attached */
3716cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
37173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3718be6bf707SBarry Smith }
3719be6bf707SBarry Smith 
MatRetrieveValues_SeqAIJ(Mat mat)3720ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3721d71ae5a4SJacob Faibussowitsch {
3722be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3723d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3724be6bf707SBarry Smith 
3725be6bf707SBarry Smith   PetscFunctionBegin;
372628b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
372728b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3728be6bf707SBarry Smith   /* copy values over */
37299566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
37303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3731be6bf707SBarry Smith }
3732be6bf707SBarry Smith 
3733be6bf707SBarry Smith /*@
373420f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3735be6bf707SBarry Smith 
3736c3339decSBarry Smith   Logically Collective
3737be6bf707SBarry Smith 
37382fe279fdSBarry Smith   Input Parameter:
373911a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3740be6bf707SBarry Smith 
374115091d37SBarry Smith   Level: advanced
374215091d37SBarry Smith 
37431cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3744be6bf707SBarry Smith @*/
MatRetrieveValues(Mat mat)3745d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3746d71ae5a4SJacob Faibussowitsch {
3747be6bf707SBarry Smith   PetscFunctionBegin;
37480700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only an assembled, unfactored matrix is accepted; anything else is PETSC_ERR_ARG_WRONGSTATE */
374928b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
375028b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* forward to the function composed on mat under the name "MatRetrieveValues_C";
     per the PETSc documentation PetscUseMethod() raises an error when no such function is attached */
3751cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
37523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3753be6bf707SBarry Smith }
3754be6bf707SBarry Smith 
37555d83a8b1SBarry Smith /*@
375611a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
37570d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
375820f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
375920f4b53cSBarry Smith   (or the array `nnz`).
376017ab2063SBarry Smith 
3761d083f849SBarry Smith   Collective
3762db81eaa0SLois Curfman McInnes 
376317ab2063SBarry Smith   Input Parameters:
376411a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
376517ab2063SBarry Smith . m    - number of rows
376617ab2063SBarry Smith . n    - number of columns
376717ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
376851c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
37690298fd71SBarry Smith          (possibly different for each row) or NULL
377017ab2063SBarry Smith 
377117ab2063SBarry Smith   Output Parameter:
3772416022c9SBarry Smith . A - the matrix
377317ab2063SBarry Smith 
37742ef1f0ffSBarry Smith   Options Database Keys:
37752ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
37762ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
37772ef1f0ffSBarry Smith 
37782ef1f0ffSBarry Smith   Level: intermediate
3779175b88e8SBarry Smith 
3780b259b22eSLois Curfman McInnes   Notes:
378177433607SBarry Smith   It is recommended to use `MatCreateFromOptions()` instead of this routine
378277433607SBarry Smith 
37832ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
378449a6f317SBarry Smith 
37852ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
37862ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
37870002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
37882ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
378917ab2063SBarry Smith 
379020f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
37912ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
379220f4b53cSBarry Smith   allocation.
379317ab2063SBarry Smith 
3794682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
37954fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3796682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
37976c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
37986c7ebb05SLois Curfman McInnes 
37991cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
380017ab2063SBarry Smith @*/
MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat * A)3801d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3802d71ae5a4SJacob Faibussowitsch {
38033a40ed3dSBarry Smith   PetscFunctionBegin;
38049566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
  /* the same m x n is passed for both the local and the global sizes */
38059566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38069566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the type was just set to MATSEQAIJ, so the SeqAIJ preallocation routine is called directly
     rather than through the dispatching MatSeqAIJSetPreallocation() */
38079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3809273d9f13SBarry Smith }
3810273d9f13SBarry Smith 
38115d83a8b1SBarry Smith /*@
3812273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3813273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3814273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3815273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3816273d9f13SBarry Smith 
3817d083f849SBarry Smith   Collective
3818273d9f13SBarry Smith 
3819273d9f13SBarry Smith   Input Parameters:
38201c4f3114SJed Brown + B   - The matrix
3821273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3822273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
38230298fd71SBarry Smith          (possibly different for each row) or NULL
3824273d9f13SBarry Smith 
38252ef1f0ffSBarry Smith   Options Database Keys:
38262ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38272ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38282ef1f0ffSBarry Smith 
38292ef1f0ffSBarry Smith   Level: intermediate
38302ef1f0ffSBarry Smith 
3831273d9f13SBarry Smith   Notes:
38322ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
383349a6f317SBarry Smith 
383411a5261eSBarry Smith   The `MATSEQAIJ` format also called
38352ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3836273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3837273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3838273d9f13SBarry Smith 
38392ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38402ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
38412ef1f0ffSBarry Smith   allocation.
3842273d9f13SBarry Smith 
384311a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3844aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3845aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3846aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3847aa95bbe8SBarry Smith 
384811a5261eSBarry Smith   Developer Notes:
384911a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3850a96a251dSBarry Smith   entries or column indices
3851a96a251dSBarry Smith 
3852273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3853273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3854273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3855273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3856273d9f13SBarry Smith 
38571cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3858db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3859273d9f13SBarry Smith @*/
MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[])3860d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3861d71ae5a4SJacob Faibussowitsch {
3862a23d5eceSKris Buschelman   PetscFunctionBegin;
  /* B must be a Mat object whose type has already been set */
38636ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
38646ba663aaSJed Brown   PetscValidType(B, 1);
  /* forward to the function composed on B under the name "MatSeqAIJSetPreallocation_C";
     per the PETSc documentation PetscTryMethod() does nothing when no such function is attached */
3865cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
38663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3867a23d5eceSKris Buschelman }
3868a23d5eceSKris Buschelman 
MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt * nnz)3869d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3870d71ae5a4SJacob Faibussowitsch {
3871ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
38722576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
387397f1f81fSBarry Smith   PetscInt    i;
3874273d9f13SBarry Smith 
3875273d9f13SBarry Smith   PetscFunctionBegin;
3876ad79cf63SBarry Smith   if (B->hash_active) {
3877aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3878ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3879ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3880ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3881ad79cf63SBarry Smith   }
38822576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3883a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3884c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3885c461c341SBarry Smith     nz             = 0;
3886c461c341SBarry Smith   }
38879566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
38889566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3889899cda47SBarry Smith 
3890435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
389108401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
38929f0612e4SBarry Smith   if (nnz) {
3893d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
389408401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
389508401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3896b73539f3SBarry Smith     }
3897b73539f3SBarry Smith   }
3898b73539f3SBarry Smith 
3899273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3900ab93d7beSBarry Smith   if (!skipallocation) {
39013a7d0413SPierre Jolivet     if (!b->imax) PetscCall(PetscMalloc1(B->rmap->n, &b->imax));
3902071fcb05SBarry Smith     if (!b->ilen) {
3903071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39049566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3905071fcb05SBarry Smith     } else {
39069566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39072ee49352SLisandro Dalcin     }
3908aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3909273d9f13SBarry Smith     if (!nnz) {
3910435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3911c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39125d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3913d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3914c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
3915273d9f13SBarry Smith     } else {
3916c73702f5SBarry Smith       PetscInt64 nz64 = 0;
39179371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
39189371c9d4SSatish Balay         b->imax[i] = nnz[i];
39199371c9d4SSatish Balay         nz64 += nnz[i];
39209371c9d4SSatish Balay       }
39219566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
3922273d9f13SBarry Smith     }
3923ab93d7beSBarry Smith 
3924273d9f13SBarry Smith     /* allocate the matrix space */
39259566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
39269f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
39279f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
39289f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
3929396832f4SHong Zhang     if (B->structure_only) {
39309f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
3931396832f4SHong Zhang     } else {
39329f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
39339f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
3934396832f4SHong Zhang     }
3935bfeeae90SHong Zhang     b->i[0] = 0;
3936ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
3937c461c341SBarry Smith   } else {
3938e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
3939e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
3940c461c341SBarry Smith   }
3941273d9f13SBarry Smith 
3942846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
3943846b4da1SFande Kong     /* reserve user-requested sparsity */
39449566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
3945846b4da1SFande Kong   }
3946846b4da1SFande Kong 
3947273d9f13SBarry Smith   b->nz               = 0;
3948273d9f13SBarry Smith   b->maxnz            = nz;
3949273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
39501baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
3951cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
3952cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
39535519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
39545519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
39555519a089SJose E. Roman   */
39565519a089SJose E. Roman   B->nonzerostate++;
39573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3958273d9f13SBarry Smith }
3959273d9f13SBarry Smith 
MatResetPreallocation_SeqAIJ_Private(Mat A,PetscBool * memoryreset)39604c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset)
3961d71ae5a4SJacob Faibussowitsch {
3962846b4da1SFande Kong   Mat_SeqAIJ *a;
3963a5bbaf83SFande Kong   PetscInt    i;
39641f14be2bSBarry Smith   PetscBool   skipreset;
3965846b4da1SFande Kong 
3966846b4da1SFande Kong   PetscFunctionBegin;
3967846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
396814d0e64fSAlex Lindsay 
39694c51d546SAlexander   PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()");
39704c51d546SAlexander   if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS);
39714c51d546SAlexander 
397214d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
39733ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
397414d0e64fSAlex Lindsay 
3975846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
39762c814fdeSFande Kong   /* if no saved info, we error out */
397728b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
39782c814fdeSFande Kong 
39791f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation ");
39802c814fdeSFande Kong 
39811f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
39824c51d546SAlexander   if (skipreset) PetscCall(MatZeroEntries(A));
39834c51d546SAlexander   else {
39849566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
39859566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
3986846b4da1SFande Kong     a->i[0] = 0;
3987ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
3988846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
3989846b4da1SFande Kong     a->nz               = 0;
3990846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
3991846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
3992846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
3993846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
3994b3a35320SAlex Lindsay     A->nonzerostate++;
3995b3a35320SAlex Lindsay     /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */
3996b3a35320SAlex Lindsay     PetscCall(PetscObjectStateIncrease((PetscObject)A));
39971f14be2bSBarry Smith   }
39984c51d546SAlexander   if (memoryreset) *memoryreset = (PetscBool)!skipreset;
39994c51d546SAlexander   PetscFunctionReturn(PETSC_SUCCESS);
40004c51d546SAlexander }
40014c51d546SAlexander 
MatResetPreallocation_SeqAIJ(Mat A)40024c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
40034c51d546SAlexander {
40044c51d546SAlexander   PetscFunctionBegin;
40054c51d546SAlexander   PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL));
40063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4007846b4da1SFande Kong }
4008846b4da1SFande Kong 
400958d36128SBarry Smith /*@
401011a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4011a1661176SMatthew Knepley 
4012a1661176SMatthew Knepley   Input Parameters:
4013a1661176SMatthew Knepley + B - the matrix
4014d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4015d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4016d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4017a1661176SMatthew Knepley 
4018a1661176SMatthew Knepley   Level: developer
4019a1661176SMatthew Knepley 
40206a9b8d82SBarry Smith   Notes:
40212ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
402258d36128SBarry Smith 
40236a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40246a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
40256a9b8d82SBarry Smith 
40266a9b8d82SBarry Smith   Developer Notes:
40272ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
40282ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
40296a9b8d82SBarry Smith 
403011a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40316a9b8d82SBarry Smith 
4032fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4033a1661176SMatthew Knepley @*/
MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[])4034d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4035d71ae5a4SJacob Faibussowitsch {
4036a1661176SMatthew Knepley   PetscFunctionBegin;
40370700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
40386ba663aaSJed Brown   PetscValidType(B, 1);
4039cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
40403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4041a1661176SMatthew Knepley }
4042a1661176SMatthew Knepley 
MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[])4043ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4044d71ae5a4SJacob Faibussowitsch {
4045a1661176SMatthew Knepley   PetscInt  i;
4046a1661176SMatthew Knepley   PetscInt  m, n;
4047a1661176SMatthew Knepley   PetscInt  nz;
40486a9b8d82SBarry Smith   PetscInt *nnz;
4049a1661176SMatthew Knepley 
4050a1661176SMatthew Knepley   PetscFunctionBegin;
4051aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4052779a8d59SSatish Balay 
40539566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
40549566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4055779a8d59SSatish Balay 
40569566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
40579566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4058a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4059b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
406008401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4061a1661176SMatthew Knepley     nnz[i] = nz;
4062a1661176SMatthew Knepley   }
40639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
40649566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4065a1661176SMatthew Knepley 
40668e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4067a1661176SMatthew Knepley 
40689566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
40699566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4070a1661176SMatthew Knepley 
40719566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
40723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4073a1661176SMatthew Knepley }
4074a1661176SMatthew Knepley 
4075ad7e164aSPierre Jolivet /*@
40762ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4077ad7e164aSPierre Jolivet 
4078ad7e164aSPierre Jolivet   Input Parameters:
4079ad7e164aSPierre Jolivet + A     - left-hand side matrix
4080ad7e164aSPierre Jolivet . B     - right-hand side matrix
408111a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4082ad7e164aSPierre Jolivet 
4083ad7e164aSPierre Jolivet   Output Parameter:
40842ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4085ad7e164aSPierre Jolivet 
4086ad7e164aSPierre Jolivet   Level: intermediate
4087ad7e164aSPierre Jolivet 
408811a5261eSBarry Smith   Note:
408911a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed since the last call to `MatSeqAIJKron()`.
4090ad7e164aSPierre Jolivet 
40911cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4092ad7e164aSPierre Jolivet @*/
MatSeqAIJKron(Mat A,Mat B,MatReuse reuse,Mat * C)4093d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4094d71ae5a4SJacob Faibussowitsch {
4095ad7e164aSPierre Jolivet   PetscFunctionBegin;
4096ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4097ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4098ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4099ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41004f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4101ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4102ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4103ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4104ad7e164aSPierre Jolivet   }
4105cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4107ad7e164aSPierre Jolivet }
4108ad7e164aSPierre Jolivet 
MatSeqAIJKron_SeqAIJ(Mat A,Mat B,MatReuse reuse,Mat * C)4109ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4110d71ae5a4SJacob Faibussowitsch {
4111ad7e164aSPierre Jolivet   Mat                newmat;
4112ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4113ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4114ad7e164aSPierre Jolivet   PetscScalar       *v;
4115fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4116ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4117ad7e164aSPierre Jolivet   PetscBool          flg;
4118ad7e164aSPierre Jolivet 
4119ad7e164aSPierre Jolivet   PetscFunctionBegin;
412028b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
412128b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
412228b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
412328b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41249566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
412528b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4126aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4127ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41289566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41299566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
41309566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
41319566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4132ad7e164aSPierre Jolivet     i[0] = 0;
4133ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4134ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4135ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4136ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4137ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4138ad7e164aSPierre Jolivet         }
4139ad7e164aSPierre Jolivet       }
4140ad7e164aSPierre Jolivet     }
41419566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4142ad7e164aSPierre Jolivet     *C = newmat;
41439566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4144ad7e164aSPierre Jolivet     nnz = 0;
4145ad7e164aSPierre Jolivet   }
41469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
41479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
41489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4149ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4150ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4151ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4152ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4153ad7e164aSPierre Jolivet       }
4154ad7e164aSPierre Jolivet     }
4155ad7e164aSPierre Jolivet   }
41569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
41579566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
41589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
41593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4160ad7e164aSPierre Jolivet }
4161ad7e164aSPierre Jolivet 
4162c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4163af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4164170fe5c8SBarry Smith 
4165170fe5c8SBarry Smith /*
4166170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4167170fe5c8SBarry Smith 
4168170fe5c8SBarry Smith                n                       p                          p
41692da392ccSBarry Smith         [             ]       [             ]         [                 ]
41702da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
41712da392ccSBarry Smith         [             ]       [             ]         [                 ]
4172170fe5c8SBarry Smith 
4173170fe5c8SBarry Smith */
MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C)4174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4175d71ae5a4SJacob Faibussowitsch {
4176170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4177170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4178170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
417986214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4180170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4181170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4182170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
418386214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
418486214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4185170fe5c8SBarry Smith 
4186170fe5c8SBarry Smith   PetscFunctionBegin;
4187d0f46423SBarry Smith   m = A->rmap->n;
4188d0f46423SBarry Smith   n = A->cmap->n;
4189d0f46423SBarry Smith   p = B->cmap->n;
4190170fe5c8SBarry Smith   a = sub_a->v;
4191170fe5c8SBarry Smith   b = sub_b->a;
4192170fe5c8SBarry Smith   c = sub_c->v;
419386214ceeSStefano Zampini   if (clda == m) {
41949566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
419586214ceeSStefano Zampini   } else {
419686214ceeSStefano Zampini     for (j = 0; j < p; j++)
41979371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
419886214ceeSStefano Zampini   }
4199170fe5c8SBarry Smith   ii  = sub_b->i;
4200170fe5c8SBarry Smith   idx = sub_b->j;
4201170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4202170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4203170fe5c8SBarry Smith     while (q-- > 0) {
420486214ceeSStefano Zampini       c_q = c + clda * (*idx);
420586214ceeSStefano Zampini       a_q = a + alda * i;
4206854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4207170fe5c8SBarry Smith       idx++;
4208170fe5c8SBarry Smith       b++;
4209170fe5c8SBarry Smith     }
4210170fe5c8SBarry Smith   }
42113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4212170fe5c8SBarry Smith }
4213170fe5c8SBarry Smith 
MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C)4214d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4215d71ae5a4SJacob Faibussowitsch {
4216d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
421786214ceeSStefano Zampini   PetscBool cisdense;
4218170fe5c8SBarry Smith 
4219170fe5c8SBarry Smith   PetscFunctionBegin;
422008401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42219566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42229566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4223d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
422448a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42259566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4226d73949e8SHong Zhang 
42274222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
42283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4229170fe5c8SBarry Smith }
4230170fe5c8SBarry Smith 
42310bad9183SKris Buschelman /*MC
4232fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
42330bad9183SKris Buschelman    based on compressed sparse row format.
42340bad9183SKris Buschelman 
42352ef1f0ffSBarry Smith    Options Database Key:
42360bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
42370bad9183SKris Buschelman 
42380bad9183SKris Buschelman    Level: beginner
42390bad9183SKris Buschelman 
42400cd7f59aSBarry Smith    Notes:
42412ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
42420cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
42430cd7f59aSBarry Smith     in the matrix
42440cd7f59aSBarry Smith 
424511a5261eSBarry Smith     `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
424611a5261eSBarry Smith     space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
42470cd7f59aSBarry Smith 
424811a5261eSBarry Smith   Developer Note:
42492ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
42500cd7f59aSBarry Smith 
42511cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
42520bad9183SKris Buschelman M*/
42530bad9183SKris Buschelman 
4254ccd284c7SBarry Smith /*MC
4255ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4256ccd284c7SBarry Smith 
425711a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
425811a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
425911a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4260ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4261ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4262ccd284c7SBarry Smith 
42632ef1f0ffSBarry Smith    Options Database Key:
426411a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4265ccd284c7SBarry Smith 
42662ef1f0ffSBarry Smith   Level: beginner
42672ef1f0ffSBarry Smith 
426811a5261eSBarry Smith    Note:
426911a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
4270ccd284c7SBarry Smith    enough exist.
4271ccd284c7SBarry Smith 
42721cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4273ccd284c7SBarry Smith M*/
4274ccd284c7SBarry Smith 
4275ccd284c7SBarry Smith /*MC
4276ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4277ccd284c7SBarry Smith 
42782ef1f0ffSBarry Smith    Options Database Key:
42792ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
42802ef1f0ffSBarry Smith 
42812ef1f0ffSBarry Smith   Level: beginner
42822ef1f0ffSBarry Smith 
42832ef1f0ffSBarry Smith    Note:
428411a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
428511a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
428611a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4287ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4288ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4289ccd284c7SBarry Smith 
42901cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4291ccd284c7SBarry Smith M*/
4292ccd284c7SBarry Smith 
42937906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
42947906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
42957906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
42967906f579SHong Zhang #endif
4297d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
4298d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4299d24d4204SJose E. Roman #endif
43007906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43017906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43027906f579SHong Zhang #endif
43037906f579SHong Zhang 
4304d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4305c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43064222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43077906f579SHong Zhang 
43088c778c55SBarry Smith /*@C
430911a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43108c778c55SBarry Smith 
43118c778c55SBarry Smith   Not Collective
43128c778c55SBarry Smith 
43138c778c55SBarry Smith   Input Parameter:
4314fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43158c778c55SBarry Smith 
43168c778c55SBarry Smith   Output Parameter:
43178c778c55SBarry Smith . array - pointer to the data
43188c778c55SBarry Smith 
43198c778c55SBarry Smith   Level: intermediate
43208c778c55SBarry Smith 
4321ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
43228c778c55SBarry Smith @*/
MatSeqAIJGetArray(Mat A,PetscScalar * array[])43235d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4324d71ae5a4SJacob Faibussowitsch {
4325d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43268c778c55SBarry Smith 
43278c778c55SBarry Smith   PetscFunctionBegin;
4328d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
43299566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4330d67d9f35SJunchao Zhang   } else {
4331d67d9f35SJunchao Zhang     *array = aij->a;
4332d67d9f35SJunchao Zhang   }
43333ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4334d67d9f35SJunchao Zhang }
4335d67d9f35SJunchao Zhang 
4336d67d9f35SJunchao Zhang /*@C
433711a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4338d67d9f35SJunchao Zhang 
4339d67d9f35SJunchao Zhang   Not Collective
4340d67d9f35SJunchao Zhang 
4341d67d9f35SJunchao Zhang   Input Parameters:
4342fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4343d67d9f35SJunchao Zhang - array - pointer to the data
4344d67d9f35SJunchao Zhang 
4345d67d9f35SJunchao Zhang   Level: intermediate
4346d67d9f35SJunchao Zhang 
4347ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`
4348d67d9f35SJunchao Zhang @*/
MatSeqAIJRestoreArray(Mat A,PetscScalar * array[])43495d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4350d71ae5a4SJacob Faibussowitsch {
4351d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4352d67d9f35SJunchao Zhang 
4353d67d9f35SJunchao Zhang   PetscFunctionBegin;
4354d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
43559566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4356d67d9f35SJunchao Zhang   } else {
4357d67d9f35SJunchao Zhang     *array = NULL;
4358d67d9f35SJunchao Zhang   }
43599566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
43603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
43618c778c55SBarry Smith }
43628c778c55SBarry Smith 
436321e72a00SBarry Smith /*@C
436411a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
43658f1ea47aSStefano Zampini 
43660ab4885dSBarry Smith   Not Collective; No Fortran Support
43678f1ea47aSStefano Zampini 
43688f1ea47aSStefano Zampini   Input Parameter:
4369fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43708f1ea47aSStefano Zampini 
43718f1ea47aSStefano Zampini   Output Parameter:
43728f1ea47aSStefano Zampini . array - pointer to the data
43738f1ea47aSStefano Zampini 
43748f1ea47aSStefano Zampini   Level: intermediate
43758f1ea47aSStefano Zampini 
43761cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
43778f1ea47aSStefano Zampini @*/
MatSeqAIJGetArrayRead(Mat A,const PetscScalar * array[])43785d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4379d71ae5a4SJacob Faibussowitsch {
4380d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43818f1ea47aSStefano Zampini 
43828f1ea47aSStefano Zampini   PetscFunctionBegin;
4383d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
43849566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4385d67d9f35SJunchao Zhang   } else {
4386d67d9f35SJunchao Zhang     *array = aij->a;
4387d67d9f35SJunchao Zhang   }
43883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
43898f1ea47aSStefano Zampini }
43908f1ea47aSStefano Zampini 
43918f1ea47aSStefano Zampini /*@C
439211a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
43938f1ea47aSStefano Zampini 
43940ab4885dSBarry Smith   Not Collective; No Fortran Support
43958f1ea47aSStefano Zampini 
43968f1ea47aSStefano Zampini   Input Parameter:
4397fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43988f1ea47aSStefano Zampini 
43998f1ea47aSStefano Zampini   Output Parameter:
44008f1ea47aSStefano Zampini . array - pointer to the data
44018f1ea47aSStefano Zampini 
44028f1ea47aSStefano Zampini   Level: intermediate
44038f1ea47aSStefano Zampini 
44041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44058f1ea47aSStefano Zampini @*/
MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar * array[])44065d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4407d71ae5a4SJacob Faibussowitsch {
4408d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44098f1ea47aSStefano Zampini 
44108f1ea47aSStefano Zampini   PetscFunctionBegin;
4411d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44129566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4413d67d9f35SJunchao Zhang   } else {
4414d67d9f35SJunchao Zhang     *array = NULL;
4415d67d9f35SJunchao Zhang   }
44163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4417d67d9f35SJunchao Zhang }
4418d67d9f35SJunchao Zhang 
4419d67d9f35SJunchao Zhang /*@C
442011a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4421d67d9f35SJunchao Zhang 
44220ab4885dSBarry Smith   Not Collective; No Fortran Support
4423d67d9f35SJunchao Zhang 
4424d67d9f35SJunchao Zhang   Input Parameter:
4425fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4426d67d9f35SJunchao Zhang 
4427d67d9f35SJunchao Zhang   Output Parameter:
4428d67d9f35SJunchao Zhang . array - pointer to the data
4429d67d9f35SJunchao Zhang 
4430d67d9f35SJunchao Zhang   Level: intermediate
4431d67d9f35SJunchao Zhang 
44321cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4433d67d9f35SJunchao Zhang @*/
MatSeqAIJGetArrayWrite(Mat A,PetscScalar * array[])44345d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4435d71ae5a4SJacob Faibussowitsch {
4436d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4437d67d9f35SJunchao Zhang 
4438d67d9f35SJunchao Zhang   PetscFunctionBegin;
4439d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
44409566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4441d67d9f35SJunchao Zhang   } else {
4442d67d9f35SJunchao Zhang     *array = aij->a;
4443d67d9f35SJunchao Zhang   }
44449566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4446d67d9f35SJunchao Zhang }
4447d67d9f35SJunchao Zhang 
4448d67d9f35SJunchao Zhang /*@C
4449d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4450d67d9f35SJunchao Zhang 
44510ab4885dSBarry Smith   Not Collective; No Fortran Support
4452d67d9f35SJunchao Zhang 
4453d67d9f35SJunchao Zhang   Input Parameter:
4454fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4455d67d9f35SJunchao Zhang 
4456d67d9f35SJunchao Zhang   Output Parameter:
4457d67d9f35SJunchao Zhang . array - pointer to the data
4458d67d9f35SJunchao Zhang 
4459d67d9f35SJunchao Zhang   Level: intermediate
4460d67d9f35SJunchao Zhang 
44611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4462d67d9f35SJunchao Zhang @*/
MatSeqAIJRestoreArrayWrite(Mat A,PetscScalar * array[])44635d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4464d71ae5a4SJacob Faibussowitsch {
4465d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4466d67d9f35SJunchao Zhang 
4467d67d9f35SJunchao Zhang   PetscFunctionBegin;
4468d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
44699566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4470d67d9f35SJunchao Zhang   } else {
4471d67d9f35SJunchao Zhang     *array = NULL;
4472d67d9f35SJunchao Zhang   }
44733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44748f1ea47aSStefano Zampini }
44758f1ea47aSStefano Zampini 
44768f1ea47aSStefano Zampini /*@C
447711a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
44787ee59b9bSJunchao Zhang 
44790ab4885dSBarry Smith   Not Collective; No Fortran Support
44807ee59b9bSJunchao Zhang 
44817ee59b9bSJunchao Zhang   Input Parameter:
448211a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
44837ee59b9bSJunchao Zhang 
44847ee59b9bSJunchao Zhang   Output Parameters:
44857ee59b9bSJunchao Zhang + i     - row map array of the matrix
44867ee59b9bSJunchao Zhang . j     - column index array of the matrix
44877ee59b9bSJunchao Zhang . a     - data array of the matrix
4488fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
44897ee59b9bSJunchao Zhang 
4490fe59aa6dSJacob Faibussowitsch   Level: developer
44912ef1f0ffSBarry Smith 
44927ee59b9bSJunchao Zhang   Notes:
44932ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
44947ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
44957ee59b9bSJunchao Zhang 
44967ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
44972ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
44987ee59b9bSJunchao Zhang 
44991cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45007ee59b9bSJunchao Zhang @*/
MatSeqAIJGetCSRAndMemType(Mat mat,const PetscInt * i[],const PetscInt * j[],PetscScalar * a[],PetscMemType * mtype)45015d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4502d71ae5a4SJacob Faibussowitsch {
45037ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45047ee59b9bSJunchao Zhang 
45057ee59b9bSJunchao Zhang   PetscFunctionBegin;
45067ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45077ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45087ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45097ee59b9bSJunchao Zhang   } else {
45107ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45117ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45127ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45137ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45147ee59b9bSJunchao Zhang   }
45153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45167ee59b9bSJunchao Zhang }
45177ee59b9bSJunchao Zhang 
4518cc4c1da9SBarry Smith /*@
451921e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
452021e72a00SBarry Smith 
452121e72a00SBarry Smith   Not Collective
452221e72a00SBarry Smith 
452321e72a00SBarry Smith   Input Parameter:
4524fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
452521e72a00SBarry Smith 
452621e72a00SBarry Smith   Output Parameter:
452721e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
452821e72a00SBarry Smith 
452921e72a00SBarry Smith   Level: intermediate
453021e72a00SBarry Smith 
4531ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
453221e72a00SBarry Smith @*/
MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt * nz)4533d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4534d71ae5a4SJacob Faibussowitsch {
453521e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
453621e72a00SBarry Smith 
453721e72a00SBarry Smith   PetscFunctionBegin;
453821e72a00SBarry Smith   *nz = aij->rmax;
45393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
454021e72a00SBarry Smith }
454121e72a00SBarry Smith 
MatCOOStructDestroy_SeqAIJ(PetscCtxRt data)4542*2a8381b2SBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(PetscCtxRt data)
45432c4ab24aSJunchao Zhang {
4544*2a8381b2SBarry Smith   MatCOOStruct_SeqAIJ *coo = *(MatCOOStruct_SeqAIJ **)data;
45454d86920dSPierre Jolivet 
45462c4ab24aSJunchao Zhang   PetscFunctionBegin;
45472c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
45482c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
45492c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
45502c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
45512c4ab24aSJunchao Zhang }
45522c4ab24aSJunchao Zhang 
MatSetPreallocationCOO_SeqAIJ(Mat mat,PetscCount coo_n,PetscInt coo_i[],PetscInt coo_j[])4553d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4554d71ae5a4SJacob Faibussowitsch {
4555394ed5ebSJunchao Zhang   MPI_Comm             comm;
4556394ed5ebSJunchao Zhang   PetscInt            *i, *j;
45570d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4558394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4559394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4560394ed5ebSJunchao Zhang   PetscInt            *Aj;
4561394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4562f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4563cbc6b225SStefano Zampini   MatType              rtype;
4564394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
45652c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
45660d88f7f4SJunchao Zhang   PetscBool            isorted;
45679f0612e4SBarry Smith   PetscBool            hypre;
4568394ed5ebSJunchao Zhang 
4569394ed5ebSJunchao Zhang   PetscFunctionBegin;
45709566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
45719566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4572e8729f6fSJunchao Zhang   i = coo_i;
4573e8729f6fSJunchao Zhang   j = coo_j;
45749566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
45750d88f7f4SJunchao Zhang 
45760d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
45770d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
45780d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
45790d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4580394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
45810d88f7f4SJunchao Zhang     if (isorted) {
45820d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
45830d88f7f4SJunchao Zhang       else iprev = i[k];
45840d88f7f4SJunchao Zhang     }
4585394ed5ebSJunchao Zhang     perm[k] = k;
4586394ed5ebSJunchao Zhang   }
4587394ed5ebSJunchao Zhang 
45880d88f7f4SJunchao Zhang   /* Sort by row if not already */
45890d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
45902b35a777SBarry Smith   PetscCheck(coo_n == 0 || i[coo_n - 1] < M, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO row index %" PetscInt_FMT " is >= the matrix row size %" PetscInt_FMT, i[coo_n - 1], M);
4591651b1cf9SStefano Zampini 
4592651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4593651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
45949371c9d4SSatish Balay     if (i[k] >= 0) break;
4595394ed5ebSJunchao Zhang   nneg = k;
45969566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4597394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
459835cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4599394ed5ebSJunchao Zhang 
46009f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
46019f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
46029f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4603394ed5ebSJunchao Zhang 
460421fb621cSStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", ((PetscObject)mat)->name, &hypre));
4605651b1cf9SStefano Zampini 
4606394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
460735cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4608394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4609394ed5ebSJunchao Zhang   while (k < coo_n) {
46100d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
46110d88f7f4SJunchao Zhang     PetscInt  jprev;
46120d88f7f4SJunchao Zhang 
46130d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4614394ed5ebSJunchao Zhang     row             = i[k];
46150d88f7f4SJunchao Zhang     start           = k;
46160d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
46170d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
46180d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
46190d88f7f4SJunchao Zhang       if (strictly_sorted) {
46200d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
46210d88f7f4SJunchao Zhang         else jprev = j[k];
46220d88f7f4SJunchao Zhang       }
46230d88f7f4SJunchao Zhang       k++;
46240d88f7f4SJunchao Zhang     }
4625394ed5ebSJunchao Zhang     end = k;
46260d88f7f4SJunchao Zhang 
4627651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4628651b1cf9SStefano Zampini     if (hypre) {
46291690c2aeSBarry Smith       PetscInt  minj    = PETSC_INT_MAX;
4630651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
46310d88f7f4SJunchao Zhang 
46320d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
46330d88f7f4SJunchao Zhang         PetscCount tmp;
46340d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
46350d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
46361c265611SJunchao Zhang             j[p]        = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[])
46370d88f7f4SJunchao Zhang             j[start]    = row;
46380d88f7f4SJunchao Zhang             tmp         = perm[start];
46391c265611SJunchao Zhang             perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below
46400d88f7f4SJunchao Zhang             perm[p]     = tmp;
46410d88f7f4SJunchao Zhang             break;
46420d88f7f4SJunchao Zhang           }
46430d88f7f4SJunchao Zhang         }
46440d88f7f4SJunchao Zhang       } else {
4645651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4646651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4647651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4648651b1cf9SStefano Zampini         }
46490d88f7f4SJunchao Zhang 
4650651b1cf9SStefano Zampini         if (hasdiag) {
4651651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4652651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4653651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4654651b1cf9SStefano Zampini           }
4655651b1cf9SStefano Zampini         }
4656651b1cf9SStefano Zampini       }
46570d88f7f4SJunchao Zhang     }
46581c265611SJunchao Zhang     // sort by columns in a row. perm[] indicates their original order
46590d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
46608551dd9cSJunchao Zhang     PetscCheck(end == start || j[end - 1] < N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO column index %" PetscInt_FMT " is >= the matrix column size %" PetscInt_FMT, j[end - 1], N);
4661651b1cf9SStefano Zampini 
46620d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
46630d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
46640d88f7f4SJunchao Zhang         Aj[q]   = j[p];
46650d88f7f4SJunchao Zhang         jmap[q] = 1;
46660d88f7f4SJunchao Zhang       }
46676497c311SBarry Smith       PetscCall(PetscIntCast(end - start, Ai + row));
46680d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
46690d88f7f4SJunchao Zhang     } else {
4670394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4671394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4672651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4673394ed5ebSJunchao Zhang       Ai[row] = 1;
4674394ed5ebSJunchao Zhang       nnz++;
4675394ed5ebSJunchao Zhang 
4676394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4677394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4678394ed5ebSJunchao Zhang           q++;
4679394ed5ebSJunchao Zhang           jmap[q] = 1;
4680394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4681394ed5ebSJunchao Zhang           Ai[row]++;
4682394ed5ebSJunchao Zhang           nnz++;
4683394ed5ebSJunchao Zhang         } else {
4684394ed5ebSJunchao Zhang           jmap[q]++;
4685394ed5ebSJunchao Zhang         }
4686394ed5ebSJunchao Zhang       }
4687394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4688394ed5ebSJunchao Zhang     }
46890d88f7f4SJunchao Zhang   }
46900d88f7f4SJunchao Zhang 
4691394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4692394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
46930d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4694394ed5ebSJunchao Zhang   jmap[0] = 0;
4695394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
46960d88f7f4SJunchao Zhang 
46979f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4698394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4699394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4700394ed5ebSJunchao Zhang 
47019566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47029566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47039566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4704394ed5ebSJunchao Zhang     jmap = jmap_new;
4705394ed5ebSJunchao Zhang 
47069f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
47079566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47089f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4709394ed5ebSJunchao Zhang     Aj = Aj_new;
4710394ed5ebSJunchao Zhang   }
4711394ed5ebSJunchao Zhang 
4712394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4713394ed5ebSJunchao Zhang     PetscCount *perm_new;
4714cbc6b225SStefano Zampini 
47159566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47169566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47179566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4718394ed5ebSJunchao Zhang     perm = perm_new;
4719394ed5ebSJunchao Zhang   }
4720394ed5ebSJunchao Zhang 
47219566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
47229f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
47239f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
47249566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4725394ed5ebSJunchao Zhang 
4726394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
47272c4ab24aSJunchao Zhang 
47282c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
47292c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
47306497c311SBarry Smith   PetscCall(PetscIntCast(nnz, &coo->nz));
47312c4ab24aSJunchao Zhang   coo->n    = coo_n;
47322c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
47332c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
47342c4ab24aSJunchao Zhang   coo->perm = perm;
473503e76207SPierre Jolivet   PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
47363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4737394ed5ebSJunchao Zhang }
4738394ed5ebSJunchao Zhang 
MatSetValuesCOO_SeqAIJ(Mat A,const PetscScalar v[],InsertMode imode)4739d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4740d71ae5a4SJacob Faibussowitsch {
4741394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4742394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
47432c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4744394ed5ebSJunchao Zhang   PetscScalar         *Aa;
47452c4ab24aSJunchao Zhang   PetscContainer       container;
47462c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4747394ed5ebSJunchao Zhang 
4748394ed5ebSJunchao Zhang   PetscFunctionBegin;
47492c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
47502c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
4751*2a8381b2SBarry Smith   PetscCall(PetscContainerGetPointer(container, &coo));
47522c4ab24aSJunchao Zhang   perm = coo->perm;
47532c4ab24aSJunchao Zhang   jmap = coo->jmap;
47549566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4755394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4756b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4757b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4758b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4759394ed5ebSJunchao Zhang   }
47609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
47613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4762394ed5ebSJunchao Zhang }
4763394ed5ebSJunchao Zhang 
/* Prototypes of the conversions to the CUSPARSE, HIPSPARSE and Kokkos AIJ variants; each is declared only when the matching PETSC_HAVE_* macro is defined */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif
477302fe1965SBarry Smith 
MatCreate_SeqAIJ(Mat B)4774d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4775d71ae5a4SJacob Faibussowitsch {
4776273d9f13SBarry Smith   Mat_SeqAIJ *b;
477738baddfdSBarry Smith   PetscMPIInt size;
4778273d9f13SBarry Smith 
4779273d9f13SBarry Smith   PetscFunctionBegin;
47809566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
478108401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4782273d9f13SBarry Smith 
47834dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
47842205254eSKarl Rupp 
4785b0a32e0cSBarry Smith   B->data   = (void *)b;
4786aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4787071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
47882205254eSKarl Rupp 
4789f4259b30SLisandro Dalcin   b->row                = NULL;
4790f4259b30SLisandro Dalcin   b->col                = NULL;
4791f4259b30SLisandro Dalcin   b->icol               = NULL;
4792b810aeb4SBarry Smith   b->reallocs           = 0;
479336db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4794f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4795416022c9SBarry Smith   b->nonew              = 0;
4796f4259b30SLisandro Dalcin   b->diag               = NULL;
4797f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4798f4259b30SLisandro Dalcin   B->spptr              = NULL;
4799f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4800f4259b30SLisandro Dalcin   b->idiag              = NULL;
4801f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4802f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
480371f1c65dSBarry Smith   b->omega              = 1.0;
480471f1c65dSBarry Smith   b->fshift             = 0.0;
4805bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4806a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
480717ab2063SBarry Smith 
48089566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4809d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48119566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4812b3866ffcSBarry Smith #endif
48139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48149566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48159566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
48169566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
48179566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
48189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
48199566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
48209779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
48219566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4822191b95cbSRichard Tran Mills #endif
482334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48249566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
48259566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48269566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
482702fe1965SBarry Smith #endif
4828d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4829d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4830d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4831d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4832d5e393b6SSuyash Tandon #endif
48333d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
48353d0639e7SStefano Zampini #endif
48369566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4837af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
48389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4839af8000cdSHong Zhang #endif
4840d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
48419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4842d24d4204SJose E. Roman #endif
484363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
48449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
48459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
484663c07aadSStefano Zampini #endif
48479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
48489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
48499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
48509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
485114e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
48529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
48539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
4854674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ));
48559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
48569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
48579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
48589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
48599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
48619566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
48629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
48639566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
48649566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
48659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
48663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
486717ab2063SBarry Smith }
486817ab2063SBarry Smith 
4869b24902e0SBarry Smith /*
48703893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4871b24902e0SBarry Smith */
MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace)4872d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4873d71ae5a4SJacob Faibussowitsch {
48742a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4875071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
487617ab2063SBarry Smith 
48773a40ed3dSBarry Smith   PetscFunctionBegin;
4878aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4879273d9f13SBarry Smith 
4880d5f3da31SBarry Smith   C->factortype = A->factortype;
4881f4259b30SLisandro Dalcin   c->row        = NULL;
4882f4259b30SLisandro Dalcin   c->col        = NULL;
4883f4259b30SLisandro Dalcin   c->icol       = NULL;
48846ad4291fSHong Zhang   c->reallocs   = 0;
488569272f91SPierre Jolivet   C->assembled  = A->assembled;
488617ab2063SBarry Smith 
488769272f91SPierre Jolivet   if (A->preallocated) {
48889566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
48899566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4890eec197d1SBarry Smith 
489131fe6a7dSBarry Smith     if (!A->hash_active) {
48929566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
4893418fb43bSPierre Jolivet       PetscCall(PetscArraycpy(c->imax, a->imax, m));
48949566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
4895418fb43bSPierre Jolivet       PetscCall(PetscArraycpy(c->ilen, a->ilen, m));
489617ab2063SBarry Smith 
489717ab2063SBarry Smith       /* allocate the matrix space */
4898f77e22a1SHong Zhang       if (mallocmatspace) {
48999f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
49009f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
49019f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
49029566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
49039f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
49049f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
490517ab2063SBarry Smith         if (m > 0) {
49069566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4907be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49082e5835c6SStefano Zampini             const PetscScalar *aa;
49092e5835c6SStefano Zampini 
49109566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49119566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49129566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4913be6bf707SBarry Smith           } else {
49149566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
491517ab2063SBarry Smith           }
491608480c60SBarry Smith         }
4917f77e22a1SHong Zhang       }
491831fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
491931fe6a7dSBarry Smith     } else {
492031fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
492131fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
492231fe6a7dSBarry Smith     }
492317ab2063SBarry Smith 
49246ad4291fSHong Zhang     c->ignorezeroentries  = a->ignorezeroentries;
4925416022c9SBarry Smith     c->roworiented        = a->roworiented;
4926416022c9SBarry Smith     c->nonew              = a->nonew;
4927f4259b30SLisandro Dalcin     c->solve_work         = NULL;
4928f4259b30SLisandro Dalcin     c->saved_values       = NULL;
4929f4259b30SLisandro Dalcin     c->idiag              = NULL;
4930f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
4931a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
49326ad4291fSHong Zhang 
4933893ad86cSHong Zhang     c->rmax  = a->rmax;
4934416022c9SBarry Smith     c->nz    = a->nz;
49358ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
4936754ec7b1SSatish Balay 
49376ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
49386ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
4939cd6b891eSBarry Smith     if (a->compressedrow.use) {
49406ad4291fSHong Zhang       i = a->compressedrow.nrows;
49419566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
49429566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
49439566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
494427ea64f8SHong Zhang     } else {
494527ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
49460298fd71SBarry Smith       c->compressedrow.i      = NULL;
49470298fd71SBarry Smith       c->compressedrow.rindex = NULL;
49486ad4291fSHong Zhang     }
4949ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
4950e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
49514846f1f5SKris Buschelman 
49529566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
495369272f91SPierre Jolivet   }
49549566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
49553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
495617ab2063SBarry Smith }
495717ab2063SBarry Smith 
MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat * B)4958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
4959d71ae5a4SJacob Faibussowitsch {
4960b24902e0SBarry Smith   PetscFunctionBegin;
49619566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
49629566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
496348a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
49649566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
49659566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
49663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4967b24902e0SBarry Smith }
4968b24902e0SBarry Smith 
MatLoad_SeqAIJ(Mat newMat,PetscViewer viewer)4969d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
4970d71ae5a4SJacob Faibussowitsch {
497152f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
497252f91c60SVaclav Hapla 
497352f91c60SVaclav Hapla   PetscFunctionBegin;
497452f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
497552f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
4976c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
49779566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
49789566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
49799566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
498052f91c60SVaclav Hapla   if (isbinary) {
49819566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
498252f91c60SVaclav Hapla   } else if (ishdf5) {
498352f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
49849566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
498552f91c60SVaclav Hapla #else
498652f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
498752f91c60SVaclav Hapla #endif
498852f91c60SVaclav Hapla   } else {
498998921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
499052f91c60SVaclav Hapla   }
49913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
499252f91c60SVaclav Hapla }
499352f91c60SVaclav Hapla 
MatLoad_SeqAIJ_Binary(Mat mat,PetscViewer viewer)4994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
4995d71ae5a4SJacob Faibussowitsch {
49963ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
49973ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
4998fbdbba38SShri Abhyankar 
4999fbdbba38SShri Abhyankar   PetscFunctionBegin;
50009566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5001bbead8a2SBarry Smith 
50023ea6fe3dSLisandro Dalcin   /* read in matrix header */
50039566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
500408401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50059371c9d4SSatish Balay   M  = header[1];
50069371c9d4SSatish Balay   N  = header[2];
50079371c9d4SSatish Balay   nz = header[3];
500808401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
500908401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
501008401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5011fbdbba38SShri Abhyankar 
50123ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
50139566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
50143ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
50153ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
50163ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
50173ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
50183ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
50199566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
50209566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
50213ea6fe3dSLisandro Dalcin 
50223ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
50239566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5024aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50253ea6fe3dSLisandro Dalcin 
5026fbdbba38SShri Abhyankar   /* read in row lengths */
50279566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
50289566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
50293ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
50309371c9d4SSatish Balay   sum = 0;
50319371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
503208401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
50333ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
50349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
50359566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5036aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50373ea6fe3dSLisandro Dalcin   /* store row lengths */
50389566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
50399566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5040fbdbba38SShri Abhyankar 
50413ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
50429371c9d4SSatish Balay   a->i[0] = 0;
50439371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
50443ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
50459566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
50463ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
50479566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5048fbdbba38SShri Abhyankar 
50499566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
50509566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
50513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5052fbdbba38SShri Abhyankar }
5053fbdbba38SShri Abhyankar 
MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg)5054d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5055d71ae5a4SJacob Faibussowitsch {
50567264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5057fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
50587264ac53SSatish Balay 
50593a40ed3dSBarry Smith   PetscFunctionBegin;
5060bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5061d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5062ca44d042SBarry Smith     *flg = PETSC_FALSE;
50633ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5064bcd2baecSBarry Smith   }
50657264ac53SSatish Balay 
50667264ac53SSatish Balay   /* if the a->i are the same */
50679566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
50683ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
50697264ac53SSatish Balay 
50707264ac53SSatish Balay   /* if a->j are the same */
50719566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
50723ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5073bcd2baecSBarry Smith 
50749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
50759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5076bcd2baecSBarry Smith   /* if a->a are the same */
50779566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
50789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
50799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
50803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
50817264ac53SSatish Balay }
508236db0b34SBarry Smith 
508305869f15SSatish Balay /*@
508411a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
508536db0b34SBarry Smith   provided by the user.
508636db0b34SBarry Smith 
5087d083f849SBarry Smith   Collective
508836db0b34SBarry Smith 
508936db0b34SBarry Smith   Input Parameters:
509036db0b34SBarry Smith + comm - must be an MPI communicator of size 1
509136db0b34SBarry Smith . m    - number of rows
509236db0b34SBarry Smith . n    - number of columns
5093483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
509436db0b34SBarry Smith . j    - column indices
509536db0b34SBarry Smith - a    - matrix values
509636db0b34SBarry Smith 
509736db0b34SBarry Smith   Output Parameter:
509836db0b34SBarry Smith . mat - the matrix
509936db0b34SBarry Smith 
510036db0b34SBarry Smith   Level: intermediate
510136db0b34SBarry Smith 
510236db0b34SBarry Smith   Notes:
51032ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5104292fb18eSBarry Smith   once the matrix is destroyed and not before
510536db0b34SBarry Smith 
510636db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
510736db0b34SBarry Smith 
51082ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
510936db0b34SBarry Smith 
5110a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5111a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
51128eef79e4SBarry Smith   as shown
51132ef1f0ffSBarry Smith .vb
51142ef1f0ffSBarry Smith         1 0 0
51152ef1f0ffSBarry Smith         2 0 3
51162ef1f0ffSBarry Smith         4 5 6
5117a4552177SSatish Balay 
51182ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
51192ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
51202ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
51212ef1f0ffSBarry Smith .ve
5122a4552177SSatish Balay 
51231cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
512436db0b34SBarry Smith @*/
MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat * mat)5125d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5126d71ae5a4SJacob Faibussowitsch {
5127cbcfb4deSHong Zhang   PetscInt    ii;
512836db0b34SBarry Smith   Mat_SeqAIJ *aij;
5129cbcfb4deSHong Zhang   PetscInt    jj;
513036db0b34SBarry Smith 
513136db0b34SBarry Smith   PetscFunctionBegin;
5132aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
51339566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
51349566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
51359566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
51369566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
51379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5138ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
51399566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
51409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5141ab93d7beSBarry Smith 
514236db0b34SBarry Smith   aij->i       = i;
514336db0b34SBarry Smith   aij->j       = j;
514436db0b34SBarry Smith   aij->a       = a;
514536db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5146e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5147e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
514836db0b34SBarry Smith 
5149cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
515036db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
515176bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5152aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
51539985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
515408401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
515508401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
51569985e31cSBarry Smith       }
515736db0b34SBarry Smith     }
515876bd3646SJed Brown   }
515976bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
516036db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
516108401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5162da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
516336db0b34SBarry Smith     }
516476bd3646SJed Brown   }
516536db0b34SBarry Smith 
51669566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
51679566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
51683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
516936db0b34SBarry Smith }
5170cbc6b225SStefano Zampini 
5171f62e3866SBarry Smith /*@
517211a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
51738a0b0e6bSVictor Minden   provided by the user.
51748a0b0e6bSVictor Minden 
5175d083f849SBarry Smith   Collective
51768a0b0e6bSVictor Minden 
51778a0b0e6bSVictor Minden   Input Parameters:
51788a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
51798a0b0e6bSVictor Minden . m    - number of rows
51808a0b0e6bSVictor Minden . n    - number of columns
51818a0b0e6bSVictor Minden . i    - row indices
51828a0b0e6bSVictor Minden . j    - column indices
51831230e6d1SVictor Minden . a    - matrix values
51841230e6d1SVictor Minden . nz   - number of nonzeros
51852ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
51868a0b0e6bSVictor Minden 
51878a0b0e6bSVictor Minden   Output Parameter:
51888a0b0e6bSVictor Minden . mat - the matrix
51898a0b0e6bSVictor Minden 
51908a0b0e6bSVictor Minden   Level: intermediate
51918a0b0e6bSVictor Minden 
5192f62e3866SBarry Smith   Example:
5193f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
51949e99939fSJunchao Zhang .vb
51958a0b0e6bSVictor Minden         1 0 0
51968a0b0e6bSVictor Minden         2 0 3
51978a0b0e6bSVictor Minden         4 5 6
51988a0b0e6bSVictor Minden 
51998a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
52008a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
52018a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
52029e99939fSJunchao Zhang .ve
5203fe59aa6dSJacob Faibussowitsch 
52042ef1f0ffSBarry Smith   Note:
5205d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5206d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
52078a0b0e6bSVictor Minden 
52081cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
52098a0b0e6bSVictor Minden @*/
MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat * mat,PetscCount nz,PetscBool idx)5210ce78bad3SBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscCount nz, PetscBool idx)
5211d71ae5a4SJacob Faibussowitsch {
5212d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
52138a0b0e6bSVictor Minden 
52148a0b0e6bSVictor Minden   PetscFunctionBegin;
52159566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5216ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
52179566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52189566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52199566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
52211230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
52221230e6d1SVictor Minden     if (idx) {
52231230e6d1SVictor Minden       row = i[ii] - 1;
52241230e6d1SVictor Minden       col = j[ii] - 1;
52251230e6d1SVictor Minden     } else {
52261230e6d1SVictor Minden       row = i[ii];
52271230e6d1SVictor Minden       col = j[ii];
52288a0b0e6bSVictor Minden     }
52299566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
52308a0b0e6bSVictor Minden   }
52319566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52329566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52339566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
52343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52358a0b0e6bSVictor Minden }
523636db0b34SBarry Smith 
MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat * outmat)5237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5238d71ae5a4SJacob Faibussowitsch {
52399c8f2541SHong Zhang   PetscFunctionBegin;
52409566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
52413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52429c8f2541SHong Zhang }
52439c8f2541SHong Zhang 
524481824310SBarry Smith /*
524553dd7562SDmitry Karpeev  Permute B into C's *local* index space using rowemb,colemb.
524653dd7562SDmitry Karpeev  The embeddings are supposed to be injections and the above implies that the range of rowemb is a subset
524753dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
524853dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to B.
524953dd7562SDmitry Karpeev  */
MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B)5250d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5251d71ae5a4SJacob Faibussowitsch {
525253dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
525353dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
525453dd7562SDmitry Karpeev   PetscBool       seqaij;
525553dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
525653dd7562SDmitry Karpeev   PetscScalar     v;
525753dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
525853dd7562SDmitry Karpeev 
525953dd7562SDmitry Karpeev   PetscFunctionBegin;
52603ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
526153dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
52629566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
526328b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
526453dd7562SDmitry Karpeev   if (rowemb) {
52659566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
526608401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
526753dd7562SDmitry Karpeev   } else {
526808401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
526953dd7562SDmitry Karpeev   }
527053dd7562SDmitry Karpeev   if (colemb) {
52719566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
527208401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
527353dd7562SDmitry Karpeev   } else {
527408401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
527553dd7562SDmitry Karpeev   }
527653dd7562SDmitry Karpeev 
5277f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
527853dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
52799566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5280ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
52819566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
52829566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
528353dd7562SDmitry Karpeev   }
528448a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
528553dd7562SDmitry Karpeev   count      = 0;
528653dd7562SDmitry Karpeev   rowindices = NULL;
528753dd7562SDmitry Karpeev   colindices = NULL;
528848a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
528948a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
529053dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
529153dd7562SDmitry Karpeev     PetscInt row;
529253dd7562SDmitry Karpeev     row = i;
529353dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
529453dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
529553dd7562SDmitry Karpeev       PetscInt col;
529653dd7562SDmitry Karpeev       col = Baij->j[count];
529753dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
529853dd7562SDmitry Karpeev       v = Baij->a[count];
52999566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
530053dd7562SDmitry Karpeev       ++count;
530153dd7562SDmitry Karpeev     }
530253dd7562SDmitry Karpeev   }
530353dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
530453dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
530553dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
530653dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
530753dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
53083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
530953dd7562SDmitry Karpeev }
531053dd7562SDmitry Karpeev 
MatEliminateZeros_SeqAIJ(Mat A,PetscBool keep)531158c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5312dec0b466SHong Zhang {
5313dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5314dec0b466SHong Zhang   MatScalar  *aa = a->a;
5315dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5316dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5317dec0b466SHong Zhang 
5318dec0b466SHong Zhang   PetscFunctionBegin;
5319dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5320dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5321dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5322dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5323dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
532458c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5325dec0b466SHong Zhang       else {
5326dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5327dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5328dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5329dec0b466SHong Zhang       }
5330dec0b466SHong Zhang     }
5331dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5332dec0b466SHong Zhang     fshift_prev = fshift;
5333dec0b466SHong Zhang     /* reset ilen and imax for each row */
5334dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5335dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5336dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5337dec0b466SHong Zhang   }
5338312eded4SPierre Jolivet   if (fshift) {
5339dec0b466SHong Zhang     if (m) {
5340dec0b466SHong Zhang       ai[m] -= fshift;
5341dec0b466SHong Zhang       a->nz = ai[m];
5342dec0b466SHong Zhang     }
5343dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5344312eded4SPierre Jolivet     A->nonzerostate++;
5345dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5346dec0b466SHong Zhang     a->rmax = rmax;
5347dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5348dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5349dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5350312eded4SPierre Jolivet   }
53513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5352dec0b466SHong Zhang }
5353dec0b466SHong Zhang 
/* Registry of SeqAIJ subtype conversion routines keyed by type name: filled by MatSeqAIJRegister(),
   searched by MatSeqAIJSetType() and offered as the choices of the -mat_seqaij_type option */
PetscFunctionList MatSeqAIJList = NULL;
53554099cc6bSBarry Smith 
5356cc4c1da9SBarry Smith /*@
535711a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
53584099cc6bSBarry Smith 
5359c3339decSBarry Smith   Collective
53604099cc6bSBarry Smith 
53614099cc6bSBarry Smith   Input Parameters:
53624099cc6bSBarry Smith + mat    - the matrix object
53634099cc6bSBarry Smith - matype - matrix type
53644099cc6bSBarry Smith 
53654099cc6bSBarry Smith   Options Database Key:
53664e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
53674099cc6bSBarry Smith 
53684099cc6bSBarry Smith   Level: intermediate
53694099cc6bSBarry Smith 
5370fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
53714099cc6bSBarry Smith @*/
MatSeqAIJSetType(Mat mat,MatType matype)5372d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5373d71ae5a4SJacob Faibussowitsch {
53744099cc6bSBarry Smith   PetscBool sametype;
53755f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
53764099cc6bSBarry Smith 
53774099cc6bSBarry Smith   PetscFunctionBegin;
53784099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
53799566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
53803ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
53814099cc6bSBarry Smith 
53829566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
53836adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
53849566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
53853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53864099cc6bSBarry Smith }
53874099cc6bSBarry Smith 
/*@C
  MatSeqAIJRegister - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices

  Not Collective, No Fortran Support

  Input Parameters:
+ sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
- function - routine to convert to subtype

  Level: advanced

  Notes:
  `MatSeqAIJRegister()` may be called multiple times to add several user-defined matrix subtypes.

  The registered subtype can then be selected with `MatSeqAIJSetType()` or at runtime via the option
.vb
  -mat_seqaij_type my_mat
.ve

.seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
@*/
PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
{
  PetscFunctionBegin;
  PetscCall(MatInitializePackage());
  /* store the converter under sname in the file-level registry MatSeqAIJList */
  PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
  PetscFunctionReturn(PETSC_SUCCESS);
}
54164099cc6bSBarry Smith 
/* Set by MatSeqAIJRegisterAll() on its first call so that later calls return without registering again */
PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
54184099cc6bSBarry Smith 
54194099cc6bSBarry Smith /*@C
542011a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
54214099cc6bSBarry Smith 
54224099cc6bSBarry Smith   Not Collective
54234099cc6bSBarry Smith 
54244099cc6bSBarry Smith   Level: advanced
54254099cc6bSBarry Smith 
54262ef1f0ffSBarry Smith   Note:
54272ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
54282ef1f0ffSBarry Smith 
54291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
54304099cc6bSBarry Smith @*/
MatSeqAIJRegisterAll(void)5431d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5432d71ae5a4SJacob Faibussowitsch {
54334099cc6bSBarry Smith   PetscFunctionBegin;
54343ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
54354099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
54364099cc6bSBarry Smith 
54379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
54389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
54399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
54409779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
54419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5442485f9817SRichard Tran Mills #endif
54435063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
54449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
54455063d097SStefano Zampini #endif
5446d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5447d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5448d5e393b6SSuyash Tandon #endif
54495063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
54509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
54515063d097SStefano Zampini #endif
54524099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
54539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
54544099cc6bSBarry Smith #endif
54553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54564099cc6bSBarry Smith }
545753dd7562SDmitry Karpeev 
545853dd7562SDmitry Karpeev /*
545981824310SBarry Smith     Special version for direct calls from Fortran
546081824310SBarry Smith */
546181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
546281824310SBarry Smith   #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
546381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
546481824310SBarry Smith   #define matsetvaluesseqaij_ matsetvaluesseqaij
546581824310SBarry Smith #endif
546681824310SBarry Smith 
546781824310SBarry Smith /* Change these macros so can be used in void function */
546898921bdaSJacob Faibussowitsch 
546998921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */
54709566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */
54719566063dSJacob Faibussowitsch #undef PetscCall
54729371c9d4SSatish Balay #define PetscCall(...) \
54739371c9d4SSatish Balay   do { \
54745f80ce2aSJacob Faibussowitsch     PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
547598921bdaSJacob Faibussowitsch     if (PetscUnlikely(ierr_msv_mpiaij)) { \
547698921bdaSJacob Faibussowitsch       *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
547798921bdaSJacob Faibussowitsch       return; \
547898921bdaSJacob Faibussowitsch     } \
547998921bdaSJacob Faibussowitsch   } while (0)
548098921bdaSJacob Faibussowitsch 
548198921bdaSJacob Faibussowitsch #undef SETERRQ
54829371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \
54839371c9d4SSatish Balay   do { \
548498921bdaSJacob Faibussowitsch     *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
548598921bdaSJacob Faibussowitsch     return; \
548698921bdaSJacob Faibussowitsch   } while (0)
548781824310SBarry Smith 
matsetvaluesseqaij_(Mat * AA,PetscInt * mm,const PetscInt im[],PetscInt * nn,const PetscInt in[],const PetscScalar v[],InsertMode * isis,PetscErrorCode * _ierr)5488d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5489d71ae5a4SJacob Faibussowitsch {
549081824310SBarry Smith   Mat         A = *AA;
549181824310SBarry Smith   PetscInt    m = *mm, n = *nn;
549281824310SBarry Smith   InsertMode  is = *isis;
549381824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
549481824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
549581824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
549681824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
549754f21887SBarry Smith   MatScalar  *ap, value, *aa;
5498ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5499ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
550081824310SBarry Smith 
550181824310SBarry Smith   PetscFunctionBegin;
55024994cf47SJed Brown   MatCheckPreallocated(A, 1);
550381824310SBarry Smith   imax  = a->imax;
550481824310SBarry Smith   ai    = a->i;
550581824310SBarry Smith   ailen = a->ilen;
550681824310SBarry Smith   aj    = a->j;
550781824310SBarry Smith   aa    = a->a;
550881824310SBarry Smith 
550981824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
551081824310SBarry Smith     row = im[k];
551181824310SBarry Smith     if (row < 0) continue;
55125f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
55139371c9d4SSatish Balay     rp   = aj + ai[row];
55149371c9d4SSatish Balay     ap   = aa + ai[row];
55159371c9d4SSatish Balay     rmax = imax[row];
55169371c9d4SSatish Balay     nrow = ailen[row];
551781824310SBarry Smith     low  = 0;
551881824310SBarry Smith     high = nrow;
551981824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
552081824310SBarry Smith       if (in[l] < 0) continue;
55215f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
552281824310SBarry Smith       col = in[l];
55232205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
55242205254eSKarl Rupp       else value = v[k + l * m];
55252205254eSKarl Rupp 
552681824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
552781824310SBarry Smith 
55282205254eSKarl Rupp       if (col <= lastcol) low = 0;
55292205254eSKarl Rupp       else high = nrow;
553081824310SBarry Smith       lastcol = col;
553181824310SBarry Smith       while (high - low > 5) {
553281824310SBarry Smith         t = (low + high) / 2;
553381824310SBarry Smith         if (rp[t] > col) high = t;
553481824310SBarry Smith         else low = t;
553581824310SBarry Smith       }
553681824310SBarry Smith       for (i = low; i < high; i++) {
553781824310SBarry Smith         if (rp[i] > col) break;
553881824310SBarry Smith         if (rp[i] == col) {
553981824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
554081824310SBarry Smith           else ap[i] = value;
554181824310SBarry Smith           goto noinsert;
554281824310SBarry Smith         }
554381824310SBarry Smith       }
554481824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
554581824310SBarry Smith       if (nonew == 1) goto noinsert;
55465f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5547fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
55489371c9d4SSatish Balay       N = nrow++ - 1;
55499371c9d4SSatish Balay       a->nz++;
55509371c9d4SSatish Balay       high++;
555181824310SBarry Smith       /* shift up all the later entries in this row */
555281824310SBarry Smith       for (ii = N; ii >= i; ii--) {
555381824310SBarry Smith         rp[ii + 1] = rp[ii];
555481824310SBarry Smith         ap[ii + 1] = ap[ii];
555581824310SBarry Smith       }
555681824310SBarry Smith       rp[i] = col;
555781824310SBarry Smith       ap[i] = value;
555881824310SBarry Smith     noinsert:;
555981824310SBarry Smith       low = i + 1;
556081824310SBarry Smith     }
556181824310SBarry Smith     ailen[row] = nrow;
556281824310SBarry Smith   }
556381824310SBarry Smith   PetscFunctionReturnVoid();
556481824310SBarry Smith }
556598921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
556698921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
556798921bdaSJacob Faibussowitsch  * original definitions */
55689566063dSJacob Faibussowitsch #undef PetscCall
556998921bdaSJacob Faibussowitsch #undef SETERRQ
5570