/*
    Creates a hypre IJMatrix from a PETSc matrix
*/
4225daaf8SStefano Zampini
5c6698e78SStefano Zampini #include <petscpkg_version.h>
639accc25SStefano Zampini #include <petsc/private/petschypre.h>
7dd9c0a25Sstefano_zampini #include <petscmathypre.h>
863c07aadSStefano Zampini #include <petsc/private/matimpl.h>
9a4af0ceeSJacob Faibussowitsch #include <petsc/private/deviceimpl.h>
1063c07aadSStefano Zampini #include <../src/mat/impls/hypre/mhypre.h>
1163c07aadSStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h>
1258968eb6SStefano Zampini #include <../src/vec/vec/impls/hypre/vhyp.h>
1358968eb6SStefano Zampini #include <HYPRE.h>
14c1a070e6SStefano Zampini #include <HYPRE_utilities.h>
15cd8bc7baSStefano Zampini #include <_hypre_parcsr_ls.h>
1668ec7858SStefano Zampini #include <_hypre_sstruct_ls.h>
1763c07aadSStefano Zampini
180e6427aaSSatish Balay #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
190e6427aaSSatish Balay #define hypre_ParCSRMatrixClone(A, B) hypre_ParCSRMatrixCompleteClone(A)
200e6427aaSSatish Balay #endif
210e6427aaSSatish Balay
22bb16242fSVictor A. P. Magri #if PETSC_PKG_HYPRE_VERSION_GE(2, 15, 0)
23bb16242fSVictor A. P. Magri #define HYPRE_AssumedPartitionCheck() 1
24bb16242fSVictor A. P. Magri #endif
25bb16242fSVictor A. P. Magri
2663c07aadSStefano Zampini static PetscErrorCode MatHYPRE_CreateFromMat(Mat, Mat_HYPRE *);
2763c07aadSStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat, Mat, HYPRE_IJMatrix);
28b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat, HYPRE_IJMatrix);
29b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat, HYPRE_IJMatrix);
3039accc25SStefano Zampini static PetscErrorCode MatHYPRE_MultKernel_Private(Mat, HYPRE_Complex, Vec, HYPRE_Complex, Vec, PetscBool);
316ea7df73SStefano Zampini static PetscErrorCode MatSetValues_HYPRE(Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[], const PetscScalar[], InsertMode ins);
3263c07aadSStefano Zampini
MatHYPRE_IJMatrixPreallocate(Mat A_d,Mat A_o,HYPRE_IJMatrix ij)33d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_IJMatrixPreallocate(Mat A_d, Mat A_o, HYPRE_IJMatrix ij)
34d71ae5a4SJacob Faibussowitsch {
3563c07aadSStefano Zampini PetscInt i, n_d, n_o;
3663c07aadSStefano Zampini const PetscInt *ia_d, *ia_o;
3763c07aadSStefano Zampini PetscBool done_d = PETSC_FALSE, done_o = PETSC_FALSE;
382cf14000SStefano Zampini HYPRE_Int *nnz_d = NULL, *nnz_o = NULL;
3963c07aadSStefano Zampini
4063c07aadSStefano Zampini PetscFunctionBegin;
4163c07aadSStefano Zampini if (A_d) { /* determine number of nonzero entries in local diagonal part */
429566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, &n_d, &ia_d, NULL, &done_d));
4363c07aadSStefano Zampini if (done_d) {
449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_d, &nnz_d));
45f2f41e48SZach Atkins for (i = 0; i < n_d; i++) nnz_d[i] = (HYPRE_Int)(ia_d[i + 1] - ia_d[i]);
4663c07aadSStefano Zampini }
479566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_d, 0, PETSC_FALSE, PETSC_FALSE, NULL, &ia_d, NULL, &done_d));
4863c07aadSStefano Zampini }
4963c07aadSStefano Zampini if (A_o) { /* determine number of nonzero entries in local off-diagonal part */
509566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
5163c07aadSStefano Zampini if (done_o) {
529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n_o, &nnz_o));
53f2f41e48SZach Atkins for (i = 0; i < n_o; i++) nnz_o[i] = (HYPRE_Int)(ia_o[i + 1] - ia_o[i]);
5463c07aadSStefano Zampini }
559566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(A_o, 0, PETSC_FALSE, PETSC_FALSE, &n_o, &ia_o, NULL, &done_o));
5663c07aadSStefano Zampini }
5763c07aadSStefano Zampini if (done_d) { /* set number of nonzeros in HYPRE IJ matrix */
5863c07aadSStefano Zampini if (!done_o) { /* only diagonal part */
599566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n_d, &nnz_o));
6063c07aadSStefano Zampini }
61c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
62c6698e78SStefano Zampini { /* If we don't do this, the columns of the matrix will be all zeros! */
63c6698e78SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix;
64c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
65c6698e78SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix);
66c6698e78SStefano Zampini hypre_IJMatrixTranslator(ij) = NULL;
67a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o));
6822235d61SPierre Jolivet /* it seems they partially fixed it in 2.19.0 */
6922235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
70c6698e78SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
71c6698e78SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1;
7222235d61SPierre Jolivet #endif
73c6698e78SStefano Zampini }
74c6698e78SStefano Zampini #else
75a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(ij, nnz_d, nnz_o));
76c6698e78SStefano Zampini #endif
779566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_d));
789566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz_o));
7963c07aadSStefano Zampini }
803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
8163c07aadSStefano Zampini }
8263c07aadSStefano Zampini
MatHYPRE_CreateFromMat(Mat A,Mat_HYPRE * hA)83d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_CreateFromMat(Mat A, Mat_HYPRE *hA)
84d71ae5a4SJacob Faibussowitsch {
85f2f41e48SZach Atkins HYPRE_Int rstart, rend, cstart, cend;
8663c07aadSStefano Zampini
8763c07aadSStefano Zampini PetscFunctionBegin;
889566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap));
899566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap));
90f2f41e48SZach Atkins rstart = (HYPRE_Int)A->rmap->rstart;
91f2f41e48SZach Atkins rend = (HYPRE_Int)A->rmap->rend;
92f2f41e48SZach Atkins cstart = (HYPRE_Int)A->cmap->rstart;
93f2f41e48SZach Atkins cend = (HYPRE_Int)A->cmap->rend;
94*5482091fSJunchao Zhang PetscCall(PetscHYPREInitialize());
95651b1cf9SStefano Zampini if (hA->ij) {
96651b1cf9SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
97a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij));
98651b1cf9SStefano Zampini }
99a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend - 1, cstart, cend - 1, &hA->ij));
100a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
10163c07aadSStefano Zampini {
10263c07aadSStefano Zampini PetscBool same;
10363c07aadSStefano Zampini Mat A_d, A_o;
10463c07aadSStefano Zampini const PetscInt *colmap;
1059566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &same));
10663c07aadSStefano Zampini if (same) {
1079566063dSJacob Faibussowitsch PetscCall(MatMPIAIJGetSeqAIJ(A, &A_d, &A_o, &colmap));
1089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
1093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
11063c07aadSStefano Zampini }
1119566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIBAIJ, &same));
11263c07aadSStefano Zampini if (same) {
1139566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJGetSeqBAIJ(A, &A_d, &A_o, &colmap));
1149566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A_d, A_o, hA->ij));
1153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
11663c07aadSStefano Zampini }
1179566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &same));
11863c07aadSStefano Zampini if (same) {
1199566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
1203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12163c07aadSStefano Zampini }
1229566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQBAIJ, &same));
12363c07aadSStefano Zampini if (same) {
1249566063dSJacob Faibussowitsch PetscCall(MatHYPRE_IJMatrixPreallocate(A, NULL, hA->ij));
1253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12663c07aadSStefano Zampini }
12763c07aadSStefano Zampini }
1283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12963c07aadSStefano Zampini }
13063c07aadSStefano Zampini
MatHYPRE_IJMatrixCopyIJ(Mat A,HYPRE_IJMatrix ij)131b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ(Mat A, HYPRE_IJMatrix ij)
132d71ae5a4SJacob Faibussowitsch {
13363c07aadSStefano Zampini PetscBool flg;
13463c07aadSStefano Zampini
13563c07aadSStefano Zampini PetscFunctionBegin;
1366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
137a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(ij));
1386ea7df73SStefano Zampini #else
139a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(ij, HYPRE_MEMORY_HOST));
1406ea7df73SStefano Zampini #endif
1419566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &flg));
142b73e3080SStefano Zampini if (flg) {
143b73e3080SStefano Zampini PetscCall(MatHYPRE_IJMatrixCopyIJ_MPIAIJ(A, ij));
1443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
14563c07aadSStefano Zampini }
1469566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &flg));
14763c07aadSStefano Zampini if (flg) {
148b73e3080SStefano Zampini PetscCall(MatHYPRE_IJMatrixCopyIJ_SeqAIJ(A, ij));
1493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
15063c07aadSStefano Zampini }
151b73e3080SStefano Zampini PetscCheck(PETSC_FALSE, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "No support for matrix type %s", ((PetscObject)A)->type_name);
15287ef5fa6SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS);
15363c07aadSStefano Zampini }
15463c07aadSStefano Zampini
MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat A,HYPRE_IJMatrix ij)155b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_SeqAIJ(Mat A, HYPRE_IJMatrix ij)
156d71ae5a4SJacob Faibussowitsch {
15763c07aadSStefano Zampini Mat_SeqAIJ *pdiag = (Mat_SeqAIJ *)A->data;
15858968eb6SStefano Zampini HYPRE_Int type;
15963c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix;
16063c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix;
16163c07aadSStefano Zampini hypre_CSRMatrix *hdiag;
1622cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
16363c07aadSStefano Zampini
16463c07aadSStefano Zampini PetscFunctionBegin;
165a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type));
16608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
167a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix));
16863c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix);
16963c07aadSStefano Zampini /*
17063c07aadSStefano Zampini this is the Hack part where we monkey directly with the hypre datastructures
17163c07aadSStefano Zampini */
1722cf14000SStefano Zampini if (sameint) {
1739566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, A->rmap->n + 1));
1749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->j, pdiag->j, pdiag->nz));
1752cf14000SStefano Zampini } else {
1762cf14000SStefano Zampini PetscInt i;
1772cf14000SStefano Zampini
1782cf14000SStefano Zampini for (i = 0; i < A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
1792cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hdiag->j[i] = (HYPRE_Int)pdiag->j[i];
1802cf14000SStefano Zampini }
1816ea7df73SStefano Zampini
182ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
18363c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
1843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
18563c07aadSStefano Zampini }
18663c07aadSStefano Zampini
MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat A,HYPRE_IJMatrix ij)187b73e3080SStefano Zampini static PetscErrorCode MatHYPRE_IJMatrixCopyIJ_MPIAIJ(Mat A, HYPRE_IJMatrix ij)
188d71ae5a4SJacob Faibussowitsch {
18963c07aadSStefano Zampini Mat_MPIAIJ *pA = (Mat_MPIAIJ *)A->data;
19063c07aadSStefano Zampini Mat_SeqAIJ *pdiag, *poffd;
19163c07aadSStefano Zampini PetscInt i, *garray = pA->garray, *jj, cstart, *pjj;
1922cf14000SStefano Zampini HYPRE_Int *hjj, type;
19363c07aadSStefano Zampini hypre_ParCSRMatrix *par_matrix;
19463c07aadSStefano Zampini hypre_AuxParCSRMatrix *aux_matrix;
19563c07aadSStefano Zampini hypre_CSRMatrix *hdiag, *hoffd;
1962cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
19763c07aadSStefano Zampini
19863c07aadSStefano Zampini PetscFunctionBegin;
19963c07aadSStefano Zampini pdiag = (Mat_SeqAIJ *)pA->A->data;
20063c07aadSStefano Zampini poffd = (Mat_SeqAIJ *)pA->B->data;
201da81f932SPierre Jolivet /* cstart is only valid for square MPIAIJ laid out in the usual way */
2029566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &cstart, NULL));
20363c07aadSStefano Zampini
204a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(ij, &type));
20508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
206a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(ij, (void **)&par_matrix));
20763c07aadSStefano Zampini hdiag = hypre_ParCSRMatrixDiag(par_matrix);
20863c07aadSStefano Zampini hoffd = hypre_ParCSRMatrixOffd(par_matrix);
20963c07aadSStefano Zampini
2102cf14000SStefano Zampini if (sameint) {
2119566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hdiag->i, pdiag->i, pA->A->rmap->n + 1));
2122cf14000SStefano Zampini } else {
213f4f49eeaSPierre Jolivet for (i = 0; i < pA->A->rmap->n + 1; i++) hdiag->i[i] = (HYPRE_Int)pdiag->i[i];
2142cf14000SStefano Zampini }
215b73e3080SStefano Zampini
2162cf14000SStefano Zampini hjj = hdiag->j;
2172cf14000SStefano Zampini pjj = pdiag->j;
218c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
219f2f41e48SZach Atkins for (i = 0; i < pdiag->nz; i++) hjj[i] = (HYPRE_Int)pjj[i];
220c6698e78SStefano Zampini #else
2212cf14000SStefano Zampini for (i = 0; i < pdiag->nz; i++) hjj[i] = cstart + pjj[i];
222c6698e78SStefano Zampini #endif
2232cf14000SStefano Zampini if (sameint) {
2249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hoffd->i, poffd->i, pA->A->rmap->n + 1));
2252cf14000SStefano Zampini } else {
226f4f49eeaSPierre Jolivet for (i = 0; i < pA->A->rmap->n + 1; i++) hoffd->i[i] = (HYPRE_Int)poffd->i[i];
2272cf14000SStefano Zampini }
2282cf14000SStefano Zampini
22906977982Sstefanozampini jj = (PetscInt *)hoffd->j;
230c6698e78SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 16, 0)
231a333fa2bSZach Atkins PetscCallHYPRE(hypre_CSRMatrixBigInitialize(hoffd));
232c6698e78SStefano Zampini jj = (PetscInt *)hoffd->big_j;
233c6698e78SStefano Zampini #endif
2342cf14000SStefano Zampini pjj = poffd->j;
23563c07aadSStefano Zampini for (i = 0; i < poffd->nz; i++) jj[i] = garray[pjj[i]];
236c6698e78SStefano Zampini
237ea9daf28SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(ij);
23863c07aadSStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0;
2393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
24063c07aadSStefano Zampini }
24163c07aadSStefano Zampini
MatConvert_HYPRE_IS(Mat A,MatType mtype,MatReuse reuse,Mat * B)242d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_IS(Mat A, MatType mtype, MatReuse reuse, Mat *B)
243d71ae5a4SJacob Faibussowitsch {
244f4f49eeaSPierre Jolivet Mat_HYPRE *mhA = (Mat_HYPRE *)A->data;
2452df22349SStefano Zampini Mat lA;
2462df22349SStefano Zampini ISLocalToGlobalMapping rl2g, cl2g;
2472df22349SStefano Zampini IS is;
2482df22349SStefano Zampini hypre_ParCSRMatrix *hA;
2492df22349SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd;
2502df22349SStefano Zampini MPI_Comm comm;
25139accc25SStefano Zampini HYPRE_Complex *hdd, *hod, *aa;
25239accc25SStefano Zampini PetscScalar *data;
2532cf14000SStefano Zampini HYPRE_BigInt *col_map_offd;
2542cf14000SStefano Zampini HYPRE_Int *hdi, *hdj, *hoi, *hoj;
2552df22349SStefano Zampini PetscInt *ii, *jj, *iptr, *jptr;
2562df22349SStefano Zampini PetscInt cum, dr, dc, oc, str, stc, nnz, i, jd, jo, M, N;
25758968eb6SStefano Zampini HYPRE_Int type;
25806977982Sstefanozampini MatType lmattype = NULL;
25906977982Sstefanozampini PetscBool freeparcsr = PETSC_FALSE;
2602df22349SStefano Zampini
2612df22349SStefano Zampini PetscFunctionBegin;
262a1787963SStefano Zampini comm = PetscObjectComm((PetscObject)A);
263a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(mhA->ij, &type));
26408401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
265a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(mhA->ij, (void **)&hA));
26606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
26706977982Sstefanozampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(mhA->ij)) {
26806977982Sstefanozampini /* Support by copying back on the host and copy to GPU
26906977982Sstefanozampini Kind of inefficient, but this is the best we can do now */
27006977982Sstefanozampini #if defined(HYPRE_USING_HIP)
27106977982Sstefanozampini lmattype = MATSEQAIJHIPSPARSE;
27206977982Sstefanozampini #elif defined(HYPRE_USING_CUDA)
27306977982Sstefanozampini lmattype = MATSEQAIJCUSPARSE;
27406977982Sstefanozampini #endif
27506977982Sstefanozampini hA = hypre_ParCSRMatrixClone_v2(hA, 1, HYPRE_MEMORY_HOST);
27606977982Sstefanozampini freeparcsr = PETSC_TRUE;
27706977982Sstefanozampini }
27806977982Sstefanozampini #endif
2792df22349SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(hA);
2802df22349SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(hA);
2812df22349SStefano Zampini str = hypre_ParCSRMatrixFirstRowIndex(hA);
2822df22349SStefano Zampini stc = hypre_ParCSRMatrixFirstColDiag(hA);
2832df22349SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(hA);
2842df22349SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(hA);
2852df22349SStefano Zampini dr = hypre_CSRMatrixNumRows(hdiag);
2862df22349SStefano Zampini dc = hypre_CSRMatrixNumCols(hdiag);
2872df22349SStefano Zampini nnz = hypre_CSRMatrixNumNonzeros(hdiag);
2882df22349SStefano Zampini hdi = hypre_CSRMatrixI(hdiag);
2892df22349SStefano Zampini hdj = hypre_CSRMatrixJ(hdiag);
2902df22349SStefano Zampini hdd = hypre_CSRMatrixData(hdiag);
2912df22349SStefano Zampini oc = hypre_CSRMatrixNumCols(hoffd);
2922df22349SStefano Zampini nnz += hypre_CSRMatrixNumNonzeros(hoffd);
2932df22349SStefano Zampini hoi = hypre_CSRMatrixI(hoffd);
2942df22349SStefano Zampini hoj = hypre_CSRMatrixJ(hoffd);
2952df22349SStefano Zampini hod = hypre_CSRMatrixData(hoffd);
2962df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) {
2972df22349SStefano Zampini PetscInt *aux;
2982df22349SStefano Zampini
2992df22349SStefano Zampini /* generate l2g maps for rows and cols */
3009566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, dr, str, 1, &is));
3019566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &rl2g));
3029566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is));
3032df22349SStefano Zampini col_map_offd = hypre_ParCSRMatrixColMapOffd(hA);
3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dc + oc, &aux));
3052df22349SStefano Zampini for (i = 0; i < dc; i++) aux[i] = i + stc;
3062df22349SStefano Zampini for (i = 0; i < oc; i++) aux[i + dc] = col_map_offd[i];
3079566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(comm, dc + oc, aux, PETSC_OWN_POINTER, &is));
3089566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreateIS(is, &cl2g));
3099566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is));
3102df22349SStefano Zampini /* create MATIS object */
3119566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, B));
3129566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, dr, dc, M, N));
3139566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATIS));
3149566063dSJacob Faibussowitsch PetscCall(MatSetLocalToGlobalMapping(*B, rl2g, cl2g));
3159566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rl2g));
3169566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cl2g));
3172df22349SStefano Zampini
3182df22349SStefano Zampini /* allocate CSR for local matrix */
3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(dr + 1, &iptr));
3209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jptr));
3219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &data));
3222df22349SStefano Zampini } else {
3232df22349SStefano Zampini PetscInt nr;
3242df22349SStefano Zampini PetscBool done;
3259566063dSJacob Faibussowitsch PetscCall(MatISGetLocalMat(*B, &lA));
3269566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(lA, 0, PETSC_FALSE, PETSC_FALSE, &nr, (const PetscInt **)&iptr, (const PetscInt **)&jptr, &done));
32708401ef6SPierre Jolivet PetscCheck(nr == dr, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of rows in local mat! %" PetscInt_FMT " != %" PetscInt_FMT, nr, dr);
32808401ef6SPierre Jolivet PetscCheck(iptr[nr] >= nnz, PETSC_COMM_SELF, PETSC_ERR_USER, "Cannot reuse mat: invalid number of nonzeros in local mat! reuse %" PetscInt_FMT " requested %" PetscInt_FMT, iptr[nr], nnz);
32906977982Sstefanozampini PetscCall(MatSeqAIJGetArrayWrite(lA, &data));
3302df22349SStefano Zampini }
3312df22349SStefano Zampini /* merge local matrices */
3322df22349SStefano Zampini ii = iptr;
3332df22349SStefano Zampini jj = jptr;
33439accc25SStefano Zampini aa = (HYPRE_Complex *)data; /* this cast fixes the clang error when doing the assignments below: implicit conversion from 'HYPRE_Complex' (aka '_Complex double') to 'double' is not permitted in C++ */
3352df22349SStefano Zampini *ii = *(hdi++) + *(hoi++);
3362df22349SStefano Zampini for (jd = 0, jo = 0, cum = 0; *ii < nnz; cum++) {
33739accc25SStefano Zampini PetscScalar *aold = (PetscScalar *)aa;
3382df22349SStefano Zampini PetscInt *jold = jj, nc = jd + jo;
3399371c9d4SSatish Balay for (; jd < *hdi; jd++) {
3409371c9d4SSatish Balay *jj++ = *hdj++;
3419371c9d4SSatish Balay *aa++ = *hdd++;
3429371c9d4SSatish Balay }
3439371c9d4SSatish Balay for (; jo < *hoi; jo++) {
3449371c9d4SSatish Balay *jj++ = *hoj++ + dc;
3459371c9d4SSatish Balay *aa++ = *hod++;
3469371c9d4SSatish Balay }
3472df22349SStefano Zampini *(++ii) = *(hdi++) + *(hoi++);
3489566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(jd + jo - nc, jold, aold));
3492df22349SStefano Zampini }
3502df22349SStefano Zampini for (; cum < dr; cum++) *(++ii) = nnz;
3512df22349SStefano Zampini if (reuse != MAT_REUSE_MATRIX) {
352a033916dSStefano Zampini Mat_SeqAIJ *a;
353a033916dSStefano Zampini
3549566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PETSC_COMM_SELF, dr, dc + oc, iptr, jptr, data, &lA));
355a033916dSStefano Zampini /* hack SeqAIJ */
356f4f49eeaSPierre Jolivet a = (Mat_SeqAIJ *)lA->data;
357a033916dSStefano Zampini a->free_a = PETSC_TRUE;
358a033916dSStefano Zampini a->free_ij = PETSC_TRUE;
35906977982Sstefanozampini if (lmattype) PetscCall(MatConvert(lA, lmattype, MAT_INPLACE_MATRIX, &lA));
36006977982Sstefanozampini PetscCall(MatISSetLocalMat(*B, lA));
3619566063dSJacob Faibussowitsch PetscCall(MatDestroy(&lA));
36206977982Sstefanozampini } else {
36306977982Sstefanozampini PetscCall(MatSeqAIJRestoreArrayWrite(lA, &data));
3642df22349SStefano Zampini }
3659566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
3669566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
36748a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, B));
368a333fa2bSZach Atkins if (freeparcsr) PetscCallHYPRE(hypre_ParCSRMatrixDestroy(hA));
3693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
3702df22349SStefano Zampini }
3712df22349SStefano Zampini
MatHYPRE_DestroyCOOMat(Mat mat)37206977982Sstefanozampini static PetscErrorCode MatHYPRE_DestroyCOOMat(Mat mat)
373d71ae5a4SJacob Faibussowitsch {
37406977982Sstefanozampini Mat_HYPRE *hA = (Mat_HYPRE *)mat->data;
37563c07aadSStefano Zampini
37663c07aadSStefano Zampini PetscFunctionBegin;
37706977982Sstefanozampini if (hA->cooMat) { /* If cooMat is present we need to destroy the column indices */
37806977982Sstefanozampini PetscCall(MatDestroy(&hA->cooMat));
37906977982Sstefanozampini if (hA->cooMatAttached) {
38006977982Sstefanozampini hypre_CSRMatrix *csr;
38106977982Sstefanozampini hypre_ParCSRMatrix *parcsr;
38206977982Sstefanozampini HYPRE_MemoryLocation mem;
38306977982Sstefanozampini
384a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
38506977982Sstefanozampini csr = hypre_ParCSRMatrixDiag(parcsr);
38606977982Sstefanozampini if (csr) {
38706977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(csr);
38806977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem));
38906977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem));
390b73e3080SStefano Zampini }
39106977982Sstefanozampini csr = hypre_ParCSRMatrixOffd(parcsr);
39206977982Sstefanozampini if (csr) {
39306977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(csr);
39406977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixJ(csr), mem));
39506977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixBigJ(csr), mem));
396b73e3080SStefano Zampini }
397b73e3080SStefano Zampini }
39806977982Sstefanozampini }
39906977982Sstefanozampini hA->cooMatAttached = PETSC_FALSE;
400b73e3080SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS);
401b73e3080SStefano Zampini }
402b73e3080SStefano Zampini
MatHYPRE_CreateCOOMat(Mat mat)40306977982Sstefanozampini static PetscErrorCode MatHYPRE_CreateCOOMat(Mat mat)
404b73e3080SStefano Zampini {
40506977982Sstefanozampini MPI_Comm comm;
40606977982Sstefanozampini PetscMPIInt size;
40706977982Sstefanozampini PetscLayout rmap, cmap;
40806977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
40906977982Sstefanozampini MatType matType = MATAIJ; /* default type of cooMat */
410b73e3080SStefano Zampini
411b73e3080SStefano Zampini PetscFunctionBegin;
41206977982Sstefanozampini /* Build an agent matrix cooMat with AIJ format
41306977982Sstefanozampini It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
41406977982Sstefanozampini */
41506977982Sstefanozampini PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
41606977982Sstefanozampini PetscCallMPI(MPI_Comm_size(comm, &size));
41706977982Sstefanozampini PetscCall(PetscLayoutSetUp(mat->rmap));
41806977982Sstefanozampini PetscCall(PetscLayoutSetUp(mat->cmap));
41906977982Sstefanozampini PetscCall(MatGetLayouts(mat, &rmap, &cmap));
420b73e3080SStefano Zampini
42106977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
42206977982Sstefanozampini if (!mat->boundtocpu) { /* mat will be on device, so will cooMat */
42306977982Sstefanozampini #if defined(HYPRE_USING_HIP)
42406977982Sstefanozampini matType = MATAIJHIPSPARSE;
42506977982Sstefanozampini #elif defined(HYPRE_USING_CUDA)
42606977982Sstefanozampini matType = MATAIJCUSPARSE;
427e64794e4SJunchao Zhang #elif defined(HYPRE_USING_SYCL) && defined(PETSC_HAVE_KOKKOS_KERNELS)
428e64794e4SJunchao Zhang matType = MATAIJKOKKOS;
42906977982Sstefanozampini #else
430e64794e4SJunchao Zhang SETERRQ(comm, PETSC_ERR_SUP, "No HYPRE device available. Suggest re-installing with Kokkos Kernels");
43106977982Sstefanozampini #endif
432b73e3080SStefano Zampini }
43306977982Sstefanozampini #endif
43406977982Sstefanozampini
43506977982Sstefanozampini /* Do COO preallocation through cooMat */
43606977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(mat));
43706977982Sstefanozampini PetscCall(MatCreate(comm, &hmat->cooMat));
43806977982Sstefanozampini PetscCall(MatSetType(hmat->cooMat, matType));
43906977982Sstefanozampini PetscCall(MatSetLayouts(hmat->cooMat, rmap, cmap));
44006977982Sstefanozampini
44106977982Sstefanozampini /* allocate local matrices if needed */
44206977982Sstefanozampini PetscCall(MatMPIAIJSetPreallocation(hmat->cooMat, 0, NULL, 0, NULL));
44306977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
44406977982Sstefanozampini }
44506977982Sstefanozampini
/* Attach the cooMat data array to the hypre matrix.
   Once AIJCUPMSPARSE supports raw device pointers instead of THRUSTARRAY,
   we should swap the arrays, i.e., attach the hypre matrix array to cooMat.
   This is because hypre should be in charge of handling the memory;
   cooMat is only a way to reuse the PETSc COO code.
   Attaching the memory will then be done at MatSetValuesCOO time, and it will dynamically
   support the hypre matrix migrating to the host.
*/
MatHYPRE_AttachCOOMat(Mat mat)45406977982Sstefanozampini static PetscErrorCode MatHYPRE_AttachCOOMat(Mat mat)
45506977982Sstefanozampini {
45606977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
45706977982Sstefanozampini hypre_CSRMatrix *diag, *offd;
45806977982Sstefanozampini hypre_ParCSRMatrix *parCSR;
45906977982Sstefanozampini HYPRE_MemoryLocation hmem = HYPRE_MEMORY_HOST;
46006977982Sstefanozampini PetscMemType pmem;
46106977982Sstefanozampini Mat A, B;
46206977982Sstefanozampini PetscScalar *a;
46306977982Sstefanozampini PetscMPIInt size;
46406977982Sstefanozampini MPI_Comm comm;
46506977982Sstefanozampini
46606977982Sstefanozampini PetscFunctionBegin;
46706977982Sstefanozampini PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
46806977982Sstefanozampini if (hmat->cooMatAttached) PetscFunctionReturn(PETSC_SUCCESS);
46906977982Sstefanozampini PetscCheck(hmat->cooMat->preallocated, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix is not preallocated");
47006977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre"));
47106977982Sstefanozampini PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
47206977982Sstefanozampini PetscCallMPI(MPI_Comm_size(comm, &size));
47306977982Sstefanozampini
47406977982Sstefanozampini /* Alias cooMat's data array to IJMatrix's */
475a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hmat->ij, (void **)&parCSR));
47606977982Sstefanozampini diag = hypre_ParCSRMatrixDiag(parCSR);
47706977982Sstefanozampini offd = hypre_ParCSRMatrixOffd(parCSR);
47806977982Sstefanozampini
47906977982Sstefanozampini A = (size == 1) ? hmat->cooMat : ((Mat_MPIAIJ *)hmat->cooMat->data)->A;
48006977982Sstefanozampini B = (size == 1) ? NULL : ((Mat_MPIAIJ *)hmat->cooMat->data)->B;
48106977982Sstefanozampini
48206977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)A, "_internal_COO_mat_for_hypre"));
48306977982Sstefanozampini hmem = hypre_CSRMatrixMemoryLocation(diag);
48406977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(A, NULL, NULL, &a, &pmem));
48506977982Sstefanozampini PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch");
48606977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(diag), hmem));
48706977982Sstefanozampini hypre_CSRMatrixData(diag) = (HYPRE_Complex *)a;
48806977982Sstefanozampini hypre_CSRMatrixOwnsData(diag) = 0; /* Take ownership of (j,a) away from hypre. As a result, we need to free them on our own */
48906977982Sstefanozampini
49006977982Sstefanozampini if (B) {
49106977982Sstefanozampini hmem = hypre_CSRMatrixMemoryLocation(offd);
49206977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(B, NULL, NULL, &a, &pmem));
49306977982Sstefanozampini PetscAssert((PetscMemTypeHost(pmem) && hmem == HYPRE_MEMORY_HOST) || (PetscMemTypeDevice(pmem) && hmem == HYPRE_MEMORY_DEVICE), comm, PETSC_ERR_PLIB, "PETSc and hypre's memory types mismatch");
49406977982Sstefanozampini PetscStackCallExternalVoid("hypre_TFree", hypre_TFree(hypre_CSRMatrixData(offd), hmem));
49506977982Sstefanozampini hypre_CSRMatrixData(offd) = (HYPRE_Complex *)a;
49606977982Sstefanozampini hypre_CSRMatrixOwnsData(offd) = 0;
49706977982Sstefanozampini }
49806977982Sstefanozampini hmat->cooMatAttached = PETSC_TRUE;
49906977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
50006977982Sstefanozampini }
50106977982Sstefanozampini
5021c265611SJunchao Zhang // Build COO's coordinate list i[], j[] based on CSR's i[], j[] arrays and the number of local rows 'n'
CSRtoCOO_Private(PetscInt n,const PetscInt ii[],const PetscInt jj[],PetscCount * ncoo,PetscInt ** coo_i,PetscInt ** coo_j)50306977982Sstefanozampini static PetscErrorCode CSRtoCOO_Private(PetscInt n, const PetscInt ii[], const PetscInt jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
50406977982Sstefanozampini {
50506977982Sstefanozampini PetscInt *cooi, *cooj;
50606977982Sstefanozampini
50706977982Sstefanozampini PetscFunctionBegin;
50806977982Sstefanozampini *ncoo = ii[n];
50906977982Sstefanozampini PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj));
51006977982Sstefanozampini for (PetscInt i = 0; i < n; i++) {
51106977982Sstefanozampini for (PetscInt j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i;
51206977982Sstefanozampini }
51306977982Sstefanozampini PetscCall(PetscArraycpy(cooj, jj, *ncoo));
51406977982Sstefanozampini *coo_i = cooi;
51506977982Sstefanozampini *coo_j = cooj;
51606977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
51706977982Sstefanozampini }
51806977982Sstefanozampini
5191c265611SJunchao Zhang // Similar to CSRtoCOO_Private, but the CSR's i[], j[] are of type HYPRE_Int
CSRtoCOO_HYPRE_Int_Private(PetscInt n,const HYPRE_Int ii[],const HYPRE_Int jj[],PetscCount * ncoo,PetscInt ** coo_i,PetscInt ** coo_j)52006977982Sstefanozampini static PetscErrorCode CSRtoCOO_HYPRE_Int_Private(PetscInt n, const HYPRE_Int ii[], const HYPRE_Int jj[], PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
52106977982Sstefanozampini {
52206977982Sstefanozampini PetscInt *cooi, *cooj;
52306977982Sstefanozampini
52406977982Sstefanozampini PetscFunctionBegin;
52506977982Sstefanozampini *ncoo = ii[n];
52606977982Sstefanozampini PetscCall(PetscMalloc2(*ncoo, &cooi, *ncoo, &cooj));
52706977982Sstefanozampini for (PetscInt i = 0; i < n; i++) {
52806977982Sstefanozampini for (HYPRE_Int j = ii[i]; j < ii[i + 1]; j++) cooi[j] = i;
52906977982Sstefanozampini }
53006977982Sstefanozampini for (PetscCount i = 0; i < *ncoo; i++) cooj[i] = jj[i];
53106977982Sstefanozampini *coo_i = cooi;
53206977982Sstefanozampini *coo_j = cooj;
53306977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
53406977982Sstefanozampini }
53506977982Sstefanozampini
5361c265611SJunchao Zhang // Build a COO data structure for the seqaij matrix, as if the nonzeros are laid out in the same order as in the CSR
MatSeqAIJGetCOO_Private(Mat A,PetscCount * ncoo,PetscInt ** coo_i,PetscInt ** coo_j)53706977982Sstefanozampini static PetscErrorCode MatSeqAIJGetCOO_Private(Mat A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
53806977982Sstefanozampini {
53906977982Sstefanozampini PetscInt n;
54006977982Sstefanozampini const PetscInt *ii, *jj;
54106977982Sstefanozampini PetscBool done;
54206977982Sstefanozampini
54306977982Sstefanozampini PetscFunctionBegin;
54406977982Sstefanozampini PetscCall(MatGetRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done));
54506977982Sstefanozampini PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatGetRowIJ");
54606977982Sstefanozampini PetscCall(CSRtoCOO_Private(n, ii, jj, ncoo, coo_i, coo_j));
54706977982Sstefanozampini PetscCall(MatRestoreRowIJ(A, 0, PETSC_FALSE, PETSC_FALSE, &n, &ii, &jj, &done));
54806977982Sstefanozampini PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Failure for MatRestoreRowIJ");
54906977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
55006977982Sstefanozampini }
55106977982Sstefanozampini
5521c265611SJunchao Zhang // Build a COO data structure for the hypreCSRMatrix, as if the nonzeros are laid out in the same order as in the hypreCSRMatrix
hypreCSRMatrixGetCOO_Private(hypre_CSRMatrix * A,PetscCount * ncoo,PetscInt ** coo_i,PetscInt ** coo_j)55306977982Sstefanozampini static PetscErrorCode hypreCSRMatrixGetCOO_Private(hypre_CSRMatrix *A, PetscCount *ncoo, PetscInt **coo_i, PetscInt **coo_j)
55406977982Sstefanozampini {
55506977982Sstefanozampini PetscInt n = hypre_CSRMatrixNumRows(A);
55606977982Sstefanozampini HYPRE_Int *ii, *jj;
55706977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
55806977982Sstefanozampini
55906977982Sstefanozampini PetscFunctionBegin;
56006977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
56106977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(A);
56206977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) {
56306977982Sstefanozampini PetscCount nnz = hypre_CSRMatrixNumNonzeros(A);
56406977982Sstefanozampini PetscCall(PetscMalloc2(n + 1, &ii, nnz, &jj));
56506977982Sstefanozampini hypre_TMemcpy(ii, hypre_CSRMatrixI(A), HYPRE_Int, n + 1, HYPRE_MEMORY_HOST, mem);
56606977982Sstefanozampini hypre_TMemcpy(jj, hypre_CSRMatrixJ(A), HYPRE_Int, nnz, HYPRE_MEMORY_HOST, mem);
56706977982Sstefanozampini } else {
56806977982Sstefanozampini #else
56906977982Sstefanozampini {
57006977982Sstefanozampini #endif
57106977982Sstefanozampini ii = hypre_CSRMatrixI(A);
57206977982Sstefanozampini jj = hypre_CSRMatrixJ(A);
57306977982Sstefanozampini }
57406977982Sstefanozampini PetscCall(CSRtoCOO_HYPRE_Int_Private(n, ii, jj, ncoo, coo_i, coo_j));
57506977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree2(ii, jj));
57606977982Sstefanozampini PetscFunctionReturn(PETSC_SUCCESS);
57706977982Sstefanozampini }
57806977982Sstefanozampini
57906977982Sstefanozampini static PetscErrorCode MatSetValuesCOOFromCSRMatrix_Private(Mat A, hypre_CSRMatrix *H)
58006977982Sstefanozampini {
58106977982Sstefanozampini PetscBool iscpu = PETSC_TRUE;
58206977982Sstefanozampini PetscScalar *a;
58306977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
58406977982Sstefanozampini
58506977982Sstefanozampini PetscFunctionBegin;
58606977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
58706977982Sstefanozampini mem = hypre_CSRMatrixMemoryLocation(H);
58806977982Sstefanozampini PetscCall(PetscObjectTypeCompare((PetscObject)A, MATSEQAIJ, &iscpu));
58906977982Sstefanozampini #endif
59006977982Sstefanozampini if (iscpu && mem != HYPRE_MEMORY_HOST) {
59106977982Sstefanozampini PetscCount nnz = hypre_CSRMatrixNumNonzeros(H);
59206977982Sstefanozampini PetscCall(PetscMalloc1(nnz, &a));
59306977982Sstefanozampini hypre_TMemcpy(a, hypre_CSRMatrixData(H), PetscScalar, nnz, HYPRE_MEMORY_HOST, mem);
59406977982Sstefanozampini } else {
59506977982Sstefanozampini a = (PetscScalar *)hypre_CSRMatrixData(H);
59606977982Sstefanozampini }
59706977982Sstefanozampini PetscCall(MatSetValuesCOO(A, a, INSERT_VALUES));
59806977982Sstefanozampini if (iscpu && mem != HYPRE_MEMORY_HOST) PetscCall(PetscFree(a));
599b73e3080SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS);
600b73e3080SStefano Zampini }
601b73e3080SStefano Zampini
602b73e3080SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType type, MatReuse reuse, Mat *B)
603b73e3080SStefano Zampini {
604b73e3080SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A);
60506977982Sstefanozampini Mat M = NULL, dH = NULL, oH = NULL, dA = NULL, oA = NULL;
606d7185485SAlex Lindsay PetscBool ismpiaij, issbaij, isbaij, boundtocpu = PETSC_TRUE;
607b73e3080SStefano Zampini Mat_HYPRE *hA;
608d7185485SAlex Lindsay PetscMemType memtype = PETSC_MEMTYPE_HOST;
609b73e3080SStefano Zampini
610b73e3080SStefano Zampini PetscFunctionBegin;
611d7185485SAlex Lindsay if (PetscDefined(HAVE_HYPRE_DEVICE)) {
612d7185485SAlex Lindsay PetscCall(MatGetCurrentMemType(A, &memtype));
613*5482091fSJunchao Zhang PetscCall(PetscHYPREInitialize());
614d7185485SAlex Lindsay boundtocpu = PetscMemTypeHost(memtype) ? PETSC_TRUE : PETSC_FALSE;
615a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_SetMemoryLocation(boundtocpu ? HYPRE_MEMORY_HOST : HYPRE_MEMORY_DEVICE));
616d7185485SAlex Lindsay }
617d7185485SAlex Lindsay
618b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &issbaij, MATSEQSBAIJ, MATMPIBAIJ, ""));
619b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &isbaij, MATSEQBAIJ, MATMPIBAIJ, ""));
620b73e3080SStefano Zampini if (isbaij || issbaij) { /* handle BAIJ and SBAIJ */
621b73e3080SStefano Zampini PetscBool ismpi;
622b73e3080SStefano Zampini MatType newtype;
623b73e3080SStefano Zampini
624b73e3080SStefano Zampini PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &ismpi, MATMPISBAIJ, MATMPIBAIJ, ""));
625b73e3080SStefano Zampini newtype = ismpi ? MATMPIAIJ : MATSEQAIJ;
62663c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) {
627b73e3080SStefano Zampini PetscCall(MatConvert(*B, newtype, MAT_INPLACE_MATRIX, B));
628b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_REUSE_MATRIX, B));
629b73e3080SStefano Zampini PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B));
630b73e3080SStefano Zampini } else if (reuse == MAT_INITIAL_MATRIX) {
631b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_INITIAL_MATRIX, B));
632b73e3080SStefano Zampini PetscCall(MatConvert(*B, MATHYPRE, MAT_INPLACE_MATRIX, B));
63363c07aadSStefano Zampini } else {
634b73e3080SStefano Zampini PetscCall(MatConvert(A, newtype, MAT_INPLACE_MATRIX, &A));
635b73e3080SStefano Zampini PetscCall(MatConvert(A, MATHYPRE, MAT_INPLACE_MATRIX, &A));
636b73e3080SStefano Zampini }
637d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE)
638d7185485SAlex Lindsay (*B)->boundtocpu = boundtocpu;
639d7185485SAlex Lindsay #endif
640b73e3080SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS);
641b73e3080SStefano Zampini }
64206977982Sstefanozampini
64306977982Sstefanozampini dA = A;
644b73e3080SStefano Zampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
645b73e3080SStefano Zampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(A, &dA, &oA, NULL));
64606977982Sstefanozampini
647b73e3080SStefano Zampini if (reuse != MAT_REUSE_MATRIX) {
64806977982Sstefanozampini PetscCount coo_n;
64906977982Sstefanozampini PetscInt *coo_i, *coo_j;
65006977982Sstefanozampini
6519566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &M));
6529566063dSJacob Faibussowitsch PetscCall(MatSetType(M, MATHYPRE));
6539566063dSJacob Faibussowitsch PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N));
654b73e3080SStefano Zampini PetscCall(MatSetOption(M, MAT_SORTED_FULL, PETSC_TRUE));
655b73e3080SStefano Zampini PetscCall(MatSetOption(M, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE));
656b73e3080SStefano Zampini
657b73e3080SStefano Zampini hA = (Mat_HYPRE *)M->data;
65806977982Sstefanozampini PetscCall(MatHYPRE_CreateFromMat(A, hA));
65906977982Sstefanozampini PetscCall(MatHYPRE_IJMatrixCopyIJ(A, hA->ij));
66006977982Sstefanozampini
66106977982Sstefanozampini PetscCall(MatHYPRE_CreateCOOMat(M));
66206977982Sstefanozampini
66306977982Sstefanozampini dH = hA->cooMat;
66406977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij));
66506977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL));
66606977982Sstefanozampini
66706977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)dH, "_internal_COO_mat_for_hypre"));
66806977982Sstefanozampini PetscCall(MatSeqAIJGetCOO_Private(dA, &coo_n, &coo_i, &coo_j));
66906977982Sstefanozampini PetscCall(MatSetPreallocationCOO(dH, coo_n, coo_i, coo_j));
67006977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j));
67106977982Sstefanozampini if (oH) {
67206977982Sstefanozampini PetscCall(PetscLayoutDestroy(&oH->cmap));
67306977982Sstefanozampini PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oH), oA->cmap->n, oA->cmap->n, 1, &oH->cmap));
67406977982Sstefanozampini PetscCall(MatSeqAIJGetCOO_Private(oA, &coo_n, &coo_i, &coo_j));
67506977982Sstefanozampini PetscCall(MatSetPreallocationCOO(oH, coo_n, coo_i, coo_j));
67606977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j));
67706977982Sstefanozampini }
67806977982Sstefanozampini hA->cooMat->assembled = PETSC_TRUE;
67906977982Sstefanozampini
680b73e3080SStefano Zampini M->preallocated = PETSC_TRUE;
68106977982Sstefanozampini PetscCall(MatAssemblyBegin(M, MAT_FINAL_ASSEMBLY));
68206977982Sstefanozampini PetscCall(MatAssemblyEnd(M, MAT_FINAL_ASSEMBLY));
68306977982Sstefanozampini
68406977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(M));
68584d4e069SStefano Zampini if (reuse == MAT_INITIAL_MATRIX) *B = M;
686b73e3080SStefano Zampini } else M = *B;
687b73e3080SStefano Zampini
688b73e3080SStefano Zampini hA = (Mat_HYPRE *)M->data;
68906977982Sstefanozampini PetscCheck(hA->cooMat, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
69006977982Sstefanozampini
69106977982Sstefanozampini dH = hA->cooMat;
69206977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)hA->cooMat, MATMPIAIJ, &ismpiaij));
69306977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(hA->cooMat, &dH, &oH, NULL));
69406977982Sstefanozampini
69506977982Sstefanozampini PetscScalar *a;
69606977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(dA, NULL, NULL, &a, NULL));
69706977982Sstefanozampini PetscCall(MatSetValuesCOO(dH, a, INSERT_VALUES));
69806977982Sstefanozampini if (oH) {
69906977982Sstefanozampini PetscCall(MatSeqAIJGetCSRAndMemType(oA, NULL, NULL, &a, NULL));
70006977982Sstefanozampini PetscCall(MatSetValuesCOO(oH, a, INSERT_VALUES));
70106977982Sstefanozampini }
702b73e3080SStefano Zampini
70348a46eb9SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M));
704d7185485SAlex Lindsay #if defined(PETSC_HAVE_DEVICE)
705d7185485SAlex Lindsay (*B)->boundtocpu = boundtocpu;
706d7185485SAlex Lindsay #endif
7073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
70863c07aadSStefano Zampini }
70963c07aadSStefano Zampini
710d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatConvert_HYPRE_AIJ(Mat A, MatType mtype, MatReuse reuse, Mat *B)
711d71ae5a4SJacob Faibussowitsch {
71206977982Sstefanozampini Mat M, dA = NULL, oA = NULL;
71363c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr;
71406977982Sstefanozampini hypre_CSRMatrix *dH, *oH;
71563c07aadSStefano Zampini MPI_Comm comm;
71606977982Sstefanozampini PetscBool ismpiaij, isseqaij;
71763c07aadSStefano Zampini
71863c07aadSStefano Zampini PetscFunctionBegin;
71963c07aadSStefano Zampini comm = PetscObjectComm((PetscObject)A);
72063c07aadSStefano Zampini if (reuse == MAT_REUSE_MATRIX) {
7219566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATMPIAIJ, &ismpiaij));
7229566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)*B, MATSEQAIJ, &isseqaij));
72306977982Sstefanozampini PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Only MATMPIAIJ or MATSEQAIJ base types are supported");
72463c07aadSStefano Zampini }
72506977982Sstefanozampini PetscCall(MatHYPREGetParCSR(A, &parcsr));
7266ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
72706977982Sstefanozampini if (HYPRE_MEMORY_DEVICE == hypre_ParCSRMatrixMemoryLocation(parcsr)) {
72806977982Sstefanozampini PetscBool isaij;
72906977982Sstefanozampini
73006977982Sstefanozampini PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij));
73106977982Sstefanozampini if (isaij) {
73206977982Sstefanozampini PetscMPIInt size;
73306977982Sstefanozampini
7349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size));
73506977982Sstefanozampini #if defined(HYPRE_USING_HIP)
73606977982Sstefanozampini mtype = size > 1 ? MATMPIAIJHIPSPARSE : MATSEQAIJHIPSPARSE;
73706977982Sstefanozampini #elif defined(HYPRE_USING_CUDA)
73806977982Sstefanozampini mtype = size > 1 ? MATMPIAIJCUSPARSE : MATSEQAIJCUSPARSE;
73906977982Sstefanozampini #else
74006977982Sstefanozampini mtype = size > 1 ? MATMPIAIJ : MATSEQAIJ;
74106977982Sstefanozampini #endif
74263c07aadSStefano Zampini }
74363c07aadSStefano Zampini }
74406977982Sstefanozampini #endif
74506977982Sstefanozampini dH = hypre_ParCSRMatrixDiag(parcsr);
74606977982Sstefanozampini oH = hypre_ParCSRMatrixOffd(parcsr);
7479371c9d4SSatish Balay if (reuse != MAT_REUSE_MATRIX) {
74806977982Sstefanozampini PetscCount coo_n;
74906977982Sstefanozampini PetscInt *coo_i, *coo_j;
75063c07aadSStefano Zampini
75106977982Sstefanozampini PetscCall(MatCreate(comm, &M));
75206977982Sstefanozampini PetscCall(MatSetType(M, mtype));
75306977982Sstefanozampini PetscCall(MatSetSizes(M, A->rmap->n, A->cmap->n, A->rmap->N, A->cmap->N));
75406977982Sstefanozampini PetscCall(MatMPIAIJSetPreallocation(M, 0, NULL, 0, NULL));
75563c07aadSStefano Zampini
75606977982Sstefanozampini dA = M;
75706977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij));
75806977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL));
759a16187a7SStefano Zampini
76006977982Sstefanozampini PetscCall(hypreCSRMatrixGetCOO_Private(dH, &coo_n, &coo_i, &coo_j));
76106977982Sstefanozampini PetscCall(MatSetPreallocationCOO(dA, coo_n, coo_i, coo_j));
76206977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j));
76306977982Sstefanozampini if (ismpiaij) {
76406977982Sstefanozampini HYPRE_Int nc = hypre_CSRMatrixNumCols(oH);
765a16187a7SStefano Zampini
76606977982Sstefanozampini PetscCall(PetscLayoutDestroy(&oA->cmap));
76706977982Sstefanozampini PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)oA), nc, nc, 1, &oA->cmap));
76806977982Sstefanozampini PetscCall(hypreCSRMatrixGetCOO_Private(oH, &coo_n, &coo_i, &coo_j));
76906977982Sstefanozampini PetscCall(MatSetPreallocationCOO(oA, coo_n, coo_i, coo_j));
77006977982Sstefanozampini PetscCall(PetscFree2(coo_i, coo_j));
771a16187a7SStefano Zampini
77206977982Sstefanozampini /* garray */
773f4f49eeaSPierre Jolivet Mat_MPIAIJ *aij = (Mat_MPIAIJ *)M->data;
77406977982Sstefanozampini HYPRE_BigInt *harray = hypre_ParCSRMatrixColMapOffd(parcsr);
77506977982Sstefanozampini PetscInt *garray;
77606977982Sstefanozampini
77706977982Sstefanozampini PetscCall(PetscFree(aij->garray));
77806977982Sstefanozampini PetscCall(PetscMalloc1(nc, &garray));
77906977982Sstefanozampini for (HYPRE_Int i = 0; i < nc; i++) garray[i] = (PetscInt)harray[i];
78006977982Sstefanozampini aij->garray = garray;
78106977982Sstefanozampini PetscCall(MatSetUpMultiply_MPIAIJ(M));
782a16187a7SStefano Zampini }
78306977982Sstefanozampini if (reuse == MAT_INITIAL_MATRIX) *B = M;
78406977982Sstefanozampini } else M = *B;
785225daaf8SStefano Zampini
78606977982Sstefanozampini dA = M;
78706977982Sstefanozampini PetscCall(PetscObjectBaseTypeCompare((PetscObject)M, MATMPIAIJ, &ismpiaij));
78806977982Sstefanozampini if (ismpiaij) PetscCall(MatMPIAIJGetSeqAIJ(M, &dA, &oA, NULL));
78906977982Sstefanozampini PetscCall(MatSetValuesCOOFromCSRMatrix_Private(dA, dH));
79006977982Sstefanozampini if (oA) PetscCall(MatSetValuesCOOFromCSRMatrix_Private(oA, oH));
79106977982Sstefanozampini M->assembled = PETSC_TRUE;
79206977982Sstefanozampini if (reuse == MAT_INPLACE_MATRIX) PetscCall(MatHeaderReplace(A, &M));
7933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
79463c07aadSStefano Zampini }
79563c07aadSStefano Zampini
796d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJGetParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
797d71ae5a4SJacob Faibussowitsch {
798613e5ff0Sstefano_zampini hypre_ParCSRMatrix *tA;
799c1a070e6SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd;
800c1a070e6SStefano Zampini Mat_SeqAIJ *diag, *offd;
8012cf14000SStefano Zampini PetscInt *garray, i, noffd, dnnz, onnz, *row_starts, *col_starts;
802c1a070e6SStefano Zampini MPI_Comm comm = PetscObjectComm((PetscObject)A);
803613e5ff0Sstefano_zampini PetscBool ismpiaij, isseqaij;
8042cf14000SStefano Zampini PetscBool sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
8056ea7df73SStefano Zampini HYPRE_Int *hdi = NULL, *hdj = NULL, *hoi = NULL, *hoj = NULL;
8065c97c10fSStefano Zampini PetscInt *pdi = NULL, *pdj = NULL, *poi = NULL, *poj = NULL;
80706977982Sstefanozampini PetscBool iscuda, iship;
80806977982Sstefanozampini #if defined(PETSC_HAVE_DEVICE) && defined(PETSC_HAVE_HYPRE_DEVICE)
80906977982Sstefanozampini PetscBool boundtocpu = A->boundtocpu;
81006977982Sstefanozampini #else
81106977982Sstefanozampini PetscBool boundtocpu = PETSC_TRUE;
8126ea7df73SStefano Zampini #endif
813c1a070e6SStefano Zampini
814c1a070e6SStefano Zampini PetscFunctionBegin;
8159566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
8169566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATSEQAIJ, &isseqaij));
81708401ef6SPierre Jolivet PetscCheck(ismpiaij || isseqaij, comm, PETSC_ERR_SUP, "Unsupported type %s", ((PetscObject)A)->type_name);
818b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, ""));
819b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, ""));
820*5482091fSJunchao Zhang PetscCall(PetscHYPREInitialize());
821c1a070e6SStefano Zampini if (ismpiaij) {
822f4f49eeaSPierre Jolivet Mat_MPIAIJ *a = (Mat_MPIAIJ *)A->data;
823c1a070e6SStefano Zampini
824c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)a->A->data;
825c1a070e6SStefano Zampini offd = (Mat_SeqAIJ *)a->B->data;
82606977982Sstefanozampini if (!boundtocpu && (iscuda || iship)) {
82706977982Sstefanozampini #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
82806977982Sstefanozampini if (iscuda) {
8296ea7df73SStefano Zampini sameint = PETSC_TRUE;
8309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
8319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj));
83206977982Sstefanozampini }
8336ea7df73SStefano Zampini #endif
83406977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
83506977982Sstefanozampini if (iship) {
83606977982Sstefanozampini sameint = PETSC_TRUE;
83706977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
83806977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(a->B, PETSC_FALSE, (const HYPRE_Int **)&hoi, (const HYPRE_Int **)&hoj));
83906977982Sstefanozampini }
84006977982Sstefanozampini #endif
84106977982Sstefanozampini } else {
84206977982Sstefanozampini boundtocpu = PETSC_TRUE;
8436ea7df73SStefano Zampini pdi = diag->i;
8446ea7df73SStefano Zampini pdj = diag->j;
8456ea7df73SStefano Zampini poi = offd->i;
8466ea7df73SStefano Zampini poj = offd->j;
8476ea7df73SStefano Zampini if (sameint) {
8486ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi;
8496ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj;
8506ea7df73SStefano Zampini hoi = (HYPRE_Int *)poi;
8516ea7df73SStefano Zampini hoj = (HYPRE_Int *)poj;
8526ea7df73SStefano Zampini }
8536ea7df73SStefano Zampini }
854c1a070e6SStefano Zampini garray = a->garray;
855c1a070e6SStefano Zampini noffd = a->B->cmap->N;
856c1a070e6SStefano Zampini dnnz = diag->nz;
857c1a070e6SStefano Zampini onnz = offd->nz;
858c1a070e6SStefano Zampini } else {
859c1a070e6SStefano Zampini diag = (Mat_SeqAIJ *)A->data;
860c1a070e6SStefano Zampini offd = NULL;
86106977982Sstefanozampini if (!boundtocpu && (iscuda || iship)) {
86206977982Sstefanozampini #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
86306977982Sstefanozampini if (iscuda) {
8646ea7df73SStefano Zampini sameint = PETSC_TRUE;
8659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJCUSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
86606977982Sstefanozampini }
8676ea7df73SStefano Zampini #endif
86806977982Sstefanozampini #if defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
86906977982Sstefanozampini if (iship) {
87006977982Sstefanozampini sameint = PETSC_TRUE;
87106977982Sstefanozampini PetscCall(MatSeqAIJHIPSPARSEGetIJ(A, PETSC_FALSE, (const HYPRE_Int **)&hdi, (const HYPRE_Int **)&hdj));
87206977982Sstefanozampini }
87306977982Sstefanozampini #endif
87406977982Sstefanozampini } else {
87506977982Sstefanozampini boundtocpu = PETSC_TRUE;
8766ea7df73SStefano Zampini pdi = diag->i;
8776ea7df73SStefano Zampini pdj = diag->j;
8786ea7df73SStefano Zampini if (sameint) {
8796ea7df73SStefano Zampini hdi = (HYPRE_Int *)pdi;
8806ea7df73SStefano Zampini hdj = (HYPRE_Int *)pdj;
8816ea7df73SStefano Zampini }
8826ea7df73SStefano Zampini }
883c1a070e6SStefano Zampini garray = NULL;
884c1a070e6SStefano Zampini noffd = 0;
885c1a070e6SStefano Zampini dnnz = diag->nz;
886c1a070e6SStefano Zampini onnz = 0;
887c1a070e6SStefano Zampini }
888225daaf8SStefano Zampini
889c1a070e6SStefano Zampini /* create a temporary ParCSR */
890c1a070e6SStefano Zampini if (HYPRE_AssumedPartitionCheck()) {
891c1a070e6SStefano Zampini PetscMPIInt myid;
892c1a070e6SStefano Zampini
8939566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(comm, &myid));
894c1a070e6SStefano Zampini row_starts = A->rmap->range + myid;
895c1a070e6SStefano Zampini col_starts = A->cmap->range + myid;
896c1a070e6SStefano Zampini } else {
897c1a070e6SStefano Zampini row_starts = A->rmap->range;
898c1a070e6SStefano Zampini col_starts = A->cmap->range;
899c1a070e6SStefano Zampini }
900f2f41e48SZach Atkins tA = hypre_ParCSRMatrixCreate(comm, A->rmap->N, A->cmap->N, (HYPRE_BigInt *)row_starts, (HYPRE_BigInt *)col_starts, (HYPRE_Int)noffd, (HYPRE_Int)dnnz, (HYPRE_Int)onnz);
901a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
902c1a070e6SStefano Zampini hypre_ParCSRMatrixSetRowStartsOwner(tA, 0);
903c1a070e6SStefano Zampini hypre_ParCSRMatrixSetColStartsOwner(tA, 0);
904a1d2239cSSatish Balay #endif
905c1a070e6SStefano Zampini
906225daaf8SStefano Zampini /* set diagonal part */
907c1a070e6SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(tA);
9086ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */
9099566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hdi, dnnz, &hdj));
910f4f49eeaSPierre Jolivet for (i = 0; i < A->rmap->n + 1; i++) hdi[i] = (HYPRE_Int)pdi[i];
911f4f49eeaSPierre Jolivet for (i = 0; i < dnnz; i++) hdj[i] = (HYPRE_Int)pdj[i];
9122cf14000SStefano Zampini }
9136ea7df73SStefano Zampini hypre_CSRMatrixI(hdiag) = hdi;
9146ea7df73SStefano Zampini hypre_CSRMatrixJ(hdiag) = hdj;
91539accc25SStefano Zampini hypre_CSRMatrixData(hdiag) = (HYPRE_Complex *)diag->a;
916f2f41e48SZach Atkins hypre_CSRMatrixNumNonzeros(hdiag) = (HYPRE_Int)diag->nz;
917c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hdiag, 0);
918c1a070e6SStefano Zampini
9194cf0e950SBarry Smith /* set off-diagonal part */
920c1a070e6SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(tA);
921c1a070e6SStefano Zampini if (offd) {
9226ea7df73SStefano Zampini if (!sameint) { /* malloc CSR pointers */
9239566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(A->rmap->n + 1, &hoi, onnz, &hoj));
924f4f49eeaSPierre Jolivet for (i = 0; i < A->rmap->n + 1; i++) hoi[i] = (HYPRE_Int)poi[i];
925f4f49eeaSPierre Jolivet for (i = 0; i < onnz; i++) hoj[i] = (HYPRE_Int)poj[i];
9262cf14000SStefano Zampini }
9276ea7df73SStefano Zampini hypre_CSRMatrixI(hoffd) = hoi;
9286ea7df73SStefano Zampini hypre_CSRMatrixJ(hoffd) = hoj;
92939accc25SStefano Zampini hypre_CSRMatrixData(hoffd) = (HYPRE_Complex *)offd->a;
930f2f41e48SZach Atkins hypre_CSRMatrixNumNonzeros(hoffd) = (HYPRE_Int)offd->nz;
931c1a070e6SStefano Zampini hypre_CSRMatrixSetDataOwner(hoffd, 0);
9326ea7df73SStefano Zampini }
9336ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
934a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, !boundtocpu ? HYPRE_MEMORY_DEVICE : HYPRE_MEMORY_HOST));
9356ea7df73SStefano Zampini #else
9366ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
937a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize(tA));
9386ea7df73SStefano Zampini #else
939a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixInitialize_v2(tA, HYPRE_MEMORY_HOST));
9406ea7df73SStefano Zampini #endif
9416ea7df73SStefano Zampini #endif
942bb16242fSVictor A. P. Magri
943bb16242fSVictor A. P. Magri /* MatrixSetRownnz comes after MatrixInitialize, so the first uses the right memory location */
944bb16242fSVictor A. P. Magri hypre_CSRMatrixSetRownnz(hdiag);
945bb16242fSVictor A. P. Magri if (offd) hypre_CSRMatrixSetRownnz(hoffd);
946bb16242fSVictor A. P. Magri
9476ea7df73SStefano Zampini hypre_TFree(hypre_ParCSRMatrixColMapOffd(tA), HYPRE_MEMORY_HOST);
948c1a070e6SStefano Zampini hypre_ParCSRMatrixSetNumNonzeros(tA);
9492cf14000SStefano Zampini hypre_ParCSRMatrixColMapOffd(tA) = (HYPRE_BigInt *)garray;
950a333fa2bSZach Atkins if (!hypre_ParCSRMatrixCommPkg(tA)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(tA));
951613e5ff0Sstefano_zampini *hA = tA;
9523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
953613e5ff0Sstefano_zampini }
954c1a070e6SStefano Zampini
955d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAIJRestoreParCSR_Private(Mat A, hypre_ParCSRMatrix **hA)
956d71ae5a4SJacob Faibussowitsch {
957613e5ff0Sstefano_zampini hypre_CSRMatrix *hdiag, *hoffd;
9586ea7df73SStefano Zampini PetscBool ismpiaij, sameint = (PetscBool)(sizeof(PetscInt) == sizeof(HYPRE_Int));
959b655ebf8SZach Atkins PetscBool iscuda, iship;
960c1a070e6SStefano Zampini
961613e5ff0Sstefano_zampini PetscFunctionBegin;
9629566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)A, MATMPIAIJ, &ismpiaij));
9639566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iscuda, MATSEQAIJCUSPARSE, MATMPIAIJCUSPARSE, ""));
964b655ebf8SZach Atkins PetscCall(PetscObjectTypeCompareAny((PetscObject)A, &iship, MATSEQAIJHIPSPARSE, MATMPIAIJHIPSPARSE, ""));
965b655ebf8SZach Atkins #if defined(HYPRE_USING_CUDA) && defined(PETSC_HAVE_CUDA)
9666ea7df73SStefano Zampini if (iscuda) sameint = PETSC_TRUE;
967b655ebf8SZach Atkins #elif defined(HYPRE_USING_HIP) && defined(PETSC_HAVE_HIP)
968b655ebf8SZach Atkins if (iship) sameint = PETSC_TRUE;
9696ea7df73SStefano Zampini #endif
970613e5ff0Sstefano_zampini hdiag = hypre_ParCSRMatrixDiag(*hA);
971613e5ff0Sstefano_zampini hoffd = hypre_ParCSRMatrixOffd(*hA);
9726ea7df73SStefano Zampini /* free temporary memory allocated by PETSc
9736ea7df73SStefano Zampini set pointers to NULL before destroying tA */
9742cf14000SStefano Zampini if (!sameint) {
9752cf14000SStefano Zampini HYPRE_Int *hi, *hj;
9762cf14000SStefano Zampini
9772cf14000SStefano Zampini hi = hypre_CSRMatrixI(hdiag);
9782cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hdiag);
9799566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj));
9806ea7df73SStefano Zampini if (ismpiaij) {
9812cf14000SStefano Zampini hi = hypre_CSRMatrixI(hoffd);
9822cf14000SStefano Zampini hj = hypre_CSRMatrixJ(hoffd);
9839566063dSJacob Faibussowitsch PetscCall(PetscFree2(hi, hj));
9842cf14000SStefano Zampini }
9852cf14000SStefano Zampini }
986c1a070e6SStefano Zampini hypre_CSRMatrixI(hdiag) = NULL;
987c1a070e6SStefano Zampini hypre_CSRMatrixJ(hdiag) = NULL;
988c1a070e6SStefano Zampini hypre_CSRMatrixData(hdiag) = NULL;
9896ea7df73SStefano Zampini if (ismpiaij) {
990c1a070e6SStefano Zampini hypre_CSRMatrixI(hoffd) = NULL;
991c1a070e6SStefano Zampini hypre_CSRMatrixJ(hoffd) = NULL;
992c1a070e6SStefano Zampini hypre_CSRMatrixData(hoffd) = NULL;
9936ea7df73SStefano Zampini }
994613e5ff0Sstefano_zampini hypre_ParCSRMatrixColMapOffd(*hA) = NULL;
995613e5ff0Sstefano_zampini hypre_ParCSRMatrixDestroy(*hA);
996613e5ff0Sstefano_zampini *hA = NULL;
9973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
998613e5ff0Sstefano_zampini }
999613e5ff0Sstefano_zampini
1000613e5ff0Sstefano_zampini /* calls RAP from BoomerAMG:
10013dad0653Sstefano_zampini the resulting ParCSR will not own the column and row starts
10026ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */
1003d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_RAP(hypre_ParCSRMatrix *hR, hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hP, hypre_ParCSRMatrix **hRAP)
1004d71ae5a4SJacob Faibussowitsch {
1005a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1006613e5ff0Sstefano_zampini HYPRE_Int P_owns_col_starts, R_owns_row_starts;
1007a1d2239cSSatish Balay #endif
1008613e5ff0Sstefano_zampini
1009613e5ff0Sstefano_zampini PetscFunctionBegin;
1010a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1011613e5ff0Sstefano_zampini P_owns_col_starts = hypre_ParCSRMatrixOwnsColStarts(hP);
1012613e5ff0Sstefano_zampini R_owns_row_starts = hypre_ParCSRMatrixOwnsRowStarts(hR);
1013a1d2239cSSatish Balay #endif
10146ea7df73SStefano Zampini /* can be replaced by version test later */
10156ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
1016792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatrixRAP");
10176ea7df73SStefano Zampini *hRAP = hypre_ParCSRMatrixRAP(hR, hA, hP);
10186ea7df73SStefano Zampini PetscStackPop;
10196ea7df73SStefano Zampini #else
1020a333fa2bSZach Atkins PetscCallHYPRE(hypre_BoomerAMGBuildCoarseOperator(hR, hA, hP, hRAP));
1021a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixSetNumNonzeros(*hRAP));
10226ea7df73SStefano Zampini #endif
1023613e5ff0Sstefano_zampini /* hypre_BoomerAMGBuildCoarseOperator steals the col_starts from P and the row_starts from R */
1024a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
1025613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetRowStartsOwner(*hRAP, 0);
1026613e5ff0Sstefano_zampini hypre_ParCSRMatrixSetColStartsOwner(*hRAP, 0);
1027613e5ff0Sstefano_zampini if (P_owns_col_starts) hypre_ParCSRMatrixSetColStartsOwner(hP, 1);
1028613e5ff0Sstefano_zampini if (R_owns_row_starts) hypre_ParCSRMatrixSetRowStartsOwner(hR, 1);
1029a1d2239cSSatish Balay #endif
10303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1031613e5ff0Sstefano_zampini }
1032613e5ff0Sstefano_zampini
1033d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat P, Mat C)
1034d71ae5a4SJacob Faibussowitsch {
10356f231fbdSstefano_zampini Mat B;
10366abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hP, *hPtAP = NULL;
10374222ddf1SHong Zhang Mat_Product *product = C->product;
1038613e5ff0Sstefano_zampini
1039613e5ff0Sstefano_zampini PetscFunctionBegin;
10409566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA));
10419566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(P, &hP));
10429566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hP, hA, hP, &hPtAP));
10439566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hPtAP, MATAIJ, PETSC_OWN_POINTER, &B));
10444222ddf1SHong Zhang
10459566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B));
10464222ddf1SHong Zhang C->product = product;
10474222ddf1SHong Zhang
10489566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
10499566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(P, &hP));
10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10516f231fbdSstefano_zampini }
10526f231fbdSstefano_zampini
1053d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatPtAPSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat P, PetscReal fill, Mat C)
1054d71ae5a4SJacob Faibussowitsch {
10556f231fbdSstefano_zampini PetscFunctionBegin;
10569566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ));
10574222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_AIJ_wHYPRE;
10584222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP;
10593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1060613e5ff0Sstefano_zampini }
1061613e5ff0Sstefano_zampini
1062d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_AIJ_HYPRE(Mat A, Mat P, Mat C)
1063d71ae5a4SJacob Faibussowitsch {
10644cc28894Sstefano_zampini Mat B;
10654cc28894Sstefano_zampini Mat_HYPRE *hP;
10666abb4441SStefano Zampini hypre_ParCSRMatrix *hA = NULL, *Pparcsr, *ptapparcsr = NULL;
1067613e5ff0Sstefano_zampini HYPRE_Int type;
1068613e5ff0Sstefano_zampini MPI_Comm comm = PetscObjectComm((PetscObject)A);
10694cc28894Sstefano_zampini PetscBool ishypre;
1070613e5ff0Sstefano_zampini
1071613e5ff0Sstefano_zampini PetscFunctionBegin;
10729566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
107328b400f6SJacob Faibussowitsch PetscCheck(ishypre, comm, PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
10744cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data;
1075a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type));
107608401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, comm, PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1077a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr));
1078613e5ff0Sstefano_zampini
10799566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA));
10809566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, hA, Pparcsr, &ptapparcsr));
10819566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
1082225daaf8SStefano Zampini
10834cc28894Sstefano_zampini /* create temporary matrix and merge to C */
10849566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, ((PetscObject)C)->type_name, PETSC_OWN_POINTER, &B));
10859566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B));
10863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10874cc28894Sstefano_zampini }
10884cc28894Sstefano_zampini
1089d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatPtAPNumeric_HYPRE_HYPRE(Mat A, Mat P, Mat C)
1090d71ae5a4SJacob Faibussowitsch {
10914cc28894Sstefano_zampini Mat B;
10926abb4441SStefano Zampini hypre_ParCSRMatrix *Aparcsr, *Pparcsr, *ptapparcsr = NULL;
10934cc28894Sstefano_zampini Mat_HYPRE *hA, *hP;
10944cc28894Sstefano_zampini PetscBool ishypre;
10954cc28894Sstefano_zampini HYPRE_Int type;
10964cc28894Sstefano_zampini
10974cc28894Sstefano_zampini PetscFunctionBegin;
10989566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)P, MATHYPRE, &ishypre));
109928b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)P), PETSC_ERR_USER, "P should be of type %s", MATHYPRE);
11009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
110128b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
11024cc28894Sstefano_zampini hA = (Mat_HYPRE *)A->data;
11034cc28894Sstefano_zampini hP = (Mat_HYPRE *)P->data;
1104a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
110508401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1106a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hP->ij, &type));
110708401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)P), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1108a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr));
1109a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hP->ij, (void **)&Pparcsr));
11109566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(Pparcsr, Aparcsr, Pparcsr, &ptapparcsr));
11119566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ptapparcsr, MATHYPRE, PETSC_OWN_POINTER, &B));
11129566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &B));
11133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
11144cc28894Sstefano_zampini }
11154cc28894Sstefano_zampini
1116d501dc42Sstefano_zampini /* calls hypre_ParMatmul
1117d501dc42Sstefano_zampini hypre_ParMatMul uses hypre_ParMatrixCreate with the communicator of hA
11183dad0653Sstefano_zampini hypre_ParMatrixCreate does not duplicate the communicator
11196ea7df73SStefano Zampini It looks like we don't need to have the diagonal entries ordered first */
1120d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_ParCSR_MatMatMult(hypre_ParCSRMatrix *hA, hypre_ParCSRMatrix *hB, hypre_ParCSRMatrix **hAB)
1121d71ae5a4SJacob Faibussowitsch {
1122d501dc42Sstefano_zampini PetscFunctionBegin;
11236ea7df73SStefano Zampini /* can be replaced by version test later */
11246ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
1125792fecdfSBarry Smith PetscStackPushExternal("hypre_ParCSRMatMat");
11266ea7df73SStefano Zampini *hAB = hypre_ParCSRMatMat(hA, hB);
11276ea7df73SStefano Zampini #else
1128792fecdfSBarry Smith PetscStackPushExternal("hypre_ParMatmul");
1129d501dc42Sstefano_zampini *hAB = hypre_ParMatmul(hA, hB);
11306ea7df73SStefano Zampini #endif
1131d501dc42Sstefano_zampini PetscStackPop;
11323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1133d501dc42Sstefano_zampini }
1134d501dc42Sstefano_zampini
1135d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C)
1136d71ae5a4SJacob Faibussowitsch {
11375e5acdf2Sstefano_zampini Mat D;
1138d501dc42Sstefano_zampini hypre_ParCSRMatrix *hA, *hB, *hAB = NULL;
11394222ddf1SHong Zhang Mat_Product *product = C->product;
11405e5acdf2Sstefano_zampini
11415e5acdf2Sstefano_zampini PetscFunctionBegin;
11429566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA));
11439566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB));
11449566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(hA, hB, &hAB));
11459566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hAB, MATAIJ, PETSC_OWN_POINTER, &D));
11464222ddf1SHong Zhang
11479566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(C, &D));
11484222ddf1SHong Zhang C->product = product;
11494222ddf1SHong Zhang
11509566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
11519566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
11523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
11535e5acdf2Sstefano_zampini }
11545e5acdf2Sstefano_zampini
1155d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultSymbolic_AIJ_AIJ_wHYPRE(Mat A, Mat B, PetscReal fill, Mat C)
1156d71ae5a4SJacob Faibussowitsch {
11575e5acdf2Sstefano_zampini PetscFunctionBegin;
11589566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ));
11594222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_AIJ_AIJ_wHYPRE;
11604222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB;
11613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
11625e5acdf2Sstefano_zampini }
11635e5acdf2Sstefano_zampini
1164d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMatMultNumeric_HYPRE_HYPRE(Mat A, Mat B, Mat C)
1165d71ae5a4SJacob Faibussowitsch {
1166d501dc42Sstefano_zampini Mat D;
1167d501dc42Sstefano_zampini hypre_ParCSRMatrix *Aparcsr, *Bparcsr, *ABparcsr = NULL;
1168d501dc42Sstefano_zampini Mat_HYPRE *hA, *hB;
1169d501dc42Sstefano_zampini PetscBool ishypre;
1170d501dc42Sstefano_zampini HYPRE_Int type;
11714222ddf1SHong Zhang Mat_Product *product;
1172d501dc42Sstefano_zampini
1173d501dc42Sstefano_zampini PetscFunctionBegin;
11749566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHYPRE, &ishypre));
117528b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)B), PETSC_ERR_USER, "B should be of type %s", MATHYPRE);
11769566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &ishypre));
117728b400f6SJacob Faibussowitsch PetscCheck(ishypre, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "A should be of type %s", MATHYPRE);
1178d501dc42Sstefano_zampini hA = (Mat_HYPRE *)A->data;
1179d501dc42Sstefano_zampini hB = (Mat_HYPRE *)B->data;
1180a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
118108401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1182a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hB->ij, &type));
118308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Only HYPRE_PARCSR is supported");
1184a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&Aparcsr));
1185a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hB->ij, (void **)&Bparcsr));
11869566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_MatMatMult(Aparcsr, Bparcsr, &ABparcsr));
11879566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(ABparcsr, MATHYPRE, PETSC_OWN_POINTER, &D));
11884222ddf1SHong Zhang
1189d501dc42Sstefano_zampini /* need to use HeaderReplace because HeaderMerge messes up with the communicator */
11904222ddf1SHong Zhang product = C->product; /* save it from MatHeaderReplace() */
11914222ddf1SHong Zhang C->product = NULL;
11929566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(C, &D));
11934222ddf1SHong Zhang C->product = product;
1194d501dc42Sstefano_zampini C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE;
11954222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB;
11963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1197d501dc42Sstefano_zampini }
1198d501dc42Sstefano_zampini
1199d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultNumeric_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, Mat D)
1200d71ae5a4SJacob Faibussowitsch {
120120e1dc0dSstefano_zampini Mat E;
12026abb4441SStefano Zampini hypre_ParCSRMatrix *hA, *hB, *hC, *hABC = NULL;
120320e1dc0dSstefano_zampini
120420e1dc0dSstefano_zampini PetscFunctionBegin;
12059566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(A, &hA));
12069566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(B, &hB));
12079566063dSJacob Faibussowitsch PetscCall(MatAIJGetParCSR_Private(C, &hC));
12089566063dSJacob Faibussowitsch PetscCall(MatHYPRE_ParCSR_RAP(hA, hB, hC, &hABC));
12099566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(hABC, MATAIJ, PETSC_OWN_POINTER, &E));
12109566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(D, &E));
12119566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(A, &hA));
12129566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(B, &hB));
12139566063dSJacob Faibussowitsch PetscCall(MatAIJRestoreParCSR_Private(C, &hC));
12143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
121520e1dc0dSstefano_zampini }
121620e1dc0dSstefano_zampini
1217d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTransposeMatMatMultSymbolic_AIJ_AIJ_AIJ_wHYPRE(Mat A, Mat B, Mat C, PetscReal fill, Mat D)
1218d71ae5a4SJacob Faibussowitsch {
121920e1dc0dSstefano_zampini PetscFunctionBegin;
12209566063dSJacob Faibussowitsch PetscCall(MatSetType(D, MATAIJ));
12213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
122220e1dc0dSstefano_zampini }
122320e1dc0dSstefano_zampini
1224d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_AB_HYPRE(Mat C)
1225d71ae5a4SJacob Faibussowitsch {
12264222ddf1SHong Zhang PetscFunctionBegin;
12274222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB;
12283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12294222ddf1SHong Zhang }
12304222ddf1SHong Zhang
1231d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_AB(Mat C)
1232d71ae5a4SJacob Faibussowitsch {
12334222ddf1SHong Zhang Mat_Product *product = C->product;
12344222ddf1SHong Zhang PetscBool Ahypre;
12354222ddf1SHong Zhang
12364222ddf1SHong Zhang PetscFunctionBegin;
12379566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)product->A, MATHYPRE, &Ahypre));
12384222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */
12399566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE));
12404222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB_HYPRE;
12414222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_HYPRE_HYPRE;
12423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12436718818eSStefano Zampini }
12443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12454222ddf1SHong Zhang }
12464222ddf1SHong Zhang
1247d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSymbolic_PtAP_HYPRE(Mat C)
1248d71ae5a4SJacob Faibussowitsch {
12494222ddf1SHong Zhang PetscFunctionBegin;
12504222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_PtAP;
12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12524222ddf1SHong Zhang }
12534222ddf1SHong Zhang
1254d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE_PtAP(Mat C)
1255d71ae5a4SJacob Faibussowitsch {
12564222ddf1SHong Zhang Mat_Product *product = C->product;
12574222ddf1SHong Zhang PetscBool flg;
12584222ddf1SHong Zhang PetscInt type = 0;
12594222ddf1SHong Zhang const char *outTypes[4] = {"aij", "seqaij", "mpiaij", "hypre"};
12604222ddf1SHong Zhang PetscInt ntype = 4;
12614222ddf1SHong Zhang Mat A = product->A;
12624222ddf1SHong Zhang PetscBool Ahypre;
12634222ddf1SHong Zhang
12644222ddf1SHong Zhang PetscFunctionBegin;
12659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)A, MATHYPRE, &Ahypre));
12664222ddf1SHong Zhang if (Ahypre) { /* A is a Hypre matrix */
12679566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE));
12684222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
12694222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_HYPRE_HYPRE;
12703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12714222ddf1SHong Zhang }
12724222ddf1SHong Zhang
12734222ddf1SHong Zhang /* A is AIJ, P is Hypre, C = PtAP can be either AIJ or Hypre format */
12744222ddf1SHong Zhang /* Get runtime option */
12754222ddf1SHong Zhang if (product->api_user) {
1276d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatPtAP_HYPRE", "Mat");
12779566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-matptap_hypre_outtype", "MatPtAP outtype", "MatPtAP outtype", outTypes, ntype, outTypes[type], &type, &flg));
1278d0609cedSBarry Smith PetscOptionsEnd();
12794222ddf1SHong Zhang } else {
1280d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)C), ((PetscObject)C)->prefix, "MatProduct_PtAP_HYPRE", "Mat");
12819566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_product_algorithm_hypre_outtype", "MatProduct_PtAP outtype", "MatProduct_PtAP", outTypes, ntype, outTypes[type], &type, &flg));
1282d0609cedSBarry Smith PetscOptionsEnd();
12834222ddf1SHong Zhang }
12844222ddf1SHong Zhang
12854222ddf1SHong Zhang if (type == 0 || type == 1 || type == 2) {
12869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATAIJ));
12874222ddf1SHong Zhang } else if (type == 3) {
12889566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATHYPRE));
12894222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C), PETSC_ERR_SUP, "MatPtAP outtype is not supported");
12904222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_PtAP_HYPRE;
12914222ddf1SHong Zhang C->ops->ptapnumeric = MatPtAPNumeric_AIJ_HYPRE;
12923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
12934222ddf1SHong Zhang }
12944222ddf1SHong Zhang
1295d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatProductSetFromOptions_HYPRE(Mat C)
1296d71ae5a4SJacob Faibussowitsch {
12974222ddf1SHong Zhang Mat_Product *product = C->product;
12984222ddf1SHong Zhang
12994222ddf1SHong Zhang PetscFunctionBegin;
13004222ddf1SHong Zhang switch (product->type) {
1301d71ae5a4SJacob Faibussowitsch case MATPRODUCT_AB:
1302d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_AB(C));
1303d71ae5a4SJacob Faibussowitsch break;
1304d71ae5a4SJacob Faibussowitsch case MATPRODUCT_PtAP:
1305d71ae5a4SJacob Faibussowitsch PetscCall(MatProductSetFromOptions_HYPRE_PtAP(C));
1306d71ae5a4SJacob Faibussowitsch break;
1307d71ae5a4SJacob Faibussowitsch default:
1308d71ae5a4SJacob Faibussowitsch break;
13094222ddf1SHong Zhang }
13103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
13114222ddf1SHong Zhang }
13124222ddf1SHong Zhang
1313d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTranspose_HYPRE(Mat A, Vec x, Vec y)
1314d71ae5a4SJacob Faibussowitsch {
131563c07aadSStefano Zampini PetscFunctionBegin;
13169566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_TRUE));
13173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
131863c07aadSStefano Zampini }
131963c07aadSStefano Zampini
1320d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_HYPRE(Mat A, Vec x, Vec y)
1321d71ae5a4SJacob Faibussowitsch {
132263c07aadSStefano Zampini PetscFunctionBegin;
13239566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 0.0, y, PETSC_FALSE));
13243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
132563c07aadSStefano Zampini }
132663c07aadSStefano Zampini
1327d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1328d71ae5a4SJacob Faibussowitsch {
1329414bd5c3SStefano Zampini PetscFunctionBegin;
133048a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z));
13319566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_FALSE));
13323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1333414bd5c3SStefano Zampini }
1334414bd5c3SStefano Zampini
1335d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultTransposeAdd_HYPRE(Mat A, Vec x, Vec y, Vec z)
1336d71ae5a4SJacob Faibussowitsch {
1337414bd5c3SStefano Zampini PetscFunctionBegin;
133848a46eb9SPierre Jolivet if (y != z) PetscCall(VecCopy(y, z));
13399566063dSJacob Faibussowitsch PetscCall(MatHYPRE_MultKernel_Private(A, 1.0, x, 1.0, z, PETSC_TRUE));
13403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1341414bd5c3SStefano Zampini }
1342414bd5c3SStefano Zampini
1343414bd5c3SStefano Zampini /* y = a * A * x + b * y or y = a * A^t * x + b * y depending on trans */
1344d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRE_MultKernel_Private(Mat A, HYPRE_Complex a, Vec x, HYPRE_Complex b, Vec y, PetscBool trans)
1345d71ae5a4SJacob Faibussowitsch {
134663c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
134763c07aadSStefano Zampini hypre_ParCSRMatrix *parcsr;
134863c07aadSStefano Zampini hypre_ParVector *hx, *hy;
134963c07aadSStefano Zampini
135063c07aadSStefano Zampini PetscFunctionBegin;
135163c07aadSStefano Zampini if (trans) {
13529566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->b, x));
13539566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->x, y));
13549566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->x, y));
1355a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hx));
1356a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hy));
135763c07aadSStefano Zampini } else {
13589566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPushVecRead(hA->x, x));
13599566063dSJacob Faibussowitsch if (b != 0.0) PetscCall(VecHYPRE_IJVectorPushVec(hA->b, y));
13609566063dSJacob Faibussowitsch else PetscCall(VecHYPRE_IJVectorPushVecWrite(hA->b, y));
1361a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->x->ij, (void **)&hx));
1362a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJVectorGetObject(hA->b->ij, (void **)&hy));
136363c07aadSStefano Zampini }
1364a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
13656ea7df73SStefano Zampini if (trans) {
1366a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMatvecT(a, parcsr, hx, b, hy));
13676ea7df73SStefano Zampini } else {
1368a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMatvec(a, parcsr, hx, b, hy));
13696ea7df73SStefano Zampini }
13709566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->x));
13719566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorPopVec(hA->b));
13723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
137363c07aadSStefano Zampini }
137463c07aadSStefano Zampini
1375d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_HYPRE(Mat A)
1376d71ae5a4SJacob Faibussowitsch {
137763c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
137863c07aadSStefano Zampini
137963c07aadSStefano Zampini PetscFunctionBegin;
13809566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->x));
13819566063dSJacob Faibussowitsch PetscCall(VecHYPRE_IJVectorDestroy(&hA->b));
138206977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(A)); /* must be called before destroying the individual CSR */
1383978814f1SStefano Zampini if (hA->ij) {
1384978814f1SStefano Zampini if (!hA->inner_free) hypre_IJMatrixObject(hA->ij) = NULL;
1385a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixDestroy(hA->ij));
1386978814f1SStefano Zampini }
13879566063dSJacob Faibussowitsch if (hA->comm) PetscCall(PetscCommRestoreComm(PetscObjectComm((PetscObject)A), &hA->comm));
1388c69f721fSFande Kong
13899566063dSJacob Faibussowitsch PetscCall(MatStashDestroy_Private(&A->stash));
13909566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array));
1391a32e9c99SJunchao Zhang if (hA->rows_d) PetscStackCallExternalVoid("hypre_Free", hypre_Free(hA->rows_d, HYPRE_MEMORY_DEVICE));
1392c69f721fSFande Kong
13939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_aij_C", NULL));
13949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_hypre_is_C", NULL));
13959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_hypre_C", NULL));
13969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaij_hypre_C", NULL));
139706977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", NULL));
139806977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", NULL));
139906977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_hypre_C", NULL));
140006977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", NULL));
14019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPRESetPreallocation_C", NULL));
14029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatHYPREGetParCSR_C", NULL));
14035fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
14045fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
14059566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data));
14063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
140763c07aadSStefano Zampini }
140863c07aadSStefano Zampini
1409d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_HYPRE(Mat A)
1410d71ae5a4SJacob Faibussowitsch {
14114ec6421dSstefano_zampini PetscFunctionBegin;
141206977982Sstefanozampini if (!A->preallocated) PetscCall(MatHYPRESetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL));
14133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
14144ec6421dSstefano_zampini }
14154ec6421dSstefano_zampini
14166ea7df73SStefano Zampini //TODO FIX hypre_CSRMatrixMatvecOutOfPlace
#if defined(PETSC_HAVE_HYPRE_DEVICE)
/*
  MatBindToCPU_HYPRE - records the binding flag on A and moves the hypre data accordingly.

  The target memory location is the host when bind is true and the device
  otherwise. The ParCSR matrix is migrated only if the IJ matrix exists, is
  assembled, and currently lives in a different location. The work vectors,
  when present, are bound as well.
*/
static PetscErrorCode MatBindToCPU_HYPRE(Mat A, PetscBool bind)
{
  Mat_HYPRE           *hmat   = (Mat_HYPRE *)A->data;
  HYPRE_MemoryLocation target = HYPRE_MEMORY_DEVICE;

  PetscFunctionBegin;
  if (bind) target = HYPRE_MEMORY_HOST;
  A->boundtocpu = bind;
  if (hmat->ij && hypre_IJMatrixAssembleFlag(hmat->ij) && target != hypre_IJMatrixMemoryLocation(hmat->ij)) {
    hypre_ParCSRMatrix *par;

    PetscCallHYPRE(HYPRE_IJMatrixGetObject(hmat->ij, (void **)&par));
    PetscCallHYPRE(hypre_ParCSRMatrixMigrate(par, target));
  }
  if (hmat->x) {
    PetscCall(VecHYPRE_IJBindToCPU(hmat->x, bind));
  }
  if (hmat->b) {
    PetscCall(VecHYPRE_IJBindToCPU(hmat->b, bind));
  }
  PetscFunctionReturn(PETSC_SUCCESS);
}
#endif
14356ea7df73SStefano Zampini
1436d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_HYPRE(Mat A, MatAssemblyType mode)
1437d71ae5a4SJacob Faibussowitsch {
143863c07aadSStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1439c69f721fSFande Kong PetscMPIInt n;
1440c69f721fSFande Kong PetscInt i, j, rstart, ncols, flg;
1441c69f721fSFande Kong PetscInt *row, *col;
1442c69f721fSFande Kong PetscScalar *val;
144363c07aadSStefano Zampini
144463c07aadSStefano Zampini PetscFunctionBegin;
144508401ef6SPierre Jolivet PetscCheck(mode != MAT_FLUSH_ASSEMBLY, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_FLUSH_ASSEMBLY currently not supported with MATHYPRE");
1446c69f721fSFande Kong
1447c69f721fSFande Kong if (!A->nooffprocentries) {
1448c69f721fSFande Kong while (1) {
14499566063dSJacob Faibussowitsch PetscCall(MatStashScatterGetMesg_Private(&A->stash, &n, &row, &col, &val, &flg));
1450c69f721fSFande Kong if (!flg) break;
1451c69f721fSFande Kong
1452c69f721fSFande Kong for (i = 0; i < n;) {
1453c69f721fSFande Kong /* Now identify the consecutive vals belonging to the same row */
1454c69f721fSFande Kong for (j = i, rstart = row[j]; j < n; j++) {
1455c69f721fSFande Kong if (row[j] != rstart) break;
1456c69f721fSFande Kong }
1457c69f721fSFande Kong if (j < n) ncols = j - i;
1458c69f721fSFande Kong else ncols = n - i;
1459c69f721fSFande Kong /* Now assemble all these values with a single function call */
14609566063dSJacob Faibussowitsch PetscCall(MatSetValues_HYPRE(A, 1, row + i, ncols, col + i, val + i, A->insertmode));
1461c69f721fSFande Kong
1462c69f721fSFande Kong i = j;
1463c69f721fSFande Kong }
1464c69f721fSFande Kong }
14659566063dSJacob Faibussowitsch PetscCall(MatStashScatterEnd_Private(&A->stash));
1466c69f721fSFande Kong }
1467c69f721fSFande Kong
1468a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixAssemble(hA->ij));
1469336664bdSPierre Jolivet /* The assembly routine destroys the aux_matrix, we recreate it here by calling HYPRE_IJMatrixInitialize */
1470336664bdSPierre Jolivet /* If the option MAT_SORTED_FULL is set to true, the indices and values can be passed to hypre directly, so we don't need the aux_matrix */
1471651b1cf9SStefano Zampini if (!A->sortedfull) {
1472af1cf968SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix;
1473af1cf968SStefano Zampini
1474af1cf968SStefano Zampini /* call destroy just to make sure we do not leak anything */
1475af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1476a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixDestroy(aux_matrix));
1477af1cf968SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL;
1478af1cf968SStefano Zampini
1479af1cf968SStefano Zampini /* Initialize with assembled flag -> it only recreates the aux_par_matrix */
1480a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
1481af1cf968SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
14826ea7df73SStefano Zampini if (aux_matrix) {
1483af1cf968SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 1; /* see comment in MatHYPRESetPreallocation_HYPRE */
148422235d61SPierre Jolivet #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1485a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize(aux_matrix));
148622235d61SPierre Jolivet #else
1487a333fa2bSZach Atkins PetscCallHYPRE(hypre_AuxParCSRMatrixInitialize_v2(aux_matrix, HYPRE_MEMORY_HOST));
148822235d61SPierre Jolivet #endif
1489af1cf968SStefano Zampini }
14906ea7df73SStefano Zampini }
14916ea7df73SStefano Zampini {
14926ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr;
14936ea7df73SStefano Zampini
1494a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)&parcsr));
1495a333fa2bSZach Atkins if (!hypre_ParCSRMatrixCommPkg(parcsr)) PetscCallHYPRE(hypre_MatvecCommPkgCreate(parcsr));
14966ea7df73SStefano Zampini }
14979566063dSJacob Faibussowitsch if (!hA->x) PetscCall(VecHYPRE_IJVectorCreate(A->cmap, &hA->x));
14989566063dSJacob Faibussowitsch if (!hA->b) PetscCall(VecHYPRE_IJVectorCreate(A->rmap, &hA->b));
14996ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
15009566063dSJacob Faibussowitsch PetscCall(MatBindToCPU_HYPRE(A, A->boundtocpu));
15016ea7df73SStefano Zampini #endif
15023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
150363c07aadSStefano Zampini }
150463c07aadSStefano Zampini
1505d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetArray_HYPRE(Mat A, PetscInt size, void **array)
1506d71ae5a4SJacob Faibussowitsch {
1507c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1508c69f721fSFande Kong
1509c69f721fSFande Kong PetscFunctionBegin;
1510651b1cf9SStefano Zampini PetscCheck(hA->array_available, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Temporary space is in use");
1511c69f721fSFande Kong
1512651b1cf9SStefano Zampini if (hA->array_size >= size) {
151339accc25SStefano Zampini *array = hA->array;
151439accc25SStefano Zampini } else {
15159566063dSJacob Faibussowitsch PetscCall(PetscFree(hA->array));
1516651b1cf9SStefano Zampini hA->array_size = size;
1517651b1cf9SStefano Zampini PetscCall(PetscMalloc(hA->array_size, &hA->array));
1518c69f721fSFande Kong *array = hA->array;
1519c69f721fSFande Kong }
1520c69f721fSFande Kong
1521651b1cf9SStefano Zampini hA->array_available = PETSC_FALSE;
15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1523c69f721fSFande Kong }
1524c69f721fSFande Kong
1525d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreArray_HYPRE(Mat A, void **array)
1526d71ae5a4SJacob Faibussowitsch {
1527c69f721fSFande Kong Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1528c69f721fSFande Kong
1529c69f721fSFande Kong PetscFunctionBegin;
1530c69f721fSFande Kong *array = NULL;
1531651b1cf9SStefano Zampini hA->array_available = PETSC_TRUE;
15323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1533c69f721fSFande Kong }
1534c69f721fSFande Kong
1535d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValues_HYPRE(Mat A, PetscInt nr, const PetscInt rows[], PetscInt nc, const PetscInt cols[], const PetscScalar v[], InsertMode ins)
1536d71ae5a4SJacob Faibussowitsch {
1537d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1538d975228cSstefano_zampini PetscScalar *vals = (PetscScalar *)v;
153939accc25SStefano Zampini HYPRE_Complex *sscr;
1540c69f721fSFande Kong PetscInt *cscr[2];
1541c69f721fSFande Kong PetscInt i, nzc;
1542651b1cf9SStefano Zampini PetscInt rst = A->rmap->rstart, ren = A->rmap->rend;
154308defe43SFande Kong void *array = NULL;
1544d975228cSstefano_zampini
1545d975228cSstefano_zampini PetscFunctionBegin;
15469566063dSJacob Faibussowitsch PetscCall(MatGetArray_HYPRE(A, sizeof(PetscInt) * (2 * nc) + sizeof(HYPRE_Complex) * nc * nr, &array));
1547c69f721fSFande Kong cscr[0] = (PetscInt *)array;
1548c69f721fSFande Kong cscr[1] = ((PetscInt *)array) + nc;
154939accc25SStefano Zampini sscr = (HYPRE_Complex *)(((PetscInt *)array) + nc * 2);
1550d975228cSstefano_zampini for (i = 0, nzc = 0; i < nc; i++) {
1551d975228cSstefano_zampini if (cols[i] >= 0) {
1552d975228cSstefano_zampini cscr[0][nzc] = cols[i];
1553d975228cSstefano_zampini cscr[1][nzc++] = i;
1554d975228cSstefano_zampini }
1555d975228cSstefano_zampini }
1556c69f721fSFande Kong if (!nzc) {
15579566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array));
15583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1559c69f721fSFande Kong }
1560d975228cSstefano_zampini
15616ea7df73SStefano Zampini #if 0 //defined(PETSC_HAVE_HYPRE_DEVICE)
15626ea7df73SStefano Zampini if (HYPRE_MEMORY_HOST != hypre_IJMatrixMemoryLocation(hA->ij)) {
15636ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr;
15646ea7df73SStefano Zampini
1565a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij,(void**)&parcsr));
1566a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixMigrate(parcsr, HYPRE_MEMORY_HOST));
15676ea7df73SStefano Zampini }
15686ea7df73SStefano Zampini #endif
15696ea7df73SStefano Zampini
1570d975228cSstefano_zampini if (ins == ADD_VALUES) {
1571d975228cSstefano_zampini for (i = 0; i < nr; i++) {
15726ea7df73SStefano Zampini if (rows[i] >= 0) {
1573d975228cSstefano_zampini PetscInt j;
15742cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc;
15752cf14000SStefano Zampini
1576651b1cf9SStefano Zampini if (!nzc) continue;
1577651b1cf9SStefano Zampini /* nonlocal values */
1578651b1cf9SStefano Zampini if (rows[i] < rst || rows[i] >= ren) {
1579651b1cf9SStefano Zampini PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]);
1580651b1cf9SStefano Zampini if (hA->donotstash) continue;
1581651b1cf9SStefano Zampini }
1582aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
15839566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1584a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixAddToValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr));
1585d975228cSstefano_zampini }
1586d975228cSstefano_zampini vals += nc;
1587d975228cSstefano_zampini }
1588d975228cSstefano_zampini } else { /* INSERT_VALUES */
1589d975228cSstefano_zampini for (i = 0; i < nr; i++) {
15906ea7df73SStefano Zampini if (rows[i] >= 0) {
1591d975228cSstefano_zampini PetscInt j;
15922cf14000SStefano Zampini HYPRE_Int hnc = (HYPRE_Int)nzc;
15932cf14000SStefano Zampini
1594651b1cf9SStefano Zampini if (!nzc) continue;
1595aed4548fSBarry Smith PetscCheck((PetscInt)hnc == nzc, PETSC_COMM_SELF, PETSC_ERR_SUP, "Hypre overflow! number of columns %" PetscInt_FMT " for row %" PetscInt_FMT, nzc, rows[i]);
15969566063dSJacob Faibussowitsch for (j = 0; j < nzc; j++) PetscCall(PetscHYPREScalarCast(vals[cscr[1][j]], &sscr[j]));
1597c69f721fSFande Kong /* nonlocal values */
1598651b1cf9SStefano Zampini if (rows[i] < rst || rows[i] >= ren) {
1599651b1cf9SStefano Zampini PetscCheck(!A->nooffprocentries, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Setting off process row %" PetscInt_FMT " even though MatSetOption(,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE) was set", rows[i]);
1600651b1cf9SStefano Zampini if (!hA->donotstash) PetscCall(MatStashValuesRow_Private(&A->stash, rows[i], nzc, cscr[0], (PetscScalar *)sscr, PETSC_FALSE));
1601651b1cf9SStefano Zampini }
1602c69f721fSFande Kong /* local values */
1603651b1cf9SStefano Zampini else
1604a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetValues(hA->ij, 1, &hnc, (HYPRE_BigInt *)(rows + i), (HYPRE_BigInt *)cscr[0], sscr));
1605d975228cSstefano_zampini }
1606d975228cSstefano_zampini vals += nc;
1607d975228cSstefano_zampini }
1608d975228cSstefano_zampini }
1609c69f721fSFande Kong
16109566063dSJacob Faibussowitsch PetscCall(MatRestoreArray_HYPRE(A, &array));
16113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1612d975228cSstefano_zampini }
1613d975228cSstefano_zampini
1614d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPRESetPreallocation_HYPRE(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1615d71ae5a4SJacob Faibussowitsch {
1616d975228cSstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
16177d968826Sstefano_zampini HYPRE_Int *hdnnz, *honnz;
161806a29025Sstefano_zampini PetscInt i, rs, re, cs, ce, bs;
1619d975228cSstefano_zampini PetscMPIInt size;
1620d975228cSstefano_zampini
1621d975228cSstefano_zampini PetscFunctionBegin;
16229566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap));
16239566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap));
1624d975228cSstefano_zampini rs = A->rmap->rstart;
1625d975228cSstefano_zampini re = A->rmap->rend;
1626d975228cSstefano_zampini cs = A->cmap->rstart;
1627d975228cSstefano_zampini ce = A->cmap->rend;
1628d975228cSstefano_zampini if (!hA->ij) {
1629a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rs, re - 1, cs, ce - 1, &hA->ij));
1630a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
1631d975228cSstefano_zampini } else {
16322cf14000SStefano Zampini HYPRE_BigInt hrs, hre, hcs, hce;
1633a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetLocalRange(hA->ij, &hrs, &hre, &hcs, &hce));
1634aed4548fSBarry Smith PetscCheck(hre - hrs + 1 == re - rs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local rows: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hrs, hre + 1, rs, re);
1635aed4548fSBarry Smith PetscCheck(hce - hcs + 1 == ce - cs, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Inconsistent local cols: IJMatrix [%" PetscHYPRE_BigInt_FMT ",%" PetscHYPRE_BigInt_FMT "), PETSc [%" PetscInt_FMT ",%" PetscInt_FMT ")", hcs, hce + 1, cs, ce);
1636d975228cSstefano_zampini }
163706977982Sstefanozampini PetscCall(MatHYPRE_DestroyCOOMat(A));
16389566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs));
163906a29025Sstefano_zampini if (dnz == PETSC_DEFAULT || dnz == PETSC_DECIDE) dnz = 10 * bs;
164006a29025Sstefano_zampini if (onz == PETSC_DEFAULT || onz == PETSC_DECIDE) onz = 10 * bs;
164106a29025Sstefano_zampini
1642d975228cSstefano_zampini if (!dnnz) {
16439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &hdnnz));
1644f2f41e48SZach Atkins for (i = 0; i < A->rmap->n; i++) hdnnz[i] = (HYPRE_Int)dnz;
1645d975228cSstefano_zampini } else {
16467d968826Sstefano_zampini hdnnz = (HYPRE_Int *)dnnz;
1647d975228cSstefano_zampini }
16489566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size));
1649d975228cSstefano_zampini if (size > 1) {
1650ddbeb582SStefano Zampini hypre_AuxParCSRMatrix *aux_matrix;
1651d975228cSstefano_zampini if (!onnz) {
16529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &honnz));
1653f2f41e48SZach Atkins for (i = 0; i < A->rmap->n; i++) honnz[i] = (HYPRE_Int)onz;
165422235d61SPierre Jolivet } else honnz = (HYPRE_Int *)onnz;
1655ddbeb582SStefano Zampini /* SetDiagOffdSizes sets hypre_AuxParCSRMatrixNeedAux(aux_matrix) = 0, since it seems
1656ddbeb582SStefano Zampini they assume the user will input the entire row values, properly sorted
1657336664bdSPierre Jolivet In PETSc, we don't make such an assumption and set this flag to 1,
1658336664bdSPierre Jolivet unless the option MAT_SORTED_FULL is set to true.
1659ddbeb582SStefano Zampini Also, to avoid possible memory leaks, we destroy and recreate the translator
1660ddbeb582SStefano Zampini This has to be done here, as HYPRE_IJMatrixInitialize will properly initialize
1661ddbeb582SStefano Zampini the IJ matrix for us */
1662ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1663ddbeb582SStefano Zampini hypre_AuxParCSRMatrixDestroy(aux_matrix);
1664ddbeb582SStefano Zampini hypre_IJMatrixTranslator(hA->ij) = NULL;
1665a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetDiagOffdSizes(hA->ij, hdnnz, honnz));
1666ddbeb582SStefano Zampini aux_matrix = (hypre_AuxParCSRMatrix *)hypre_IJMatrixTranslator(hA->ij);
1667651b1cf9SStefano Zampini hypre_AuxParCSRMatrixNeedAux(aux_matrix) = !A->sortedfull;
1668d975228cSstefano_zampini } else {
1669d975228cSstefano_zampini honnz = NULL;
1670a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetRowSizes(hA->ij, hdnnz));
1671d975228cSstefano_zampini }
1672ddbeb582SStefano Zampini
1673af1cf968SStefano Zampini /* reset assembled flag and call the initialize method */
1674af1cf968SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 0;
16756ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
1676a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
16776ea7df73SStefano Zampini #else
1678a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize_v2(hA->ij, HYPRE_MEMORY_HOST));
16796ea7df73SStefano Zampini #endif
168048a46eb9SPierre Jolivet if (!dnnz) PetscCall(PetscFree(hdnnz));
168148a46eb9SPierre Jolivet if (!onnz && honnz) PetscCall(PetscFree(honnz));
1682af1cf968SStefano Zampini /* Match AIJ logic */
168306a29025Sstefano_zampini A->preallocated = PETSC_TRUE;
1684af1cf968SStefano Zampini A->assembled = PETSC_FALSE;
16853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1686d975228cSstefano_zampini }
1687d975228cSstefano_zampini
1688d975228cSstefano_zampini /*@C
1689d975228cSstefano_zampini MatHYPRESetPreallocation - Preallocates memory for a sparse parallel matrix in HYPRE IJ format
1690d975228cSstefano_zampini
1691c3339decSBarry Smith Collective
1692d975228cSstefano_zampini
1693d975228cSstefano_zampini Input Parameters:
1694d975228cSstefano_zampini + A - the matrix
1695d975228cSstefano_zampini . dnz - number of nonzeros per row in DIAGONAL portion of local submatrix
1696d975228cSstefano_zampini (same value is used for all local rows)
1697d975228cSstefano_zampini . dnnz - array containing the number of nonzeros in the various rows of the
1698d975228cSstefano_zampini DIAGONAL portion of the local submatrix (possibly different for each row)
16992ef1f0ffSBarry Smith or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `d_nz` is used to specify the nonzero structure.
17002ef1f0ffSBarry Smith The size of this array is equal to the number of local rows, i.e `m`.
1701d975228cSstefano_zampini For matrices that will be factored, you must leave room for (and set)
1702d975228cSstefano_zampini the diagonal entry even if it is zero.
1703d975228cSstefano_zampini . onz - number of nonzeros per row in the OFF-DIAGONAL portion of local
1704d975228cSstefano_zampini submatrix (same value is used for all local rows).
1705d975228cSstefano_zampini - onnz - array containing the number of nonzeros in the various rows of the
1706d975228cSstefano_zampini OFF-DIAGONAL portion of the local submatrix (possibly different for
17072ef1f0ffSBarry Smith each row) or `NULL` (`PETSC_NULL_INTEGER` in Fortran), if `o_nz` is used to specify the nonzero
1708d975228cSstefano_zampini structure. The size of this array is equal to the number
17092ef1f0ffSBarry Smith of local rows, i.e `m`.
1710d975228cSstefano_zampini
17112fe279fdSBarry Smith Level: intermediate
17122fe279fdSBarry Smith
171311a5261eSBarry Smith Note:
17142ef1f0ffSBarry Smith If the *nnz parameter is given then the *nz parameter is ignored; for sequential matrices, `onz` and `onnz` are ignored.
1715d975228cSstefano_zampini
17161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatMPIAIJSetPreallocation()`, `MATHYPRE`, `MATAIJ`
1717d975228cSstefano_zampini @*/
1718d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPRESetPreallocation(Mat A, PetscInt dnz, const PetscInt dnnz[], PetscInt onz, const PetscInt onnz[])
1719d71ae5a4SJacob Faibussowitsch {
1720d975228cSstefano_zampini PetscFunctionBegin;
1721d975228cSstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1722d975228cSstefano_zampini PetscValidType(A, 1);
1723cac4c232SBarry Smith PetscTryMethod(A, "MatHYPRESetPreallocation_C", (Mat, PetscInt, const PetscInt[], PetscInt, const PetscInt[]), (A, dnz, dnnz, onz, onnz));
17243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1725d975228cSstefano_zampini }
1726d975228cSstefano_zampini
172720f4b53cSBarry Smith /*@C
17282ef1f0ffSBarry Smith MatCreateFromParCSR - Creates a `Mat` from a `hypre_ParCSRMatrix`
1729225daaf8SStefano Zampini
1730225daaf8SStefano Zampini Collective
1731225daaf8SStefano Zampini
1732225daaf8SStefano Zampini Input Parameters:
17332ef1f0ffSBarry Smith + parcsr - the pointer to the `hypre_ParCSRMatrix`
17342ef1f0ffSBarry Smith . mtype - matrix type to be created. Currently `MATAIJ`, `MATIS` and `MATHYPRE` are supported.
173520f4b53cSBarry Smith - copymode - PETSc copying options, see `PetscCopyMode`
1736225daaf8SStefano Zampini
1737225daaf8SStefano Zampini Output Parameter:
1738225daaf8SStefano Zampini . A - the matrix
1739225daaf8SStefano Zampini
1740225daaf8SStefano Zampini Level: intermediate
1741225daaf8SStefano Zampini
1742bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode`
174320f4b53cSBarry Smith @*/
1744d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreateFromParCSR(hypre_ParCSRMatrix *parcsr, MatType mtype, PetscCopyMode copymode, Mat *A)
1745d71ae5a4SJacob Faibussowitsch {
1746225daaf8SStefano Zampini Mat T;
1747978814f1SStefano Zampini Mat_HYPRE *hA;
1748978814f1SStefano Zampini MPI_Comm comm;
1749978814f1SStefano Zampini PetscInt rstart, rend, cstart, cend, M, N;
1750d248a85cSRichard Tran Mills PetscBool isseqaij, isseqaijmkl, ismpiaij, isaij, ishyp, isis;
1751978814f1SStefano Zampini
1752978814f1SStefano Zampini PetscFunctionBegin;
1753978814f1SStefano Zampini comm = hypre_ParCSRMatrixComm(parcsr);
17549566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJ, &isseqaij));
17559566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATSEQAIJMKL, &isseqaijmkl));
17569566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATMPIAIJ, &ismpiaij));
17579566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATAIJ, &isaij));
17589566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATHYPRE, &ishyp));
17599566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(mtype, MATIS, &isis));
1760d248a85cSRichard Tran Mills isaij = (PetscBool)(isseqaij || isseqaijmkl || ismpiaij || isaij);
17616ea7df73SStefano Zampini /* TODO */
1762aed4548fSBarry Smith PetscCheck(isaij || ishyp || isis, comm, PETSC_ERR_SUP, "Unsupported MatType %s! Supported types are %s, %s, %s, %s, %s, and %s", mtype, MATAIJ, MATSEQAIJ, MATSEQAIJMKL, MATMPIAIJ, MATIS, MATHYPRE);
1763978814f1SStefano Zampini /* access ParCSRMatrix */
1764978814f1SStefano Zampini rstart = hypre_ParCSRMatrixFirstRowIndex(parcsr);
1765978814f1SStefano Zampini rend = hypre_ParCSRMatrixLastRowIndex(parcsr);
1766978814f1SStefano Zampini cstart = hypre_ParCSRMatrixFirstColDiag(parcsr);
1767978814f1SStefano Zampini cend = hypre_ParCSRMatrixLastColDiag(parcsr);
1768978814f1SStefano Zampini M = hypre_ParCSRMatrixGlobalNumRows(parcsr);
1769978814f1SStefano Zampini N = hypre_ParCSRMatrixGlobalNumCols(parcsr);
1770978814f1SStefano Zampini
1771978814f1SStefano Zampini /* create PETSc matrix with MatHYPRE */
17729566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &T));
1773c2886e86SStefano Zampini PetscCall(MatSetSizes(T, PetscMax(rend - rstart + 1, 0), PetscMax(cend - cstart + 1, 0), M, N));
17749566063dSJacob Faibussowitsch PetscCall(MatSetType(T, MATHYPRE));
1775f4f49eeaSPierre Jolivet hA = (Mat_HYPRE *)T->data;
1776978814f1SStefano Zampini
1777978814f1SStefano Zampini /* create HYPRE_IJMatrix */
1778a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixCreate(hA->comm, rstart, rend, cstart, cend, &hA->ij));
1779a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetObjectType(hA->ij, HYPRE_PARCSR));
178045b8d346SStefano Zampini
178145b8d346SStefano Zampini /* create new ParCSR object if needed */
178245b8d346SStefano Zampini if (ishyp && copymode == PETSC_COPY_VALUES) {
178345b8d346SStefano Zampini hypre_ParCSRMatrix *new_parcsr;
17846ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 18, 0)
178545b8d346SStefano Zampini hypre_CSRMatrix *hdiag, *hoffd, *ndiag, *noffd;
178645b8d346SStefano Zampini
17870e6427aaSSatish Balay new_parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
178845b8d346SStefano Zampini hdiag = hypre_ParCSRMatrixDiag(parcsr);
178945b8d346SStefano Zampini hoffd = hypre_ParCSRMatrixOffd(parcsr);
179045b8d346SStefano Zampini ndiag = hypre_ParCSRMatrixDiag(new_parcsr);
179145b8d346SStefano Zampini noffd = hypre_ParCSRMatrixOffd(new_parcsr);
17929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(ndiag), hypre_CSRMatrixData(hdiag), hypre_CSRMatrixNumNonzeros(hdiag)));
17939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(hypre_CSRMatrixData(noffd), hypre_CSRMatrixData(hoffd), hypre_CSRMatrixNumNonzeros(hoffd)));
17946ea7df73SStefano Zampini #else
17956ea7df73SStefano Zampini new_parcsr = hypre_ParCSRMatrixClone(parcsr, 1);
17966ea7df73SStefano Zampini #endif
179745b8d346SStefano Zampini parcsr = new_parcsr;
179845b8d346SStefano Zampini copymode = PETSC_OWN_POINTER;
179945b8d346SStefano Zampini }
1800978814f1SStefano Zampini
1801978814f1SStefano Zampini /* set ParCSR object */
1802978814f1SStefano Zampini hypre_IJMatrixObject(hA->ij) = parcsr;
18034ec6421dSstefano_zampini T->preallocated = PETSC_TRUE;
1804978814f1SStefano Zampini
1805978814f1SStefano Zampini /* set assembled flag */
1806978814f1SStefano Zampini hypre_IJMatrixAssembleFlag(hA->ij) = 1;
18076ea7df73SStefano Zampini #if 0
1808a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixInitialize(hA->ij));
18096ea7df73SStefano Zampini #endif
1810225daaf8SStefano Zampini if (ishyp) {
18116d2a658fSstefano_zampini PetscMPIInt myid = 0;
18126d2a658fSstefano_zampini
18136d2a658fSstefano_zampini /* make sure we always have row_starts and col_starts available */
181448a46eb9SPierre Jolivet if (HYPRE_AssumedPartitionCheck()) PetscCallMPI(MPI_Comm_rank(comm, &myid));
1815a1d2239cSSatish Balay #if defined(hypre_ParCSRMatrixOwnsRowStarts)
18166d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsColStarts(parcsr)) {
18176d2a658fSstefano_zampini PetscLayout map;
18186d2a658fSstefano_zampini
18199566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, NULL, &map));
18209566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map));
18212cf14000SStefano Zampini hypre_ParCSRMatrixColStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
18226d2a658fSstefano_zampini }
18236d2a658fSstefano_zampini if (!hypre_ParCSRMatrixOwnsRowStarts(parcsr)) {
18246d2a658fSstefano_zampini PetscLayout map;
18256d2a658fSstefano_zampini
18269566063dSJacob Faibussowitsch PetscCall(MatGetLayouts(T, &map, NULL));
18279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map));
18282cf14000SStefano Zampini hypre_ParCSRMatrixRowStarts(parcsr) = (HYPRE_BigInt *)(map->range + myid);
18296d2a658fSstefano_zampini }
1830a1d2239cSSatish Balay #endif
1831978814f1SStefano Zampini /* prevent from freeing the pointer */
1832978814f1SStefano Zampini if (copymode == PETSC_USE_POINTER) hA->inner_free = PETSC_FALSE;
1833225daaf8SStefano Zampini *A = T;
18349566063dSJacob Faibussowitsch PetscCall(MatSetOption(*A, MAT_SORTED_FULL, PETSC_TRUE));
18359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*A, MAT_FINAL_ASSEMBLY));
18369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*A, MAT_FINAL_ASSEMBLY));
1837bb4689ddSStefano Zampini } else if (isaij) {
1838bb4689ddSStefano Zampini if (copymode != PETSC_OWN_POINTER) {
1839225daaf8SStefano Zampini /* prevent from freeing the pointer */
1840225daaf8SStefano Zampini hA->inner_free = PETSC_FALSE;
18419566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INITIAL_MATRIX, A));
18429566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T));
1843225daaf8SStefano Zampini } else { /* AIJ return type with PETSC_OWN_POINTER */
18449566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_AIJ(T, MATAIJ, MAT_INPLACE_MATRIX, &T));
1845225daaf8SStefano Zampini *A = T;
1846225daaf8SStefano Zampini }
1847bb4689ddSStefano Zampini } else if (isis) {
18489566063dSJacob Faibussowitsch PetscCall(MatConvert_HYPRE_IS(T, MATIS, MAT_INITIAL_MATRIX, A));
18498cfe8d00SStefano Zampini if (copymode != PETSC_OWN_POINTER) hA->inner_free = PETSC_FALSE;
18509566063dSJacob Faibussowitsch PetscCall(MatDestroy(&T));
1851bb4689ddSStefano Zampini }
18523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1853978814f1SStefano Zampini }
1854978814f1SStefano Zampini
1855d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatHYPREGetParCSR_HYPRE(Mat A, hypre_ParCSRMatrix **parcsr)
1856d71ae5a4SJacob Faibussowitsch {
1857dd9c0a25Sstefano_zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
1858dd9c0a25Sstefano_zampini HYPRE_Int type;
1859dd9c0a25Sstefano_zampini
1860dd9c0a25Sstefano_zampini PetscFunctionBegin;
186128b400f6SJacob Faibussowitsch PetscCheck(hA->ij, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "HYPRE_IJMatrix not present");
1862a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObjectType(hA->ij, &type));
186308401ef6SPierre Jolivet PetscCheck(type == HYPRE_PARCSR, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "HYPRE_IJMatrix is not of type HYPRE_PARCSR");
1864a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetObject(hA->ij, (void **)parcsr));
18653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1866dd9c0a25Sstefano_zampini }
1867dd9c0a25Sstefano_zampini
186820f4b53cSBarry Smith /*@C
1869dd9c0a25Sstefano_zampini MatHYPREGetParCSR - Gets the pointer to the ParCSR matrix
1870dd9c0a25Sstefano_zampini
1871cc4c1da9SBarry Smith Not Collective, No Fortran Support
1872dd9c0a25Sstefano_zampini
187320f4b53cSBarry Smith Input Parameter:
187420f4b53cSBarry Smith . A - the `MATHYPRE` object
1875dd9c0a25Sstefano_zampini
1876dd9c0a25Sstefano_zampini Output Parameter:
18772ef1f0ffSBarry Smith . parcsr - the pointer to the `hypre_ParCSRMatrix`
1878dd9c0a25Sstefano_zampini
1879dd9c0a25Sstefano_zampini Level: intermediate
1880dd9c0a25Sstefano_zampini
1881bfe80ac4SPierre Jolivet .seealso: [](ch_matrices), `Mat`, `MATHYPRE`, `PetscCopyMode`
188220f4b53cSBarry Smith @*/
1883d71ae5a4SJacob Faibussowitsch PetscErrorCode MatHYPREGetParCSR(Mat A, hypre_ParCSRMatrix **parcsr)
1884d71ae5a4SJacob Faibussowitsch {
1885dd9c0a25Sstefano_zampini PetscFunctionBegin;
1886dd9c0a25Sstefano_zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
1887dd9c0a25Sstefano_zampini PetscValidType(A, 1);
1888cac4c232SBarry Smith PetscUseMethod(A, "MatHYPREGetParCSR_C", (Mat, hypre_ParCSRMatrix **), (A, parcsr));
18893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1890dd9c0a25Sstefano_zampini }
1891dd9c0a25Sstefano_zampini
1892d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_HYPRE(Mat A, PetscScalar s)
1893d71ae5a4SJacob Faibussowitsch {
189468ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr;
18956ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_LT(2, 19, 0)
189668ec7858SStefano Zampini hypre_CSRMatrix *ha;
18976ea7df73SStefano Zampini #endif
189839accc25SStefano Zampini HYPRE_Complex hs;
189968ec7858SStefano Zampini
190068ec7858SStefano Zampini PetscFunctionBegin;
19019566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(s, &hs));
19029566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
19036ea7df73SStefano Zampini #if PETSC_PKG_HYPRE_VERSION_GE(2, 19, 0)
1904a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixScale(parcsr, hs));
19056ea7df73SStefano Zampini #else /* diagonal part */
190668ec7858SStefano Zampini ha = hypre_ParCSRMatrixDiag(parcsr);
190768ec7858SStefano Zampini if (ha) {
190868299464SStefano Zampini PetscInt size, i;
190968299464SStefano Zampini HYPRE_Int *ii;
191039accc25SStefano Zampini HYPRE_Complex *a;
191168ec7858SStefano Zampini
191268ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha);
191368ec7858SStefano Zampini a = hypre_CSRMatrixData(ha);
191468ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha);
191539accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs;
191668ec7858SStefano Zampini }
19174cf0e950SBarry Smith /* off-diagonal part */
191868ec7858SStefano Zampini ha = hypre_ParCSRMatrixOffd(parcsr);
191968ec7858SStefano Zampini if (ha) {
192068299464SStefano Zampini PetscInt size, i;
192168299464SStefano Zampini HYPRE_Int *ii;
192239accc25SStefano Zampini HYPRE_Complex *a;
192368ec7858SStefano Zampini
192468ec7858SStefano Zampini size = hypre_CSRMatrixNumRows(ha);
192568ec7858SStefano Zampini a = hypre_CSRMatrixData(ha);
192668ec7858SStefano Zampini ii = hypre_CSRMatrixI(ha);
192739accc25SStefano Zampini for (i = 0; i < ii[size]; i++) a[i] *= hs;
192868ec7858SStefano Zampini }
19296ea7df73SStefano Zampini #endif
19303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
193168ec7858SStefano Zampini }
193268ec7858SStefano Zampini
1933d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_HYPRE(Mat A, PetscInt numRows, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
1934d71ae5a4SJacob Faibussowitsch {
193568ec7858SStefano Zampini hypre_ParCSRMatrix *parcsr;
193668299464SStefano Zampini HYPRE_Int *lrows;
193768299464SStefano Zampini PetscInt rst, ren, i;
193868ec7858SStefano Zampini
193968ec7858SStefano Zampini PetscFunctionBegin;
194008401ef6SPierre Jolivet PetscCheck(!x && !b, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "To be implemented");
19419566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
19429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(numRows, &lrows));
19439566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rst, &ren));
194468ec7858SStefano Zampini for (i = 0; i < numRows; i++) {
19457a46b595SBarry Smith PetscCheck(rows[i] >= rst && rows[i] < ren, PETSC_COMM_SELF, PETSC_ERR_SUP, "Non-local rows not yet supported");
1946f2f41e48SZach Atkins lrows[i] = (HYPRE_Int)(rows[i] - rst);
194768ec7858SStefano Zampini }
1948f2f41e48SZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixEliminateRowsCols(parcsr, (HYPRE_Int)numRows, lrows));
19499566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows));
19503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
195168ec7858SStefano Zampini }
195268ec7858SStefano Zampini
1953d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE_CSRMatrix(hypre_CSRMatrix *ha)
1954d71ae5a4SJacob Faibussowitsch {
1955c69f721fSFande Kong PetscFunctionBegin;
1956c69f721fSFande Kong if (ha) {
1957c69f721fSFande Kong HYPRE_Int *ii, size;
1958c69f721fSFande Kong HYPRE_Complex *a;
1959c69f721fSFande Kong
1960c69f721fSFande Kong size = hypre_CSRMatrixNumRows(ha);
1961c69f721fSFande Kong a = hypre_CSRMatrixData(ha);
1962c69f721fSFande Kong ii = hypre_CSRMatrixI(ha);
1963c69f721fSFande Kong
19649566063dSJacob Faibussowitsch if (a) PetscCall(PetscArrayzero(a, ii[size]));
1965c69f721fSFande Kong }
19663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1967c69f721fSFande Kong }
1968c69f721fSFande Kong
196966976f2fSJacob Faibussowitsch static PetscErrorCode MatZeroEntries_HYPRE(Mat A)
1970d71ae5a4SJacob Faibussowitsch {
19716ea7df73SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
19726ea7df73SStefano Zampini
19736ea7df73SStefano Zampini PetscFunctionBegin;
19746ea7df73SStefano Zampini if (HYPRE_MEMORY_DEVICE == hypre_IJMatrixMemoryLocation(hA->ij)) {
1975a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixSetConstantValues(hA->ij, 0.0));
19766ea7df73SStefano Zampini } else {
1977c69f721fSFande Kong hypre_ParCSRMatrix *parcsr;
1978c69f721fSFande Kong
19799566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
19809566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr)));
19819566063dSJacob Faibussowitsch PetscCall(MatZeroEntries_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr)));
19826ea7df73SStefano Zampini }
19833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1984c69f721fSFande Kong }
1985c69f721fSFande Kong
1986d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE_CSRMatrix(hypre_CSRMatrix *hA, PetscInt N, const PetscInt rows[], HYPRE_Complex diag)
1987d71ae5a4SJacob Faibussowitsch {
198839accc25SStefano Zampini PetscInt ii;
198939accc25SStefano Zampini HYPRE_Int *i, *j;
199039accc25SStefano Zampini HYPRE_Complex *a;
1991c69f721fSFande Kong
1992c69f721fSFande Kong PetscFunctionBegin;
19933ba16761SJacob Faibussowitsch if (!hA) PetscFunctionReturn(PETSC_SUCCESS);
1994c69f721fSFande Kong
199539accc25SStefano Zampini i = hypre_CSRMatrixI(hA);
199639accc25SStefano Zampini j = hypre_CSRMatrixJ(hA);
1997c69f721fSFande Kong a = hypre_CSRMatrixData(hA);
1998a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE)
1999a32e9c99SJunchao Zhang if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hA)) {
2000a32e9c99SJunchao Zhang #if defined(HYPRE_USING_CUDA)
2001cdd1b302SZach Atkins PetscCall(MatZeroRows_CUDA(N, rows, i, j, a, diag));
2002a32e9c99SJunchao Zhang #elif defined(HYPRE_USING_HIP)
2003cdd1b302SZach Atkins PetscCall(MatZeroRows_HIP(N, rows, i, j, a, diag));
2004a32e9c99SJunchao Zhang #elif defined(PETSC_HAVE_KOKKOS)
2005cdd1b302SZach Atkins PetscCall(MatZeroRows_Kokkos(N, rows, i, j, a, diag));
2006a32e9c99SJunchao Zhang #else
2007a32e9c99SJunchao Zhang SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for MatZeroRows on a hypre matrix in this memory location");
2008a32e9c99SJunchao Zhang #endif
2009a32e9c99SJunchao Zhang } else
2010a32e9c99SJunchao Zhang #endif
2011a32e9c99SJunchao Zhang {
2012c69f721fSFande Kong for (ii = 0; ii < N; ii++) {
201339accc25SStefano Zampini HYPRE_Int jj, ibeg, iend, irow;
201439accc25SStefano Zampini
2015f2f41e48SZach Atkins irow = (HYPRE_Int)rows[ii];
2016c69f721fSFande Kong ibeg = i[irow];
2017c69f721fSFande Kong iend = i[irow + 1];
2018c69f721fSFande Kong for (jj = ibeg; jj < iend; jj++)
2019c69f721fSFande Kong if (j[jj] == irow) a[jj] = diag;
2020c69f721fSFande Kong else a[jj] = 0.0;
2021c69f721fSFande Kong }
2022a32e9c99SJunchao Zhang }
20233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2024c69f721fSFande Kong }
2025c69f721fSFande Kong
2026d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroRows_HYPRE(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2027d71ae5a4SJacob Faibussowitsch {
2028c69f721fSFande Kong hypre_ParCSRMatrix *parcsr;
2029a32e9c99SJunchao Zhang PetscInt *lrows, len, *lrows2;
203039accc25SStefano Zampini HYPRE_Complex hdiag;
2031c69f721fSFande Kong
2032c69f721fSFande Kong PetscFunctionBegin;
203308401ef6SPierre Jolivet PetscCheck(!x && !b, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Does not support to modify the solution and the right hand size");
20349566063dSJacob Faibussowitsch PetscCall(PetscHYPREScalarCast(diag, &hdiag));
2035c69f721fSFande Kong /* retrieve the internal matrix */
20369566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2037c69f721fSFande Kong /* get locally owned rows */
20389566063dSJacob Faibussowitsch PetscCall(MatZeroRowsMapLocal_Private(A, N, rows, &len, &lrows));
2039a32e9c99SJunchao Zhang
2040a32e9c99SJunchao Zhang #if defined(PETSC_HAVE_HYPRE_DEVICE)
2041a32e9c99SJunchao Zhang if (HYPRE_MEMORY_DEVICE == hypre_CSRMatrixMemoryLocation(hypre_ParCSRMatrixDiag(parcsr))) {
2042a32e9c99SJunchao Zhang Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2043a32e9c99SJunchao Zhang PetscInt m;
2044a32e9c99SJunchao Zhang PetscCall(MatGetLocalSize(A, &m, NULL));
2045a32e9c99SJunchao Zhang if (!hA->rows_d) {
2046a32e9c99SJunchao Zhang hA->rows_d = hypre_TAlloc(PetscInt, m, HYPRE_MEMORY_DEVICE);
2047a32e9c99SJunchao Zhang if (m) PetscCheck(hA->rows_d, PETSC_COMM_SELF, PETSC_ERR_MEM, "HYPRE_TAlloc failed");
2048a32e9c99SJunchao Zhang }
2049a32e9c99SJunchao Zhang PetscCheck(len <= m, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Too many rows in rows[]");
2050a32e9c99SJunchao Zhang PetscStackCallExternalVoid("hypre_Memcpy", hypre_Memcpy(hA->rows_d, lrows, sizeof(PetscInt) * len, HYPRE_MEMORY_DEVICE, HYPRE_MEMORY_HOST));
2051a32e9c99SJunchao Zhang lrows2 = hA->rows_d;
2052a32e9c99SJunchao Zhang } else
2053a32e9c99SJunchao Zhang #endif
2054a32e9c99SJunchao Zhang {
2055a32e9c99SJunchao Zhang lrows2 = lrows;
2056a32e9c99SJunchao Zhang }
2057a32e9c99SJunchao Zhang
2058c69f721fSFande Kong /* zero diagonal part */
2059a32e9c99SJunchao Zhang PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixDiag(parcsr), len, lrows2, hdiag));
2060c69f721fSFande Kong /* zero off-diagonal part */
2061a32e9c99SJunchao Zhang PetscCall(MatZeroRows_HYPRE_CSRMatrix(hypre_ParCSRMatrixOffd(parcsr), len, lrows2, 0.0));
2062c69f721fSFande Kong
20639566063dSJacob Faibussowitsch PetscCall(PetscFree(lrows));
20643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2065c69f721fSFande Kong }
2066c69f721fSFande Kong
2067d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_HYPRE(Mat mat, MatAssemblyType mode)
2068d71ae5a4SJacob Faibussowitsch {
2069c69f721fSFande Kong PetscFunctionBegin;
20703ba16761SJacob Faibussowitsch if (mat->nooffprocentries) PetscFunctionReturn(PETSC_SUCCESS);
2071c69f721fSFande Kong
20729566063dSJacob Faibussowitsch PetscCall(MatStashScatterBegin_Private(mat, &mat->stash, mat->rmap->range));
20733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2074c69f721fSFande Kong }
2075c69f721fSFande Kong
2076d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2077d71ae5a4SJacob Faibussowitsch {
2078c69f721fSFande Kong hypre_ParCSRMatrix *parcsr;
20792cf14000SStefano Zampini HYPRE_Int hnz;
2080c69f721fSFande Kong
2081c69f721fSFande Kong PetscFunctionBegin;
2082c69f721fSFande Kong /* retrieve the internal matrix */
20839566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2084c69f721fSFande Kong /* call HYPRE API */
2085a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_ParCSRMatrixGetRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v));
20862cf14000SStefano Zampini if (nz) *nz = (PetscInt)hnz;
20873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2088c69f721fSFande Kong }
2089c69f721fSFande Kong
2090d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRow_HYPRE(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2091d71ae5a4SJacob Faibussowitsch {
2092c69f721fSFande Kong hypre_ParCSRMatrix *parcsr;
20932cf14000SStefano Zampini HYPRE_Int hnz;
2094c69f721fSFande Kong
2095c69f721fSFande Kong PetscFunctionBegin;
2096c69f721fSFande Kong /* retrieve the internal matrix */
20979566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
2098c69f721fSFande Kong /* call HYPRE API */
20992cf14000SStefano Zampini hnz = nz ? (HYPRE_Int)(*nz) : 0;
2100a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_ParCSRMatrixRestoreRow(parcsr, row, &hnz, (HYPRE_BigInt **)idx, (HYPRE_Complex **)v));
21013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2102c69f721fSFande Kong }
2103c69f721fSFande Kong
2104d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetValues_HYPRE(Mat A, PetscInt m, const PetscInt idxm[], PetscInt n, const PetscInt idxn[], PetscScalar v[])
2105d71ae5a4SJacob Faibussowitsch {
210645b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2107c69f721fSFande Kong PetscInt i;
21081d4906efSStefano Zampini
2109c69f721fSFande Kong PetscFunctionBegin;
21103ba16761SJacob Faibussowitsch if (!m || !n) PetscFunctionReturn(PETSC_SUCCESS);
2111c69f721fSFande Kong /* Ignore negative row indices
2112c69f721fSFande Kong * And negative column indices should be automatically ignored in hypre
2113c69f721fSFande Kong * */
21142cf14000SStefano Zampini for (i = 0; i < m; i++) {
21152cf14000SStefano Zampini if (idxm[i] >= 0) {
21162cf14000SStefano Zampini HYPRE_Int hn = (HYPRE_Int)n;
2117a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixGetValues(hA->ij, 1, &hn, (HYPRE_BigInt *)&idxm[i], (HYPRE_BigInt *)idxn, (HYPRE_Complex *)(v + i * n)));
21182cf14000SStefano Zampini }
21192cf14000SStefano Zampini }
21203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2121c69f721fSFande Kong }
2122c69f721fSFande Kong
2123d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetOption_HYPRE(Mat A, MatOption op, PetscBool flg)
2124d71ae5a4SJacob Faibussowitsch {
2125ddbeb582SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
2126ddbeb582SStefano Zampini
2127ddbeb582SStefano Zampini PetscFunctionBegin;
2128c6698e78SStefano Zampini switch (op) {
2129ddbeb582SStefano Zampini case MAT_NO_OFF_PROC_ENTRIES:
2130a333fa2bSZach Atkins if (flg) PetscCallHYPRE(HYPRE_IJMatrixSetMaxOffProcElmts(hA->ij, 0));
2131ddbeb582SStefano Zampini break;
2132651b1cf9SStefano Zampini case MAT_IGNORE_OFF_PROC_ENTRIES:
2133651b1cf9SStefano Zampini hA->donotstash = flg;
2134d71ae5a4SJacob Faibussowitsch break;
2135d71ae5a4SJacob Faibussowitsch default:
2136d71ae5a4SJacob Faibussowitsch break;
2137ddbeb582SStefano Zampini }
21383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2139ddbeb582SStefano Zampini }
2140c69f721fSFande Kong
2141d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_HYPRE(Mat A, PetscViewer view)
2142d71ae5a4SJacob Faibussowitsch {
214345b8d346SStefano Zampini PetscViewerFormat format;
214445b8d346SStefano Zampini
214545b8d346SStefano Zampini PetscFunctionBegin;
21469566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(view, &format));
21473ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
214845b8d346SStefano Zampini if (format != PETSC_VIEWER_NATIVE) {
21496ea7df73SStefano Zampini Mat B;
21506ea7df73SStefano Zampini hypre_ParCSRMatrix *parcsr;
21516ea7df73SStefano Zampini PetscErrorCode (*mview)(Mat, PetscViewer) = NULL;
21526ea7df73SStefano Zampini
21539566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
21549566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(parcsr, MATAIJ, PETSC_USE_POINTER, &B));
215557d50842SBarry Smith PetscCall(MatGetOperation(B, MATOP_VIEW, (PetscErrorCodeFn **)&mview));
215628b400f6SJacob Faibussowitsch PetscCheck(mview, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing view operation");
21579566063dSJacob Faibussowitsch PetscCall((*mview)(B, view));
21589566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B));
215945b8d346SStefano Zampini } else {
216045b8d346SStefano Zampini Mat_HYPRE *hA = (Mat_HYPRE *)A->data;
216145b8d346SStefano Zampini PetscMPIInt size;
216245b8d346SStefano Zampini PetscBool isascii;
216345b8d346SStefano Zampini const char *filename;
216445b8d346SStefano Zampini
216545b8d346SStefano Zampini /* HYPRE uses only text files */
21669566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)view, PETSCVIEWERASCII, &isascii));
216728b400f6SJacob Faibussowitsch PetscCheck(isascii, PetscObjectComm((PetscObject)view), PETSC_ERR_SUP, "PetscViewerType %s: native HYPRE format needs PETSCVIEWERASCII", ((PetscObject)view)->type_name);
21689566063dSJacob Faibussowitsch PetscCall(PetscViewerFileGetName(view, &filename));
2169a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_IJMatrixPrint(hA->ij, filename));
21709566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(hA->comm, &size));
217145b8d346SStefano Zampini if (size > 1) {
21729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix files: %s.%05d ... %s.%05d\n", filename, 0, filename, size - 1));
217345b8d346SStefano Zampini } else {
21749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(view, "Matrix file: %s.%05d\n", filename, 0));
217545b8d346SStefano Zampini }
217645b8d346SStefano Zampini }
21773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
217845b8d346SStefano Zampini }
217945b8d346SStefano Zampini
2180d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_HYPRE(Mat A, Mat B, MatStructure str)
2181d71ae5a4SJacob Faibussowitsch {
2182465edc17SStefano Zampini hypre_ParCSRMatrix *acsr, *bcsr;
2183465edc17SStefano Zampini
2184465edc17SStefano Zampini PetscFunctionBegin;
2185465edc17SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) {
21869566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &acsr));
21879566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(B, &bcsr));
2188a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixCopy(acsr, bcsr, 1));
21899566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_SORTED_FULL, PETSC_TRUE)); /* "perfect" preallocation, so no need for hypre_AuxParCSRMatrixNeedAux */
21909566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
21919566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
2192465edc17SStefano Zampini } else {
21939566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str));
2194465edc17SStefano Zampini }
21953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2196465edc17SStefano Zampini }
2197465edc17SStefano Zampini
2198d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_HYPRE(Mat A, Vec d)
2199d71ae5a4SJacob Faibussowitsch {
22006305df00SStefano Zampini hypre_ParCSRMatrix *parcsr;
22016305df00SStefano Zampini hypre_CSRMatrix *dmat;
220239accc25SStefano Zampini HYPRE_Complex *a;
22036305df00SStefano Zampini PetscBool cong;
22046305df00SStefano Zampini
22056305df00SStefano Zampini PetscFunctionBegin;
22069566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong));
220728b400f6SJacob Faibussowitsch PetscCheck(cong, PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "Only for square matrices with same local distributions of rows and columns");
22089566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
22096305df00SStefano Zampini dmat = hypre_ParCSRMatrixDiag(parcsr);
22106305df00SStefano Zampini if (dmat) {
221106977982Sstefanozampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
221206977982Sstefanozampini HYPRE_MemoryLocation mem = hypre_CSRMatrixMemoryLocation(dmat);
221306977982Sstefanozampini #else
221406977982Sstefanozampini HYPRE_MemoryLocation mem = HYPRE_MEMORY_HOST;
221506977982Sstefanozampini #endif
221606977982Sstefanozampini
221706977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(VecGetArrayWriteAndMemType(d, (PetscScalar **)&a, NULL));
221806977982Sstefanozampini else PetscCall(VecGetArrayWrite(d, (PetscScalar **)&a));
221906977982Sstefanozampini hypre_CSRMatrixExtractDiagonal(dmat, a, 0);
222006977982Sstefanozampini if (mem != HYPRE_MEMORY_HOST) PetscCall(VecRestoreArrayWriteAndMemType(d, (PetscScalar **)&a));
222106977982Sstefanozampini else PetscCall(VecRestoreArrayWrite(d, (PetscScalar **)&a));
22226305df00SStefano Zampini }
22233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
22246305df00SStefano Zampini }
22256305df00SStefano Zampini
2226363d496dSStefano Zampini #include <petscblaslapack.h>
2227363d496dSStefano Zampini
2228d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_HYPRE(Mat Y, PetscScalar a, Mat X, MatStructure str)
2229d71ae5a4SJacob Faibussowitsch {
2230363d496dSStefano Zampini PetscFunctionBegin;
22316ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
22326ea7df73SStefano Zampini {
22336ea7df73SStefano Zampini Mat B;
22346ea7df73SStefano Zampini hypre_ParCSRMatrix *x, *y, *z;
22356ea7df73SStefano Zampini
22369566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y));
22379566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x));
2238a333fa2bSZach Atkins PetscCallHYPRE(hypre_ParCSRMatrixAdd(1.0, y, 1.0, x, &z));
22399566063dSJacob Faibussowitsch PetscCall(MatCreateFromParCSR(z, MATHYPRE, PETSC_OWN_POINTER, &B));
22409566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B));
22416ea7df73SStefano Zampini }
22426ea7df73SStefano Zampini #else
2243363d496dSStefano Zampini if (str == SAME_NONZERO_PATTERN) {
2244363d496dSStefano Zampini hypre_ParCSRMatrix *x, *y;
2245363d496dSStefano Zampini hypre_CSRMatrix *xloc, *yloc;
2246363d496dSStefano Zampini PetscInt xnnz, ynnz;
224739accc25SStefano Zampini HYPRE_Complex *xarr, *yarr;
2248363d496dSStefano Zampini PetscBLASInt one = 1, bnz;
2249363d496dSStefano Zampini
22509566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(Y, &y));
22519566063dSJacob Faibussowitsch PetscCall(MatHYPREGetParCSR(X, &x));
2252363d496dSStefano Zampini
2253363d496dSStefano Zampini /* diagonal block */
2254363d496dSStefano Zampini xloc = hypre_ParCSRMatrixDiag(x);
2255363d496dSStefano Zampini yloc = hypre_ParCSRMatrixDiag(y);
2256363d496dSStefano Zampini xnnz = 0;
2257363d496dSStefano Zampini ynnz = 0;
2258363d496dSStefano Zampini xarr = NULL;
2259363d496dSStefano Zampini yarr = NULL;
2260363d496dSStefano Zampini if (xloc) {
226139accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc);
2262363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2263363d496dSStefano Zampini }
2264363d496dSStefano Zampini if (yloc) {
226539accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc);
2266363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2267363d496dSStefano Zampini }
226808401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
22699566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz));
2270792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2271363d496dSStefano Zampini
2272363d496dSStefano Zampini /* off-diagonal block */
2273363d496dSStefano Zampini xloc = hypre_ParCSRMatrixOffd(x);
2274363d496dSStefano Zampini yloc = hypre_ParCSRMatrixOffd(y);
2275363d496dSStefano Zampini xnnz = 0;
2276363d496dSStefano Zampini ynnz = 0;
2277363d496dSStefano Zampini xarr = NULL;
2278363d496dSStefano Zampini yarr = NULL;
2279363d496dSStefano Zampini if (xloc) {
228039accc25SStefano Zampini xarr = hypre_CSRMatrixData(xloc);
2281363d496dSStefano Zampini xnnz = hypre_CSRMatrixNumNonzeros(xloc);
2282363d496dSStefano Zampini }
2283363d496dSStefano Zampini if (yloc) {
228439accc25SStefano Zampini yarr = hypre_CSRMatrixData(yloc);
2285363d496dSStefano Zampini ynnz = hypre_CSRMatrixNumNonzeros(yloc);
2286363d496dSStefano Zampini }
228708401ef6SPierre Jolivet PetscCheck(xnnz == ynnz, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different number of nonzeros in off-diagonal block %" PetscInt_FMT " != %" PetscInt_FMT, xnnz, ynnz);
22889566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(xnnz, &bnz));
2289792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &a, (PetscScalar *)xarr, &one, (PetscScalar *)yarr, &one));
2290363d496dSStefano Zampini } else if (str == SUBSET_NONZERO_PATTERN) {
22919566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str));
2292363d496dSStefano Zampini } else {
2293363d496dSStefano Zampini Mat B;
2294363d496dSStefano Zampini
22959566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic_Preallocate(Y, X, &B));
22969566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
22979566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(Y, &B));
2298363d496dSStefano Zampini }
22996ea7df73SStefano Zampini #endif
23003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2301363d496dSStefano Zampini }
2302363d496dSStefano Zampini
23032c4ab24aSJunchao Zhang static PetscErrorCode MatDuplicate_HYPRE(Mat A, MatDuplicateOption op, Mat *B)
23042c4ab24aSJunchao Zhang {
23052c4ab24aSJunchao Zhang hypre_ParCSRMatrix *parcsr = NULL;
23062c4ab24aSJunchao Zhang PetscCopyMode cpmode;
23072c4ab24aSJunchao Zhang Mat_HYPRE *hA;
23082c4ab24aSJunchao Zhang
23092c4ab24aSJunchao Zhang PetscFunctionBegin;
23102c4ab24aSJunchao Zhang PetscCall(MatHYPREGetParCSR_HYPRE(A, &parcsr));
23112c4ab24aSJunchao Zhang if (op == MAT_DO_NOT_COPY_VALUES || op == MAT_SHARE_NONZERO_PATTERN) {
23122c4ab24aSJunchao Zhang parcsr = hypre_ParCSRMatrixClone(parcsr, 0);
23132c4ab24aSJunchao Zhang cpmode = PETSC_OWN_POINTER;
23142c4ab24aSJunchao Zhang } else {
23152c4ab24aSJunchao Zhang cpmode = PETSC_COPY_VALUES;
23162c4ab24aSJunchao Zhang }
23172c4ab24aSJunchao Zhang PetscCall(MatCreateFromParCSR(parcsr, MATHYPRE, cpmode, B));
23182c4ab24aSJunchao Zhang hA = (Mat_HYPRE *)A->data;
23192c4ab24aSJunchao Zhang if (hA->cooMat) {
232006977982Sstefanozampini Mat_HYPRE *hB = (Mat_HYPRE *)((*B)->data);
2321b73e3080SStefano Zampini op = (op == MAT_DO_NOT_COPY_VALUES) ? op : MAT_COPY_VALUES;
2322b73e3080SStefano Zampini /* Cannot simply increase the reference count of hA->cooMat, since B needs to share cooMat's data array */
232306977982Sstefanozampini PetscCall(MatDuplicate(hA->cooMat, op, &hB->cooMat));
232406977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(*B));
23252c4ab24aSJunchao Zhang }
23262c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS);
23272c4ab24aSJunchao Zhang }
23282c4ab24aSJunchao Zhang
2329d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetPreallocationCOO_HYPRE(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
2330d71ae5a4SJacob Faibussowitsch {
233106977982Sstefanozampini Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
23325fbaff96SJunchao Zhang
23335fbaff96SJunchao Zhang PetscFunctionBegin;
2334651b1cf9SStefano Zampini /* Build an agent matrix cooMat with AIJ format
23355fbaff96SJunchao Zhang It has the same sparsity pattern as mat, and also shares the data array with mat. We use cooMat to do the COO work.
23365fbaff96SJunchao Zhang */
233706977982Sstefanozampini PetscCall(MatHYPRE_CreateCOOMat(mat));
233806977982Sstefanozampini PetscCall(MatSetOption(hmat->cooMat, MAT_IGNORE_OFF_PROC_ENTRIES, hmat->donotstash));
233906977982Sstefanozampini PetscCall(MatSetOption(hmat->cooMat, MAT_NO_OFF_PROC_ENTRIES, mat->nooffprocentries));
2340651b1cf9SStefano Zampini
2341651b1cf9SStefano Zampini /* MatSetPreallocationCOO_SeqAIJ and MatSetPreallocationCOO_MPIAIJ uses this specific
2342651b1cf9SStefano Zampini name to automatically put the diagonal entries first */
234306977982Sstefanozampini PetscCall(PetscObjectSetName((PetscObject)hmat->cooMat, "_internal_COO_mat_for_hypre"));
234406977982Sstefanozampini PetscCall(MatSetPreallocationCOO(hmat->cooMat, coo_n, coo_i, coo_j));
234506977982Sstefanozampini hmat->cooMat->assembled = PETSC_TRUE;
23465fbaff96SJunchao Zhang
23475fbaff96SJunchao Zhang /* Copy the sparsity pattern from cooMat to hypre IJMatrix hmat->ij */
23485fbaff96SJunchao Zhang PetscCall(MatSetOption(mat, MAT_SORTED_FULL, PETSC_TRUE));
234906977982Sstefanozampini PetscCall(MatHYPRE_CreateFromMat(hmat->cooMat, hmat)); /* Create hmat->ij and preallocate it */
235006977982Sstefanozampini PetscCall(MatHYPRE_IJMatrixCopyIJ(hmat->cooMat, hmat->ij)); /* Copy A's (i,j) to hmat->ij */
23515fbaff96SJunchao Zhang
23525fbaff96SJunchao Zhang mat->preallocated = PETSC_TRUE;
23535fbaff96SJunchao Zhang PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
23545fbaff96SJunchao Zhang PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); /* Migrate mat to device if it is bound to. Hypre builds its own SpMV context here */
23555fbaff96SJunchao Zhang
23562c4ab24aSJunchao Zhang /* Attach cooMat to mat */
235706977982Sstefanozampini PetscCall(MatHYPRE_AttachCOOMat(mat));
23583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
23595fbaff96SJunchao Zhang }
23605fbaff96SJunchao Zhang
2361d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_HYPRE(Mat mat, const PetscScalar v[], InsertMode imode)
2362d71ae5a4SJacob Faibussowitsch {
23635fbaff96SJunchao Zhang Mat_HYPRE *hmat = (Mat_HYPRE *)mat->data;
23645fbaff96SJunchao Zhang
23655fbaff96SJunchao Zhang PetscFunctionBegin;
2366b73e3080SStefano Zampini PetscCheck(hmat->cooMat, PetscObjectComm((PetscObject)mat), PETSC_ERR_PLIB, "HYPRE COO delegate matrix has not been created yet");
23675fbaff96SJunchao Zhang PetscCall(MatSetValuesCOO(hmat->cooMat, v, imode));
2368651b1cf9SStefano Zampini PetscCall(MatViewFromOptions(hmat->cooMat, (PetscObject)mat, "-cooMat_view"));
23693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
23705fbaff96SJunchao Zhang }
23715fbaff96SJunchao Zhang
237203db1824SAlex Lindsay static PetscErrorCode MatGetCurrentMemType_HYPRE(Mat A, PetscMemType *m)
237303db1824SAlex Lindsay {
237403db1824SAlex Lindsay PetscBool petsconcpu;
237503db1824SAlex Lindsay
237603db1824SAlex Lindsay PetscFunctionBegin;
237703db1824SAlex Lindsay PetscCall(MatBoundToCPU(A, &petsconcpu));
237803db1824SAlex Lindsay *m = petsconcpu ? PETSC_MEMTYPE_HOST : PETSC_MEMTYPE_DEVICE;
237903db1824SAlex Lindsay PetscFunctionReturn(PETSC_SUCCESS);
238003db1824SAlex Lindsay }
238103db1824SAlex Lindsay
2382a055b5aaSBarry Smith /*MC
23832ef1f0ffSBarry Smith MATHYPRE - "hypre" - A matrix type to be used for sequential and parallel sparse matrices
2384a055b5aaSBarry Smith based on the hypre IJ interface.
2385a055b5aaSBarry Smith
2386a055b5aaSBarry Smith Level: intermediate
2387a055b5aaSBarry Smith
23881cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatHYPRESetPreallocation`
2389a055b5aaSBarry Smith M*/
2390d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_HYPRE(Mat B)
2391d71ae5a4SJacob Faibussowitsch {
239263c07aadSStefano Zampini Mat_HYPRE *hB;
2393a9e6c71bSAlex Lindsay #if defined(PETSC_HAVE_HYPRE_DEVICE)
2394a9e6c71bSAlex Lindsay HYPRE_MemoryLocation memory_location;
2395a9e6c71bSAlex Lindsay #endif
239663c07aadSStefano Zampini
239763c07aadSStefano Zampini PetscFunctionBegin;
2398*5482091fSJunchao Zhang PetscCall(PetscHYPREInitialize());
23994dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&hB));
24006ea7df73SStefano Zampini
2401978814f1SStefano Zampini hB->inner_free = PETSC_TRUE;
2402651b1cf9SStefano Zampini hB->array_available = PETSC_TRUE;
2403978814f1SStefano Zampini
240463c07aadSStefano Zampini B->data = (void *)hB;
240563c07aadSStefano Zampini
24069566063dSJacob Faibussowitsch PetscCall(PetscMemzero(B->ops, sizeof(struct _MatOps)));
240763c07aadSStefano Zampini B->ops->mult = MatMult_HYPRE;
240863c07aadSStefano Zampini B->ops->multtranspose = MatMultTranspose_HYPRE;
2409414bd5c3SStefano Zampini B->ops->multadd = MatMultAdd_HYPRE;
2410414bd5c3SStefano Zampini B->ops->multtransposeadd = MatMultTransposeAdd_HYPRE;
241163c07aadSStefano Zampini B->ops->setup = MatSetUp_HYPRE;
241263c07aadSStefano Zampini B->ops->destroy = MatDestroy_HYPRE;
241363c07aadSStefano Zampini B->ops->assemblyend = MatAssemblyEnd_HYPRE;
2414c69f721fSFande Kong B->ops->assemblybegin = MatAssemblyBegin_HYPRE;
2415d975228cSstefano_zampini B->ops->setvalues = MatSetValues_HYPRE;
241668ec7858SStefano Zampini B->ops->scale = MatScale_HYPRE;
241768ec7858SStefano Zampini B->ops->zerorowscolumns = MatZeroRowsColumns_HYPRE;
2418c69f721fSFande Kong B->ops->zeroentries = MatZeroEntries_HYPRE;
2419c69f721fSFande Kong B->ops->zerorows = MatZeroRows_HYPRE;
2420c69f721fSFande Kong B->ops->getrow = MatGetRow_HYPRE;
2421c69f721fSFande Kong B->ops->restorerow = MatRestoreRow_HYPRE;
2422c69f721fSFande Kong B->ops->getvalues = MatGetValues_HYPRE;
2423ddbeb582SStefano Zampini B->ops->setoption = MatSetOption_HYPRE;
242445b8d346SStefano Zampini B->ops->duplicate = MatDuplicate_HYPRE;
2425465edc17SStefano Zampini B->ops->copy = MatCopy_HYPRE;
242645b8d346SStefano Zampini B->ops->view = MatView_HYPRE;
24276305df00SStefano Zampini B->ops->getdiagonal = MatGetDiagonal_HYPRE;
2428363d496dSStefano Zampini B->ops->axpy = MatAXPY_HYPRE;
24294222ddf1SHong Zhang B->ops->productsetfromoptions = MatProductSetFromOptions_HYPRE;
243003db1824SAlex Lindsay B->ops->getcurrentmemtype = MatGetCurrentMemType_HYPRE;
24316ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
24326ea7df73SStefano Zampini B->ops->bindtocpu = MatBindToCPU_HYPRE;
2433a9e6c71bSAlex Lindsay /* Get hypre's default memory location. Users can control this using the corresponding HYPRE_SetMemoryLocation API */
2434a333fa2bSZach Atkins PetscCallHYPRE(HYPRE_GetMemoryLocation(&memory_location));
2435a9e6c71bSAlex Lindsay B->boundtocpu = (memory_location == HYPRE_MEMORY_HOST) ? PETSC_TRUE : PETSC_FALSE;
24366ea7df73SStefano Zampini #endif
243745b8d346SStefano Zampini
243845b8d346SStefano Zampini /* build cache for off array entries formed */
24399566063dSJacob Faibussowitsch PetscCall(MatStashCreate_Private(PetscObjectComm((PetscObject)B), 1, &B->stash));
244063c07aadSStefano Zampini
24419566063dSJacob Faibussowitsch PetscCall(PetscCommGetComm(PetscObjectComm((PetscObject)B), &hB->comm));
24429566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATHYPRE));
24439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_aij_C", MatConvert_HYPRE_AIJ));
24449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_hypre_is_C", MatConvert_HYPRE_IS));
24459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_hypre_C", MatProductSetFromOptions_HYPRE));
24469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaij_hypre_C", MatProductSetFromOptions_HYPRE));
24479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPRESetPreallocation_C", MatHYPRESetPreallocation_HYPRE));
24489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatHYPREGetParCSR_C", MatHYPREGetParCSR_HYPRE));
24495fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_HYPRE));
24505fbaff96SJunchao Zhang PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_HYPRE));
24516ea7df73SStefano Zampini #if defined(PETSC_HAVE_HYPRE_DEVICE)
24526ea7df73SStefano Zampini #if defined(HYPRE_USING_HIP)
245306977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE));
245406977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijhipsparse_hypre_C", MatProductSetFromOptions_HYPRE));
24559566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_HIP));
24569566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECHIP));
24576ea7df73SStefano Zampini #endif
24586ea7df73SStefano Zampini #if defined(HYPRE_USING_CUDA)
245906977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE));
246006977982Sstefanozampini PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_mpiaijcusparse_hypre_C", MatProductSetFromOptions_HYPRE));
24619566063dSJacob Faibussowitsch PetscCall(PetscDeviceInitialize(PETSC_DEVICE_CUDA));
24629566063dSJacob Faibussowitsch PetscCall(MatSetVecType(B, VECCUDA));
24636ea7df73SStefano Zampini #endif
24646ea7df73SStefano Zampini #endif
24653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
246663c07aadSStefano Zampini }
2467