1120bdd93SDave May #include <petsc/private/matimpl.h>
21e07b27eSBarry Smith #include <petsc/private/pcimpl.h>
35e897e82SDave May #include <petsc/private/dmimpl.h>
41e07b27eSBarry Smith #include <petscksp.h> /*I "petscksp.h" I*/
51e07b27eSBarry Smith #include <petscdm.h>
61e07b27eSBarry Smith #include <petscdmda.h>
71e07b27eSBarry Smith
8575a0592SBarry Smith #include "../src/ksp/pc/impls/telescope/telescope.h"
91e07b27eSBarry Smith
/*
  cited    - flag, initially PETSC_FALSE, stored next to the BibTeX entry below.
  citation - BibTeX @inproceedings entry for "Extreme-Scale Multigrid Components within PETSc"
             (May, Sanan, Rupp, Knepley, Smith; PASC '16).

  NOTE(review): the code that consumes these two statics is not visible in this section;
  presumably they are handed to a citation-registration call later in the file - confirm.
*/
10bf00f589SPatrick Sanan static PetscBool cited = PETSC_FALSE;
119371c9d4SSatish Balay static const char citation[] = "@inproceedings{MaySananRuppKnepleySmith2016,\n"
12bf00f589SPatrick Sanan " title = {Extreme-Scale Multigrid Components within PETSc},\n"
13bf00f589SPatrick Sanan " author = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n"
14bf00f589SPatrick Sanan " booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n"
15bf00f589SPatrick Sanan " series = {PASC '16},\n"
16bf00f589SPatrick Sanan " isbn = {978-1-4503-4126-4},\n"
17bf00f589SPatrick Sanan " location = {Lausanne, Switzerland},\n"
18bf00f589SPatrick Sanan " pages = {5:1--5:12},\n"
19bf00f589SPatrick Sanan " articleno = {5},\n"
20bf00f589SPatrick Sanan " numpages = {12},\n"
21a8d69d7bSBarry Smith " url = {https://doi.acm.org/10.1145/2929908.2929913},\n"
22bf00f589SPatrick Sanan " doi = {10.1145/2929908.2929913},\n"
23bf00f589SPatrick Sanan " acmid = {2929913},\n"
24bf00f589SPatrick Sanan " publisher = {ACM},\n"
25bf00f589SPatrick Sanan " address = {New York, NY, USA},\n"
26bf00f589SPatrick Sanan " keywords = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n"
27bf00f589SPatrick Sanan " year = {2016}\n"
28bf00f589SPatrick Sanan "}\n";
29bf00f589SPatrick Sanan
_DMDADetermineRankFromGlobalIJK(PetscInt dim,PetscInt i,PetscInt j,PetscInt k,PetscInt Mp,PetscInt Np,PetscInt Pp,PetscInt start_i[],PetscInt start_j[],PetscInt start_k[],PetscInt span_i[],PetscInt span_j[],PetscInt span_k[],PetscMPIInt * _pi,PetscMPIInt * _pj,PetscMPIInt * _pk,PetscMPIInt * rank_re)30d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineRankFromGlobalIJK(PetscInt dim, PetscInt i, PetscInt j, PetscInt k, PetscInt Mp, PetscInt Np, PetscInt Pp, PetscInt start_i[], PetscInt start_j[], PetscInt start_k[], PetscInt span_i[], PetscInt span_j[], PetscInt span_k[], PetscMPIInt *_pi, PetscMPIInt *_pj, PetscMPIInt *_pk, PetscMPIInt *rank_re)
31d71ae5a4SJacob Faibussowitsch {
321e07b27eSBarry Smith PetscInt pi, pj, pk, n;
331e07b27eSBarry Smith
341e07b27eSBarry Smith PetscFunctionBegin;
35137d0469SJed Brown *rank_re = -1;
36137d0469SJed Brown if (_pi) *_pi = -1;
37137d0469SJed Brown if (_pj) *_pj = -1;
38137d0469SJed Brown if (_pk) *_pk = -1;
391e07b27eSBarry Smith pi = pj = pk = -1;
401e07b27eSBarry Smith if (_pi) {
411e07b27eSBarry Smith for (n = 0; n < Mp; n++) {
421e07b27eSBarry Smith if ((i >= start_i[n]) && (i < start_i[n] + span_i[n])) {
431e07b27eSBarry Smith pi = n;
441e07b27eSBarry Smith break;
451e07b27eSBarry Smith }
461e07b27eSBarry Smith }
4763a3b9bcSJacob Faibussowitsch PetscCheck(pi != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pi cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Mp, i);
48835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi, _pi));
491e07b27eSBarry Smith }
501e07b27eSBarry Smith
511e07b27eSBarry Smith if (_pj) {
521e07b27eSBarry Smith for (n = 0; n < Np; n++) {
531e07b27eSBarry Smith if ((j >= start_j[n]) && (j < start_j[n] + span_j[n])) {
541e07b27eSBarry Smith pj = n;
551e07b27eSBarry Smith break;
561e07b27eSBarry Smith }
571e07b27eSBarry Smith }
5863a3b9bcSJacob Faibussowitsch PetscCheck(pj != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pj cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Np, j);
59835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pj, _pj));
601e07b27eSBarry Smith }
611e07b27eSBarry Smith
621e07b27eSBarry Smith if (_pk) {
631e07b27eSBarry Smith for (n = 0; n < Pp; n++) {
641e07b27eSBarry Smith if ((k >= start_k[n]) && (k < start_k[n] + span_k[n])) {
651e07b27eSBarry Smith pk = n;
661e07b27eSBarry Smith break;
671e07b27eSBarry Smith }
681e07b27eSBarry Smith }
6963a3b9bcSJacob Faibussowitsch PetscCheck(pk != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pk cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Pp, k);
70835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pk, _pk));
711e07b27eSBarry Smith }
721e07b27eSBarry Smith
731e07b27eSBarry Smith switch (dim) {
74d71ae5a4SJacob Faibussowitsch case 1:
75835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi, rank_re));
76d71ae5a4SJacob Faibussowitsch break;
77d71ae5a4SJacob Faibussowitsch case 2:
78835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi + pj * Mp, rank_re));
79d71ae5a4SJacob Faibussowitsch break;
80d71ae5a4SJacob Faibussowitsch case 3:
81835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi + pj * Mp + pk * (Mp * Np), rank_re));
82d71ae5a4SJacob Faibussowitsch break;
831e07b27eSBarry Smith }
843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
851e07b27eSBarry Smith }
861e07b27eSBarry Smith
_DMDADetermineGlobalS0(PetscInt dim,PetscMPIInt rank_re,PetscInt Mp_re,PetscInt Np_re,PetscInt Pp_re,PetscInt range_i_re[],PetscInt range_j_re[],PetscInt range_k_re[],PetscInt * s0)87d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineGlobalS0(PetscInt dim, PetscMPIInt rank_re, PetscInt Mp_re, PetscInt Np_re, PetscInt Pp_re, PetscInt range_i_re[], PetscInt range_j_re[], PetscInt range_k_re[], PetscInt *s0)
88d71ae5a4SJacob Faibussowitsch {
89c6a0d831SBarry Smith PetscInt i, j, k, start_IJK = 0;
901e07b27eSBarry Smith PetscInt rank_ijk;
911e07b27eSBarry Smith
921e07b27eSBarry Smith PetscFunctionBegin;
931e07b27eSBarry Smith switch (dim) {
941e07b27eSBarry Smith case 1:
951e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) {
961e07b27eSBarry Smith rank_ijk = i;
97ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i];
981e07b27eSBarry Smith }
991e07b27eSBarry Smith break;
1001e07b27eSBarry Smith case 2:
1011e07b27eSBarry Smith for (j = 0; j < Np_re; j++) {
1021e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) {
1031e07b27eSBarry Smith rank_ijk = i + j * Mp_re;
104ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j];
1051e07b27eSBarry Smith }
1061e07b27eSBarry Smith }
1071e07b27eSBarry Smith break;
1081e07b27eSBarry Smith case 3:
1091e07b27eSBarry Smith for (k = 0; k < Pp_re; k++) {
1101e07b27eSBarry Smith for (j = 0; j < Np_re; j++) {
1111e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) {
1121e07b27eSBarry Smith rank_ijk = i + j * Mp_re + k * Mp_re * Np_re;
113ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j] * range_k_re[k];
1141e07b27eSBarry Smith }
1151e07b27eSBarry Smith }
1161e07b27eSBarry Smith }
1171e07b27eSBarry Smith break;
1181e07b27eSBarry Smith }
1191e07b27eSBarry Smith *s0 = start_IJK;
1203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
1211e07b27eSBarry Smith }
1221e07b27eSBarry Smith
PCTelescopeSetUp_dmda_repart_coors2d(PC_Telescope sred,DM dm,DM subdm)123d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors2d(PC_Telescope sred, DM dm, DM subdm)
124d71ae5a4SJacob Faibussowitsch {
1251e07b27eSBarry Smith DM cdm;
1261e07b27eSBarry Smith Vec coor, coor_natural, perm_coors;
1271e07b27eSBarry Smith PetscInt i, j, si, sj, ni, nj, M, N, Ml, Nl, c, nidx;
1281e07b27eSBarry Smith PetscInt *fine_indices;
1291e07b27eSBarry Smith IS is_fine, is_local;
1301e07b27eSBarry Smith VecScatter sctx;
1311e07b27eSBarry Smith
1321e07b27eSBarry Smith PetscFunctionBegin;
1339566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor));
1343ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
13548a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0));
1361e07b27eSBarry Smith /* Get the coordinate vector from the distributed array */
1379566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(dm, &cdm));
1389566063dSJacob Faibussowitsch PetscCall(DMDACreateNaturalVector(cdm, &coor_natural));
1391e07b27eSBarry Smith
1409566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural));
1419566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural));
1421e07b27eSBarry Smith
1431e07b27eSBarry Smith /* get indices of the guys I want to grab */
1449566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
14557f12427SDave May if (PCTelescope_isActiveRank(sred)) {
1469566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(subdm, &si, &sj, NULL, &ni, &nj, NULL));
14715dd08bcSBarry Smith Ml = ni;
14815dd08bcSBarry Smith Nl = nj;
1491e07b27eSBarry Smith } else {
150c41e779fSDave May si = sj = 0;
151c41e779fSDave May ni = nj = 0;
1523ac26c5eSBarry Smith Ml = Nl = 0;
1531e07b27eSBarry Smith }
1541e07b27eSBarry Smith
1559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Ml * Nl * 2, &fine_indices));
1561e07b27eSBarry Smith c = 0;
15757f12427SDave May if (PCTelescope_isActiveRank(sred)) {
1581e07b27eSBarry Smith for (j = sj; j < sj + nj; j++) {
1591e07b27eSBarry Smith for (i = si; i < si + ni; i++) {
1601e07b27eSBarry Smith nidx = (i) + (j)*M;
1611e07b27eSBarry Smith fine_indices[c] = 2 * nidx;
1621e07b27eSBarry Smith fine_indices[c + 1] = 2 * nidx + 1;
1631e07b27eSBarry Smith c = c + 2;
1641e07b27eSBarry Smith }
1651e07b27eSBarry Smith }
16663a3b9bcSJacob Faibussowitsch PetscCheck(c == Ml * Nl * 2, PETSC_COMM_SELF, PETSC_ERR_PLIB, "c %" PetscInt_FMT " should equal 2 * Ml %" PetscInt_FMT " * Nl %" PetscInt_FMT, c, Ml, Nl);
1671e07b27eSBarry Smith }
1681e07b27eSBarry Smith
1691e07b27eSBarry Smith /* generate scatter */
1709566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * 2, fine_indices, PETSC_USE_POINTER, &is_fine));
1719566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * 2, 0, 1, &is_local));
1721e07b27eSBarry Smith
1731e07b27eSBarry Smith /* scatter */
1749566063dSJacob Faibussowitsch PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors));
1759566063dSJacob Faibussowitsch PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * 2));
1769566063dSJacob Faibussowitsch PetscCall(VecSetType(perm_coors, VECSEQ));
1771e07b27eSBarry Smith
1789566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx));
1799566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
1809566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
1811e07b27eSBarry Smith /* access */
18257f12427SDave May if (PCTelescope_isActiveRank(sred)) {
1831e07b27eSBarry Smith Vec _coors;
1841e07b27eSBarry Smith const PetscScalar *LA_perm;
1851e07b27eSBarry Smith PetscScalar *LA_coors;
1861e07b27eSBarry Smith
1879566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors));
1889566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(perm_coors, &LA_perm));
1899566063dSJacob Faibussowitsch PetscCall(VecGetArray(_coors, &LA_coors));
190ad540459SPierre Jolivet for (i = 0; i < Ml * Nl * 2; i++) LA_coors[i] = LA_perm[i];
1919566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(_coors, &LA_coors));
1929566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm));
1931e07b27eSBarry Smith }
1941e07b27eSBarry Smith
1951e07b27eSBarry Smith /* update local coords */
19657f12427SDave May if (PCTelescope_isActiveRank(sred)) {
1971e07b27eSBarry Smith DM _dmc;
1981e07b27eSBarry Smith Vec _coors, _coors_local;
1999566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(subdm, &_dmc));
2009566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors));
2019566063dSJacob Faibussowitsch PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local));
2029566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local));
2039566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local));
2041e07b27eSBarry Smith }
2059566063dSJacob Faibussowitsch PetscCall(VecScatterDestroy(&sctx));
2069566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_fine));
2079566063dSJacob Faibussowitsch PetscCall(PetscFree(fine_indices));
2089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_local));
2099566063dSJacob Faibussowitsch PetscCall(VecDestroy(&perm_coors));
2109566063dSJacob Faibussowitsch PetscCall(VecDestroy(&coor_natural));
2113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
2121e07b27eSBarry Smith }
2131e07b27eSBarry Smith
PCTelescopeSetUp_dmda_repart_coors3d(PC_Telescope sred,DM dm,DM subdm)214d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors3d(PC_Telescope sred, DM dm, DM subdm)
215d71ae5a4SJacob Faibussowitsch {
2161e07b27eSBarry Smith DM cdm;
2171e07b27eSBarry Smith Vec coor, coor_natural, perm_coors;
2181e07b27eSBarry Smith PetscInt i, j, k, si, sj, sk, ni, nj, nk, M, N, P, Ml, Nl, Pl, c, nidx;
2191e07b27eSBarry Smith PetscInt *fine_indices;
2201e07b27eSBarry Smith IS is_fine, is_local;
2211e07b27eSBarry Smith VecScatter sctx;
2221e07b27eSBarry Smith
2231e07b27eSBarry Smith PetscFunctionBegin;
2249566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor));
2253ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
2261e07b27eSBarry Smith
22748a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0));
2281e07b27eSBarry Smith
2291e07b27eSBarry Smith /* Get the coordinate vector from the distributed array */
2309566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(dm, &cdm));
2319566063dSJacob Faibussowitsch PetscCall(DMDACreateNaturalVector(cdm, &coor_natural));
2329566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural));
2339566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural));
2341e07b27eSBarry Smith
2351e07b27eSBarry Smith /* get indices of the guys I want to grab */
2369566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
2371e07b27eSBarry Smith
23857f12427SDave May if (PCTelescope_isActiveRank(sred)) {
2399566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(subdm, &si, &sj, &sk, &ni, &nj, &nk));
240553d0ae9SBarry Smith Ml = ni;
241553d0ae9SBarry Smith Nl = nj;
242553d0ae9SBarry Smith Pl = nk;
2431e07b27eSBarry Smith } else {
244c41e779fSDave May si = sj = sk = 0;
245c41e779fSDave May ni = nj = nk = 0;
2463ac26c5eSBarry Smith Ml = Nl = Pl = 0;
2471e07b27eSBarry Smith }
2481e07b27eSBarry Smith
2499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Ml * Nl * Pl * 3, &fine_indices));
2501e07b27eSBarry Smith
2511e07b27eSBarry Smith c = 0;
25257f12427SDave May if (PCTelescope_isActiveRank(sred)) {
2531e07b27eSBarry Smith for (k = sk; k < sk + nk; k++) {
2541e07b27eSBarry Smith for (j = sj; j < sj + nj; j++) {
2551e07b27eSBarry Smith for (i = si; i < si + ni; i++) {
2561e07b27eSBarry Smith nidx = (i) + (j)*M + (k)*M * N;
2571e07b27eSBarry Smith fine_indices[c] = 3 * nidx;
2581e07b27eSBarry Smith fine_indices[c + 1] = 3 * nidx + 1;
2591e07b27eSBarry Smith fine_indices[c + 2] = 3 * nidx + 2;
2601e07b27eSBarry Smith c = c + 3;
2611e07b27eSBarry Smith }
2621e07b27eSBarry Smith }
2631e07b27eSBarry Smith }
2641e07b27eSBarry Smith }
2651e07b27eSBarry Smith
2661e07b27eSBarry Smith /* generate scatter */
2679566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * Pl * 3, fine_indices, PETSC_USE_POINTER, &is_fine));
2689566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * Pl * 3, 0, 1, &is_local));
2691e07b27eSBarry Smith
2701e07b27eSBarry Smith /* scatter */
2719566063dSJacob Faibussowitsch PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors));
2729566063dSJacob Faibussowitsch PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * Pl * 3));
2739566063dSJacob Faibussowitsch PetscCall(VecSetType(perm_coors, VECSEQ));
2749566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx));
2759566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
2769566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
2771e07b27eSBarry Smith
2781e07b27eSBarry Smith /* access */
27957f12427SDave May if (PCTelescope_isActiveRank(sred)) {
2801e07b27eSBarry Smith Vec _coors;
2811e07b27eSBarry Smith const PetscScalar *LA_perm;
2821e07b27eSBarry Smith PetscScalar *LA_coors;
2831e07b27eSBarry Smith
2849566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors));
2859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(perm_coors, &LA_perm));
2869566063dSJacob Faibussowitsch PetscCall(VecGetArray(_coors, &LA_coors));
287ad540459SPierre Jolivet for (i = 0; i < Ml * Nl * Pl * 3; i++) LA_coors[i] = LA_perm[i];
2889566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(_coors, &LA_coors));
2899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm));
2901e07b27eSBarry Smith }
2911e07b27eSBarry Smith
2921e07b27eSBarry Smith /* update local coords */
29357f12427SDave May if (PCTelescope_isActiveRank(sred)) {
2941e07b27eSBarry Smith DM _dmc;
2951e07b27eSBarry Smith Vec _coors, _coors_local;
2961e07b27eSBarry Smith
2979566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(subdm, &_dmc));
2989566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors));
2999566063dSJacob Faibussowitsch PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local));
3009566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local));
3019566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local));
3021e07b27eSBarry Smith }
3031e07b27eSBarry Smith
3049566063dSJacob Faibussowitsch PetscCall(VecScatterDestroy(&sctx));
3059566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_fine));
3069566063dSJacob Faibussowitsch PetscCall(PetscFree(fine_indices));
3079566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_local));
3089566063dSJacob Faibussowitsch PetscCall(VecDestroy(&perm_coors));
3099566063dSJacob Faibussowitsch PetscCall(VecDestroy(&coor_natural));
3103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
3111e07b27eSBarry Smith }
3121e07b27eSBarry Smith
PCTelescopeSetUp_dmda_repart_coors(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx * ctx)313d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
314d71ae5a4SJacob Faibussowitsch {
3151e07b27eSBarry Smith PetscInt dim;
3161e07b27eSBarry Smith DM dm, subdm;
3171e07b27eSBarry Smith PetscSubcomm psubcomm;
3181e07b27eSBarry Smith MPI_Comm comm;
3191e07b27eSBarry Smith Vec coor;
3201e07b27eSBarry Smith
3211e07b27eSBarry Smith PetscFunctionBegin;
3229566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
3239566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor));
3243ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
3251e07b27eSBarry Smith psubcomm = sred->psubcomm;
3261e07b27eSBarry Smith comm = PetscSubcommParent(psubcomm);
3271e07b27eSBarry Smith subdm = ctx->dmrepart;
3281e07b27eSBarry Smith
3299566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the coordinates (DMDA)\n"));
3309566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
3311e07b27eSBarry Smith switch (dim) {
332d71ae5a4SJacob Faibussowitsch case 1:
333d71ae5a4SJacob Faibussowitsch SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided");
334d71ae5a4SJacob Faibussowitsch case 2:
335d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors2d(sred, dm, subdm));
336d71ae5a4SJacob Faibussowitsch break;
337d71ae5a4SJacob Faibussowitsch case 3:
338d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors3d(sred, dm, subdm));
339d71ae5a4SJacob Faibussowitsch break;
3401e07b27eSBarry Smith }
3413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
3421e07b27eSBarry Smith }
3431e07b27eSBarry Smith
3441e07b27eSBarry Smith /* setup repartitioned dm */
PCTelescopeSetUp_dmda_repart(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx * ctx)34566976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
346d71ae5a4SJacob Faibussowitsch {
3471e07b27eSBarry Smith DM dm;
3481e07b27eSBarry Smith PetscInt dim, nx, ny, nz, ndof, nsw, sum, k;
3491e07b27eSBarry Smith DMBoundaryType bx, by, bz;
3501e07b27eSBarry Smith DMDAStencilType stencil;
3511e07b27eSBarry Smith const PetscInt *_range_i_re;
3521e07b27eSBarry Smith const PetscInt *_range_j_re;
3531e07b27eSBarry Smith const PetscInt *_range_k_re;
3541e07b27eSBarry Smith DMDAInterpolationType itype;
3551e07b27eSBarry Smith PetscInt refine_x, refine_y, refine_z;
3561e07b27eSBarry Smith MPI_Comm comm, subcomm;
3571e07b27eSBarry Smith const char *prefix;
358835f2295SStefano Zampini PetscMPIInt ni;
3591e07b27eSBarry Smith
3601e07b27eSBarry Smith PetscFunctionBegin;
3611e07b27eSBarry Smith comm = PetscSubcommParent(sred->psubcomm);
3621e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm);
3639566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
3641e07b27eSBarry Smith
3659566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, &nsw, &bx, &by, &bz, &stencil));
3669566063dSJacob Faibussowitsch PetscCall(DMDAGetInterpolationType(dm, &itype));
3679566063dSJacob Faibussowitsch PetscCall(DMDAGetRefinementFactor(dm, &refine_x, &refine_y, &refine_z));
3681e07b27eSBarry Smith
3691e07b27eSBarry Smith ctx->dmrepart = NULL;
3701e07b27eSBarry Smith _range_i_re = _range_j_re = _range_k_re = NULL;
3711e07b27eSBarry Smith /* Create DMDA on the child communicator */
37257f12427SDave May if (PCTelescope_isActiveRank(sred)) {
3731e07b27eSBarry Smith switch (dim) {
3741e07b27eSBarry Smith case 1:
3759566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (1D)\n"));
3769566063dSJacob Faibussowitsch /* PetscCall(DMDACreate1d(subcomm,bx,nx,ndof,nsw,NULL,&ctx->dmrepart)); */
3771e07b27eSBarry Smith ny = nz = 1;
3781e07b27eSBarry Smith by = bz = DM_BOUNDARY_NONE;
3791e07b27eSBarry Smith break;
3801e07b27eSBarry Smith case 2:
3819566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (2D)\n"));
3829566063dSJacob Faibussowitsch /* PetscCall(DMDACreate2d(subcomm,bx,by,stencil,nx,ny, PETSC_DECIDE,PETSC_DECIDE,
3839566063dSJacob Faibussowitsch ndof,nsw, NULL,NULL,&ctx->dmrepart)); */
3841e07b27eSBarry Smith nz = 1;
3851e07b27eSBarry Smith bz = DM_BOUNDARY_NONE;
3861e07b27eSBarry Smith break;
3871e07b27eSBarry Smith case 3:
3889566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (3D)\n"));
3899566063dSJacob Faibussowitsch /* PetscCall(DMDACreate3d(subcomm,bx,by,bz,stencil,nx,ny,nz,
3909566063dSJacob Faibussowitsch PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,NULL,&ctx->dmrepart)); */
3911e07b27eSBarry Smith break;
3921e07b27eSBarry Smith }
3931e07b27eSBarry Smith /*
3941e07b27eSBarry Smith The API DMDACreate1d(), DMDACreate2d(), DMDACreate3d() does not allow us to set/append
3951e07b27eSBarry Smith a unique option prefix for the DM, thus I prefer to expose the contents of these API's here.
3961e07b27eSBarry Smith This allows users to control the partitioning of the subDM.
3971e07b27eSBarry Smith */
3989566063dSJacob Faibussowitsch PetscCall(DMDACreate(subcomm, &ctx->dmrepart));
3991e07b27eSBarry Smith /* Set unique option prefix name */
4009566063dSJacob Faibussowitsch PetscCall(KSPGetOptionsPrefix(sred->ksp, &prefix));
4019566063dSJacob Faibussowitsch PetscCall(DMSetOptionsPrefix(ctx->dmrepart, prefix));
4029566063dSJacob Faibussowitsch PetscCall(DMAppendOptionsPrefix(ctx->dmrepart, "repart_"));
4031e07b27eSBarry Smith /* standard setup from DMDACreate{1,2,3}d() */
4049566063dSJacob Faibussowitsch PetscCall(DMSetDimension(ctx->dmrepart, dim));
4059566063dSJacob Faibussowitsch PetscCall(DMDASetSizes(ctx->dmrepart, nx, ny, nz));
4069566063dSJacob Faibussowitsch PetscCall(DMDASetNumProcs(ctx->dmrepart, PETSC_DECIDE, PETSC_DECIDE, PETSC_DECIDE));
4079566063dSJacob Faibussowitsch PetscCall(DMDASetBoundaryType(ctx->dmrepart, bx, by, bz));
4089566063dSJacob Faibussowitsch PetscCall(DMDASetDof(ctx->dmrepart, ndof));
4099566063dSJacob Faibussowitsch PetscCall(DMDASetStencilType(ctx->dmrepart, stencil));
4109566063dSJacob Faibussowitsch PetscCall(DMDASetStencilWidth(ctx->dmrepart, nsw));
4119566063dSJacob Faibussowitsch PetscCall(DMDASetOwnershipRanges(ctx->dmrepart, NULL, NULL, NULL));
4129566063dSJacob Faibussowitsch PetscCall(DMSetFromOptions(ctx->dmrepart));
4139566063dSJacob Faibussowitsch PetscCall(DMSetUp(ctx->dmrepart));
4141e07b27eSBarry Smith /* Set refinement factors and interpolation type from the partent */
4159566063dSJacob Faibussowitsch PetscCall(DMDASetRefinementFactor(ctx->dmrepart, refine_x, refine_y, refine_z));
4169566063dSJacob Faibussowitsch PetscCall(DMDASetInterpolationType(ctx->dmrepart, itype));
4171e07b27eSBarry Smith
4189566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(ctx->dmrepart, NULL, NULL, NULL, NULL, &ctx->Mp_re, &ctx->Np_re, &ctx->Pp_re, NULL, NULL, NULL, NULL, NULL, NULL));
4199566063dSJacob Faibussowitsch PetscCall(DMDAGetOwnershipRanges(ctx->dmrepart, &_range_i_re, &_range_j_re, &_range_k_re));
4205e897e82SDave May
4215e897e82SDave May ctx->dmrepart->ops->creatematrix = dm->ops->creatematrix;
4225e897e82SDave May ctx->dmrepart->ops->createdomaindecomposition = dm->ops->createdomaindecomposition;
4231e07b27eSBarry Smith }
4241e07b27eSBarry Smith
4251e07b27eSBarry Smith /* generate ranges for repartitioned dm */
4261e07b27eSBarry Smith /* note - assume rank 0 always participates */
427071fcb05SBarry Smith /* TODO: use a single MPI call */
4289566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Mp_re, 1, MPIU_INT, 0, comm));
4299566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Np_re, 1, MPIU_INT, 0, comm));
4309566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Pp_re, 1, MPIU_INT, 0, comm));
4311e07b27eSBarry Smith
4329566063dSJacob Faibussowitsch PetscCall(PetscCalloc3(ctx->Mp_re, &ctx->range_i_re, ctx->Np_re, &ctx->range_j_re, ctx->Pp_re, &ctx->range_k_re));
4331e07b27eSBarry Smith
4349566063dSJacob Faibussowitsch if (_range_i_re) PetscCall(PetscArraycpy(ctx->range_i_re, _range_i_re, ctx->Mp_re));
4359566063dSJacob Faibussowitsch if (_range_j_re) PetscCall(PetscArraycpy(ctx->range_j_re, _range_j_re, ctx->Np_re));
4369566063dSJacob Faibussowitsch if (_range_k_re) PetscCall(PetscArraycpy(ctx->range_k_re, _range_k_re, ctx->Pp_re));
4371e07b27eSBarry Smith
438071fcb05SBarry Smith /* TODO: use a single MPI call */
439835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Mp_re, &ni));
440835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_i_re, ni, MPIU_INT, 0, comm));
441835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Np_re, &ni));
442835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_j_re, ni, MPIU_INT, 0, comm));
443835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Pp_re, &ni));
444835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_k_re, ni, MPIU_INT, 0, comm));
4451e07b27eSBarry Smith
4469566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(ctx->Mp_re, &ctx->start_i_re, ctx->Np_re, &ctx->start_j_re, ctx->Pp_re, &ctx->start_k_re));
4471e07b27eSBarry Smith
4481e07b27eSBarry Smith sum = 0;
4491e07b27eSBarry Smith for (k = 0; k < ctx->Mp_re; k++) {
4501e07b27eSBarry Smith ctx->start_i_re[k] = sum;
4511e07b27eSBarry Smith sum += ctx->range_i_re[k];
4521e07b27eSBarry Smith }
4531e07b27eSBarry Smith
4541e07b27eSBarry Smith sum = 0;
4551e07b27eSBarry Smith for (k = 0; k < ctx->Np_re; k++) {
4561e07b27eSBarry Smith ctx->start_j_re[k] = sum;
4571e07b27eSBarry Smith sum += ctx->range_j_re[k];
4581e07b27eSBarry Smith }
4591e07b27eSBarry Smith
4601e07b27eSBarry Smith sum = 0;
4611e07b27eSBarry Smith for (k = 0; k < ctx->Pp_re; k++) {
4621e07b27eSBarry Smith ctx->start_k_re[k] = sum;
4631e07b27eSBarry Smith sum += ctx->range_k_re[k];
4641e07b27eSBarry Smith }
4651e07b27eSBarry Smith
466ba1c3560SDave May /* attach repartitioned dm to child ksp */
467ba1c3560SDave May {
468ba1c3560SDave May PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *);
469ba1c3560SDave May void *dmksp_ctx;
470ba1c3560SDave May
4719566063dSJacob Faibussowitsch PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx));
472ba1c3560SDave May
4731e07b27eSBarry Smith /* attach dm to ksp on sub communicator */
47457f12427SDave May if (PCTelescope_isActiveRank(sred)) {
4759566063dSJacob Faibussowitsch PetscCall(KSPSetDM(sred->ksp, ctx->dmrepart));
476ba1c3560SDave May
477c5db1f53SDave May if (!dmksp_func || sred->ignore_kspcomputeoperators) {
478*bf0c7fc2SBarry Smith PetscCall(KSPSetDMActive(sred->ksp, KSP_DMACTIVE_ALL, PETSC_FALSE));
479ba1c3560SDave May } else {
480ba1c3560SDave May /* sub ksp inherits dmksp_func and context provided by user */
4819566063dSJacob Faibussowitsch PetscCall(KSPSetComputeOperators(sred->ksp, dmksp_func, dmksp_ctx));
482*bf0c7fc2SBarry Smith PetscCall(KSPSetDMActive(sred->ksp, KSP_DMACTIVE_ALL, PETSC_TRUE));
483ba1c3560SDave May }
484ba1c3560SDave May }
4851e07b27eSBarry Smith }
4863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
4871e07b27eSBarry Smith }
4881e07b27eSBarry Smith
PCTelescopeSetUp_dmda_permutation_3d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx * ctx)48966976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_3d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
490d71ae5a4SJacob Faibussowitsch {
4911e07b27eSBarry Smith DM dm;
4921e07b27eSBarry Smith MPI_Comm comm;
4931e07b27eSBarry Smith Mat Pscalar, P;
4941e07b27eSBarry Smith PetscInt ndof;
4951e07b27eSBarry Smith PetscInt i, j, k, location, startI[3], endI[3], lenI[3], nx, ny, nz;
4961e07b27eSBarry Smith PetscInt sr, er, Mr;
4971e07b27eSBarry Smith Vec V;
4981e07b27eSBarry Smith
4991e07b27eSBarry Smith PetscFunctionBegin;
5009566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-3D)\n"));
5019566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
5021e07b27eSBarry Smith
5039566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
5049566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL));
5051e07b27eSBarry Smith
5069566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(dm, &V));
5079566063dSJacob Faibussowitsch PetscCall(VecGetSize(V, &Mr));
5089566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(V, &sr, &er));
5099566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(dm, &V));
5101e07b27eSBarry Smith sr = sr / ndof;
5111e07b27eSBarry Smith er = er / ndof;
5121e07b27eSBarry Smith Mr = Mr / ndof;
5131e07b27eSBarry Smith
5149566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &Pscalar));
51557508eceSPierre Jolivet PetscCall(MatSetSizes(Pscalar, er - sr, er - sr, Mr, Mr));
5169566063dSJacob Faibussowitsch PetscCall(MatSetType(Pscalar, MATAIJ));
5179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL));
5189566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL));
5191e07b27eSBarry Smith
5209566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], &lenI[2]));
5219566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], &startI[2], &endI[0], &endI[1], &endI[2]));
5221e07b27eSBarry Smith endI[0] += startI[0];
5231e07b27eSBarry Smith endI[1] += startI[1];
5241e07b27eSBarry Smith endI[2] += startI[2];
5251e07b27eSBarry Smith
5261e07b27eSBarry Smith for (k = startI[2]; k < endI[2]; k++) {
5271e07b27eSBarry Smith for (j = startI[1]; j < endI[1]; j++) {
5281e07b27eSBarry Smith for (i = startI[0]; i < endI[0]; i++) {
5291e07b27eSBarry Smith PetscMPIInt rank_ijk_re, rank_reI[3];
5301e07b27eSBarry Smith PetscInt s0_re;
531c6a0d831SBarry Smith PetscInt ii, jj, kk, local_ijk_re, mapped_ijk;
5321e07b27eSBarry Smith PetscInt lenI_re[3];
5331e07b27eSBarry Smith
5341e07b27eSBarry Smith location = (i - startI[0]) + (j - startI[1]) * lenI[0] + (k - startI[2]) * lenI[0] * lenI[1];
5359371c9d4SSatish Balay PetscCall(_DMDADetermineRankFromGlobalIJK(3, i, j, k, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], &rank_reI[2], &rank_ijk_re));
5369566063dSJacob Faibussowitsch PetscCall(_DMDADetermineGlobalS0(3, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re));
5371e07b27eSBarry Smith ii = i - ctx->start_i_re[rank_reI[0]];
53808401ef6SPierre Jolivet PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error ii");
5391e07b27eSBarry Smith jj = j - ctx->start_j_re[rank_reI[1]];
54008401ef6SPierre Jolivet PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error jj");
5411e07b27eSBarry Smith kk = k - ctx->start_k_re[rank_reI[2]];
54208401ef6SPierre Jolivet PetscCheck(kk >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error kk");
5431e07b27eSBarry Smith lenI_re[0] = ctx->range_i_re[rank_reI[0]];
5441e07b27eSBarry Smith lenI_re[1] = ctx->range_j_re[rank_reI[1]];
5451e07b27eSBarry Smith lenI_re[2] = ctx->range_k_re[rank_reI[2]];
5461e07b27eSBarry Smith local_ijk_re = ii + jj * lenI_re[0] + kk * lenI_re[0] * lenI_re[1];
5471e07b27eSBarry Smith mapped_ijk = s0_re + local_ijk_re;
5489566063dSJacob Faibussowitsch PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES));
5491e07b27eSBarry Smith }
5501e07b27eSBarry Smith }
5511e07b27eSBarry Smith }
5529566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY));
5539566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY));
5549566063dSJacob Faibussowitsch PetscCall(MatCreateMAIJ(Pscalar, ndof, &P));
5559566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Pscalar));
5561e07b27eSBarry Smith ctx->permutation = P;
5573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
5581e07b27eSBarry Smith }
5591e07b27eSBarry Smith
PCTelescopeSetUp_dmda_permutation_2d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx * ctx)56066976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_2d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
561d71ae5a4SJacob Faibussowitsch {
5621e07b27eSBarry Smith DM dm;
5631e07b27eSBarry Smith MPI_Comm comm;
5641e07b27eSBarry Smith Mat Pscalar, P;
5651e07b27eSBarry Smith PetscInt ndof;
5661e07b27eSBarry Smith PetscInt i, j, location, startI[2], endI[2], lenI[2], nx, ny, nz;
5671e07b27eSBarry Smith PetscInt sr, er, Mr;
5681e07b27eSBarry Smith Vec V;
5691e07b27eSBarry Smith
5701e07b27eSBarry Smith PetscFunctionBegin;
5719566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-2D)\n"));
5729566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
5739566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
5749566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL));
5759566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(dm, &V));
5769566063dSJacob Faibussowitsch PetscCall(VecGetSize(V, &Mr));
5779566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(V, &sr, &er));
5789566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(dm, &V));
5791e07b27eSBarry Smith sr = sr / ndof;
5801e07b27eSBarry Smith er = er / ndof;
5811e07b27eSBarry Smith Mr = Mr / ndof;
5821e07b27eSBarry Smith
5839566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &Pscalar));
58457508eceSPierre Jolivet PetscCall(MatSetSizes(Pscalar, er - sr, er - sr, Mr, Mr));
5859566063dSJacob Faibussowitsch PetscCall(MatSetType(Pscalar, MATAIJ));
5869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL));
5879566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL));
5881e07b27eSBarry Smith
5899566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], NULL));
5909566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], NULL, &endI[0], &endI[1], NULL));
5911e07b27eSBarry Smith endI[0] += startI[0];
5921e07b27eSBarry Smith endI[1] += startI[1];
5931e07b27eSBarry Smith
5941e07b27eSBarry Smith for (j = startI[1]; j < endI[1]; j++) {
5951e07b27eSBarry Smith for (i = startI[0]; i < endI[0]; i++) {
5961e07b27eSBarry Smith PetscMPIInt rank_ijk_re, rank_reI[3];
5971e07b27eSBarry Smith PetscInt s0_re;
598c6a0d831SBarry Smith PetscInt ii, jj, local_ijk_re, mapped_ijk;
5991e07b27eSBarry Smith PetscInt lenI_re[3];
6001e07b27eSBarry Smith
6011e07b27eSBarry Smith location = (i - startI[0]) + (j - startI[1]) * lenI[0];
6029371c9d4SSatish Balay PetscCall(_DMDADetermineRankFromGlobalIJK(2, i, j, 0, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], NULL, &rank_ijk_re));
6031e07b27eSBarry Smith
6049566063dSJacob Faibussowitsch PetscCall(_DMDADetermineGlobalS0(2, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re));
6051e07b27eSBarry Smith
6061e07b27eSBarry Smith ii = i - ctx->start_i_re[rank_reI[0]];
60708401ef6SPierre Jolivet PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error ii");
6081e07b27eSBarry Smith jj = j - ctx->start_j_re[rank_reI[1]];
60908401ef6SPierre Jolivet PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error jj");
6101e07b27eSBarry Smith
6111e07b27eSBarry Smith lenI_re[0] = ctx->range_i_re[rank_reI[0]];
6121e07b27eSBarry Smith lenI_re[1] = ctx->range_j_re[rank_reI[1]];
6131e07b27eSBarry Smith local_ijk_re = ii + jj * lenI_re[0];
6141e07b27eSBarry Smith mapped_ijk = s0_re + local_ijk_re;
6159566063dSJacob Faibussowitsch PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES));
6161e07b27eSBarry Smith }
6171e07b27eSBarry Smith }
6189566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY));
6199566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY));
6209566063dSJacob Faibussowitsch PetscCall(MatCreateMAIJ(Pscalar, ndof, &P));
6219566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Pscalar));
6221e07b27eSBarry Smith ctx->permutation = P;
6233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
6241e07b27eSBarry Smith }
6251e07b27eSBarry Smith
PCTelescopeSetUp_dmda_scatters(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx * ctx)62666976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_scatters(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
627d71ae5a4SJacob Faibussowitsch {
6281e07b27eSBarry Smith Vec xred, yred, xtmp, x, xp;
6291e07b27eSBarry Smith VecScatter scatter;
6301e07b27eSBarry Smith IS isin;
6311e07b27eSBarry Smith Mat B;
6321e07b27eSBarry Smith PetscInt m, bs, st, ed;
6331e07b27eSBarry Smith MPI_Comm comm;
6341e07b27eSBarry Smith
6351e07b27eSBarry Smith PetscFunctionBegin;
6369566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
6379566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B));
6389566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(B, &x, NULL));
6399566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(B, &bs));
6409566063dSJacob Faibussowitsch PetscCall(VecDuplicate(x, &xp));
6413ac26c5eSBarry Smith m = 0;
6421e07b27eSBarry Smith xred = NULL;
6431e07b27eSBarry Smith yred = NULL;
64457f12427SDave May if (PCTelescope_isActiveRank(sred)) {
6459566063dSJacob Faibussowitsch PetscCall(DMCreateGlobalVector(ctx->dmrepart, &xred));
6469566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xred, &yred));
6479566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(xred, &st, &ed));
6489566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, ed - st, st, 1, &isin));
6499566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(xred, &m));
6501e07b27eSBarry Smith } else {
6519566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(x, &st, &ed));
6529566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, 0, st, 1, &isin));
6531e07b27eSBarry Smith }
6549566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isin, bs));
6559566063dSJacob Faibussowitsch PetscCall(VecCreate(comm, &xtmp));
6569566063dSJacob Faibussowitsch PetscCall(VecSetSizes(xtmp, m, PETSC_DECIDE));
6579566063dSJacob Faibussowitsch PetscCall(VecSetBlockSize(xtmp, bs));
6589566063dSJacob Faibussowitsch PetscCall(VecSetType(xtmp, ((PetscObject)x)->type_name));
6599566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(x, isin, xtmp, NULL, &scatter));
6601e07b27eSBarry Smith sred->xred = xred;
6611e07b27eSBarry Smith sred->yred = yred;
6621e07b27eSBarry Smith sred->isin = isin;
6631e07b27eSBarry Smith sred->scatter = scatter;
6641e07b27eSBarry Smith sred->xtmp = xtmp;
6651e07b27eSBarry Smith
6661e07b27eSBarry Smith ctx->xp = xp;
6679566063dSJacob Faibussowitsch PetscCall(VecDestroy(&x));
6683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
6691e07b27eSBarry Smith }
6701e07b27eSBarry Smith
PCTelescopeSetUp_dmda(PC pc,PC_Telescope sred)671d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeSetUp_dmda(PC pc, PC_Telescope sred)
672d71ae5a4SJacob Faibussowitsch {
6731e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx;
6741e07b27eSBarry Smith PetscInt dim;
6751e07b27eSBarry Smith DM dm;
6761e07b27eSBarry Smith MPI_Comm comm;
6771e07b27eSBarry Smith
6781e07b27eSBarry Smith PetscFunctionBegin;
6799566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setup (DMDA)\n"));
6809566063dSJacob Faibussowitsch PetscCall(PetscNew(&ctx));
6811e07b27eSBarry Smith sred->dm_ctx = (void *)ctx;
6821e07b27eSBarry Smith
6839566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
6849566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
6859566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
6861e07b27eSBarry Smith
6873ba16761SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart(pc, sred, ctx));
6883ba16761SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors(pc, sred, ctx));
6891e07b27eSBarry Smith switch (dim) {
690d71ae5a4SJacob Faibussowitsch case 1:
691d71ae5a4SJacob Faibussowitsch SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided");
692d71ae5a4SJacob Faibussowitsch case 2:
693d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_permutation_2d(pc, sred, ctx));
694d71ae5a4SJacob Faibussowitsch break;
695d71ae5a4SJacob Faibussowitsch case 3:
696d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_permutation_3d(pc, sred, ctx));
697d71ae5a4SJacob Faibussowitsch break;
6981e07b27eSBarry Smith }
6999566063dSJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_scatters(pc, sred, ctx));
7003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
7011e07b27eSBarry Smith }
7021e07b27eSBarry Smith
PCTelescopeMatCreate_dmda_dmactivefalse(PC pc,PC_Telescope sred,MatReuse reuse,Mat * A)70366976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeMatCreate_dmda_dmactivefalse(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A)
704d71ae5a4SJacob Faibussowitsch {
7051e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx;
7061e07b27eSBarry Smith MPI_Comm comm, subcomm;
7071e07b27eSBarry Smith Mat Bperm, Bred, B, P;
7081e07b27eSBarry Smith PetscInt nr, nc;
7091e07b27eSBarry Smith IS isrow, iscol;
7101e07b27eSBarry Smith Mat Blocal, *_Blocal;
7111e07b27eSBarry Smith
7121e07b27eSBarry Smith PetscFunctionBegin;
7139566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: updating the redundant preconditioned operator (DMDA)\n"));
7149566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
7151e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm);
7161e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
7171e07b27eSBarry Smith
7189566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B));
7199566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &nr, &nc));
7201e07b27eSBarry Smith
7211e07b27eSBarry Smith P = ctx->permutation;
7229566063dSJacob Faibussowitsch PetscCall(MatPtAP(B, P, MAT_INITIAL_MATRIX, 1.1, &Bperm));
7231e07b27eSBarry Smith
7241e07b27eSBarry Smith /* Get submatrices */
7251e07b27eSBarry Smith isrow = sred->isin;
7269566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, nc, 0, 1, &iscol));
7271e07b27eSBarry Smith
7289566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(Bperm, 1, &isrow, &iscol, MAT_INITIAL_MATRIX, &_Blocal));
7291e07b27eSBarry Smith Blocal = *_Blocal;
7301e07b27eSBarry Smith Bred = NULL;
73157f12427SDave May if (PCTelescope_isActiveRank(sred)) {
7321e07b27eSBarry Smith PetscInt mm;
7331e07b27eSBarry Smith
734ad540459SPierre Jolivet if (reuse != MAT_INITIAL_MATRIX) Bred = *A;
7359566063dSJacob Faibussowitsch PetscCall(MatGetSize(Blocal, &mm, NULL));
7369566063dSJacob Faibussowitsch /* PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,PETSC_DECIDE,reuse,&Bred)); */
7379566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm, Blocal, mm, reuse, &Bred));
7381e07b27eSBarry Smith }
7391e07b27eSBarry Smith *A = Bred;
7401e07b27eSBarry Smith
7419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&iscol));
7429566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Bperm));
7439566063dSJacob Faibussowitsch PetscCall(MatDestroyMatrices(1, &_Blocal));
7443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
7451e07b27eSBarry Smith }
7461e07b27eSBarry Smith
PCTelescopeMatCreate_dmda(PC pc,PC_Telescope sred,MatReuse reuse,Mat * A)747d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatCreate_dmda(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A)
748d71ae5a4SJacob Faibussowitsch {
749ba1c3560SDave May DM dm;
750ba1c3560SDave May PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *);
751ba1c3560SDave May void *dmksp_ctx;
752ba1c3560SDave May
753ba1c3560SDave May PetscFunctionBegin;
7549566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm));
7559566063dSJacob Faibussowitsch PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx));
756dc9ee9fdSDave May /* We assume that dmksp_func = NULL, is equivalent to dmActive = PETSC_FALSE */
7577c5279cbSDave May if (dmksp_func && !sred->ignore_kspcomputeoperators) {
758ba1c3560SDave May DM dmrepart;
75928323a89SDave May Mat Ak;
760ba1c3560SDave May
761ba1c3560SDave May *A = NULL;
76257f12427SDave May if (PCTelescope_isActiveRank(sred)) {
7639566063dSJacob Faibussowitsch PetscCall(KSPGetDM(sred->ksp, &dmrepart));
764ba1c3560SDave May if (reuse == MAT_INITIAL_MATRIX) {
7659566063dSJacob Faibussowitsch PetscCall(DMCreateMatrix(dmrepart, &Ak));
766ba1c3560SDave May *A = Ak;
767ba1c3560SDave May } else if (reuse == MAT_REUSE_MATRIX) {
768ba1c3560SDave May Ak = *A;
769ba1c3560SDave May }
7705c5dbb1cSDave May /*
7715c5dbb1cSDave May There is no need to explicitly assemble the operator now,
7725c5dbb1cSDave May the sub-KSP will call the method provided to KSPSetComputeOperators() during KSPSetUp()
7735c5dbb1cSDave May */
774ba1c3560SDave May }
775ba1c3560SDave May } else {
7769566063dSJacob Faibussowitsch PetscCall(PCTelescopeMatCreate_dmda_dmactivefalse(pc, sred, reuse, A));
777ba1c3560SDave May }
7783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
779ba1c3560SDave May }
780ba1c3560SDave May
PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc,PC_Telescope sred,MatNullSpace nullspace,MatNullSpace * sub_nullspace)78166976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc, PC_Telescope sred, MatNullSpace nullspace, MatNullSpace *sub_nullspace)
782d71ae5a4SJacob Faibussowitsch {
7831e07b27eSBarry Smith PetscBool has_const;
784a947c41eSDave May PetscInt i, k, n = 0;
7851e07b27eSBarry Smith const Vec *vecs;
786c41e779fSDave May Vec *sub_vecs = NULL;
7871e07b27eSBarry Smith MPI_Comm subcomm;
7881e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx;
7891e07b27eSBarry Smith
7901e07b27eSBarry Smith PetscFunctionBegin;
7911e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
7921e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm);
7939566063dSJacob Faibussowitsch PetscCall(MatNullSpaceGetVecs(nullspace, &has_const, &n, &vecs));
7941e07b27eSBarry Smith
79557f12427SDave May if (PCTelescope_isActiveRank(sred)) {
7961e07b27eSBarry Smith /* create new vectors */
79748a46eb9SPierre Jolivet if (n) PetscCall(VecDuplicateVecs(sred->xred, n, &sub_vecs));
7981e07b27eSBarry Smith }
7991e07b27eSBarry Smith
8001e07b27eSBarry Smith /* copy entries */
8011e07b27eSBarry Smith for (k = 0; k < n; k++) {
8021e07b27eSBarry Smith const PetscScalar *x_array;
8031e07b27eSBarry Smith PetscScalar *LA_sub_vec;
80413c30530SDave May PetscInt st, ed;
8051e07b27eSBarry Smith
8061e07b27eSBarry Smith /* permute vector into ordering associated with re-partitioned dmda */
8079566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(ctx->permutation, vecs[k], ctx->xp));
8081e07b27eSBarry Smith
8091e07b27eSBarry Smith /* pull in vector x->xtmp */
8109566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD));
8119566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD));
8121e07b27eSBarry Smith
813392968a1SPatrick Sanan /* copy vector entries into xred */
8149566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(sred->xtmp, &x_array));
815ea2b237eSDave May if (sub_vecs) {
816ea2b237eSDave May if (sub_vecs[k]) {
8179566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(sub_vecs[k], &st, &ed));
8189566063dSJacob Faibussowitsch PetscCall(VecGetArray(sub_vecs[k], &LA_sub_vec));
819ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_sub_vec[i] = x_array[i];
8209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(sub_vecs[k], &LA_sub_vec));
8211e07b27eSBarry Smith }
822ea2b237eSDave May }
8239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(sred->xtmp, &x_array));
8241e07b27eSBarry Smith }
8251e07b27eSBarry Smith
82657f12427SDave May if (PCTelescope_isActiveRank(sred)) {
827d8b9d5b7SPatrick Sanan /* create new (near) nullspace for redundant object */
8289566063dSJacob Faibussowitsch PetscCall(MatNullSpaceCreate(subcomm, has_const, n, sub_vecs, sub_nullspace));
8299566063dSJacob Faibussowitsch PetscCall(VecDestroyVecs(n, &sub_vecs));
83028b400f6SJacob Faibussowitsch PetscCheck(!nullspace->remove, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope");
83128b400f6SJacob Faibussowitsch PetscCheck(!nullspace->rmctx, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope");
832d8b9d5b7SPatrick Sanan }
8333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
834392968a1SPatrick Sanan }
835392968a1SPatrick Sanan
PCTelescopeMatNullSpaceCreate_dmda(PC pc,PC_Telescope sred,Mat sub_mat)836d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatNullSpaceCreate_dmda(PC pc, PC_Telescope sred, Mat sub_mat)
837d71ae5a4SJacob Faibussowitsch {
838392968a1SPatrick Sanan Mat B;
839392968a1SPatrick Sanan
840392968a1SPatrick Sanan PetscFunctionBegin;
8419566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B));
842392968a1SPatrick Sanan {
843392968a1SPatrick Sanan MatNullSpace nullspace, sub_nullspace;
8449566063dSJacob Faibussowitsch PetscCall(MatGetNullSpace(B, &nullspace));
845392968a1SPatrick Sanan if (nullspace) {
8469566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: generating nullspace (DMDA)\n"));
8479566063dSJacob Faibussowitsch PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nullspace, &sub_nullspace));
84857f12427SDave May if (PCTelescope_isActiveRank(sred)) {
8499566063dSJacob Faibussowitsch PetscCall(MatSetNullSpace(sub_mat, sub_nullspace));
8509566063dSJacob Faibussowitsch PetscCall(MatNullSpaceDestroy(&sub_nullspace));
8511e07b27eSBarry Smith }
852392968a1SPatrick Sanan }
853392968a1SPatrick Sanan }
854392968a1SPatrick Sanan {
855392968a1SPatrick Sanan MatNullSpace nearnullspace, sub_nearnullspace;
8569566063dSJacob Faibussowitsch PetscCall(MatGetNearNullSpace(B, &nearnullspace));
857392968a1SPatrick Sanan if (nearnullspace) {
8589566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: generating near nullspace (DMDA)\n"));
8599566063dSJacob Faibussowitsch PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nearnullspace, &sub_nearnullspace));
86057f12427SDave May if (PCTelescope_isActiveRank(sred)) {
8619566063dSJacob Faibussowitsch PetscCall(MatSetNearNullSpace(sub_mat, sub_nearnullspace));
8629566063dSJacob Faibussowitsch PetscCall(MatNullSpaceDestroy(&sub_nearnullspace));
863392968a1SPatrick Sanan }
864392968a1SPatrick Sanan }
865392968a1SPatrick Sanan }
8663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
8671e07b27eSBarry Smith }
8681e07b27eSBarry Smith
PCApply_Telescope_dmda(PC pc,Vec x,Vec y)869d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApply_Telescope_dmda(PC pc, Vec x, Vec y)
870d71ae5a4SJacob Faibussowitsch {
8711e07b27eSBarry Smith PC_Telescope sred = (PC_Telescope)pc->data;
8721e07b27eSBarry Smith Mat perm;
8731e07b27eSBarry Smith Vec xtmp, xp, xred, yred;
87413c30530SDave May PetscInt i, st, ed;
8751e07b27eSBarry Smith VecScatter scatter;
8761e07b27eSBarry Smith PetscScalar *array;
8771e07b27eSBarry Smith const PetscScalar *x_array;
8781e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx;
8791e07b27eSBarry Smith
8801e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
8811e07b27eSBarry Smith xtmp = sred->xtmp;
8821e07b27eSBarry Smith scatter = sred->scatter;
8831e07b27eSBarry Smith xred = sred->xred;
8841e07b27eSBarry Smith yred = sred->yred;
8851e07b27eSBarry Smith perm = ctx->permutation;
8861e07b27eSBarry Smith xp = ctx->xp;
8871e07b27eSBarry Smith
8881e07b27eSBarry Smith PetscFunctionBegin;
8899566063dSJacob Faibussowitsch PetscCall(PetscCitationsRegister(citation, &cited));
89014c9fce5SDave May
8911e07b27eSBarry Smith /* permute vector into ordering associated with re-partitioned dmda */
8929566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(perm, x, xp));
8931e07b27eSBarry Smith
8941e07b27eSBarry Smith /* pull in vector x->xtmp */
8959566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
8969566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
8971e07b27eSBarry Smith
898a5b23f4aSJose E. Roman /* copy vector entries into xred */
8999566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xtmp, &x_array));
9001e07b27eSBarry Smith if (xred) {
9011e07b27eSBarry Smith PetscScalar *LA_xred;
9029566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(xred, &st, &ed));
9031e07b27eSBarry Smith
9049566063dSJacob Faibussowitsch PetscCall(VecGetArray(xred, &LA_xred));
905ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_xred[i] = x_array[i];
9069566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xred, &LA_xred));
9071e07b27eSBarry Smith }
9089566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xtmp, &x_array));
9091e07b27eSBarry Smith
9101e07b27eSBarry Smith /* solve */
91157f12427SDave May if (PCTelescope_isActiveRank(sred)) {
9129566063dSJacob Faibussowitsch PetscCall(KSPSolve(sred->ksp, xred, yred));
9139566063dSJacob Faibussowitsch PetscCall(KSPCheckSolve(sred->ksp, pc, yred));
9141e07b27eSBarry Smith }
9151e07b27eSBarry Smith
9161e07b27eSBarry Smith /* return vector */
9179566063dSJacob Faibussowitsch PetscCall(VecGetArray(xtmp, &array));
9181e07b27eSBarry Smith if (yred) {
9191e07b27eSBarry Smith const PetscScalar *LA_yred;
9209566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(yred, &st, &ed));
9219566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(yred, &LA_yred));
922ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) array[i] = LA_yred[i];
9239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(yred, &LA_yred));
9241e07b27eSBarry Smith }
9259566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xtmp, &array));
9269566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE));
9279566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE));
9289566063dSJacob Faibussowitsch PetscCall(MatMult(perm, xp, y));
9293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
9301e07b27eSBarry Smith }
9311e07b27eSBarry Smith
PCApplyRichardson_Telescope_dmda(PC pc,Vec x,Vec y,Vec w,PetscReal rtol,PetscReal abstol,PetscReal dtol,PetscInt its,PetscBool zeroguess,PetscInt * outits,PCRichardsonConvergedReason * reason)932d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApplyRichardson_Telescope_dmda(PC pc, Vec x, Vec y, Vec w, PetscReal rtol, PetscReal abstol, PetscReal dtol, PetscInt its, PetscBool zeroguess, PetscInt *outits, PCRichardsonConvergedReason *reason)
933d71ae5a4SJacob Faibussowitsch {
934f650675bSDave May PC_Telescope sred = (PC_Telescope)pc->data;
935f650675bSDave May Mat perm;
936a1d91a28SDave May Vec xtmp, xp, yred;
937f650675bSDave May PetscInt i, st, ed;
938f650675bSDave May VecScatter scatter;
939f650675bSDave May const PetscScalar *x_array;
940c41e779fSDave May PetscBool default_init_guess_value = PETSC_FALSE;
941f650675bSDave May PC_Telescope_DMDACtx *ctx;
942f650675bSDave May
94357f12427SDave May PetscFunctionBegin;
944f650675bSDave May ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
945f650675bSDave May xtmp = sred->xtmp;
946f650675bSDave May scatter = sred->scatter;
947f650675bSDave May yred = sred->yred;
948f650675bSDave May perm = ctx->permutation;
949f650675bSDave May xp = ctx->xp;
950f650675bSDave May
95108401ef6SPierre Jolivet PetscCheck(its <= 1, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "PCApplyRichardson_Telescope_dmda only supports max_it = 1");
952f650675bSDave May *reason = (PCRichardsonConvergedReason)0;
953f650675bSDave May
954f650675bSDave May if (!zeroguess) {
9559566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescopeDMDA: Scattering y for non-zero-initial guess\n"));
956f650675bSDave May /* permute vector into ordering associated with re-partitioned dmda */
9579566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(perm, y, xp));
958f650675bSDave May
959f650675bSDave May /* pull in vector x->xtmp */
9609566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
9619566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
962f650675bSDave May
963a5b23f4aSJose E. Roman /* copy vector entries into xred */
9649566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xtmp, &x_array));
965f650675bSDave May if (yred) {
966f650675bSDave May PetscScalar *LA_yred;
9679566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(yred, &st, &ed));
9689566063dSJacob Faibussowitsch PetscCall(VecGetArray(yred, &LA_yred));
969ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_yred[i] = x_array[i];
9709566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yred, &LA_yred));
971f650675bSDave May }
9729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xtmp, &x_array));
973f650675bSDave May }
974f650675bSDave May
97557f12427SDave May if (PCTelescope_isActiveRank(sred)) {
9769566063dSJacob Faibussowitsch PetscCall(KSPGetInitialGuessNonzero(sred->ksp, &default_init_guess_value));
9779566063dSJacob Faibussowitsch if (!zeroguess) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, PETSC_TRUE));
978f650675bSDave May }
979f650675bSDave May
9809566063dSJacob Faibussowitsch PetscCall(PCApply_Telescope_dmda(pc, x, y));
981f650675bSDave May
98248a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, default_init_guess_value));
983f650675bSDave May
984f650675bSDave May if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS;
985f650675bSDave May *outits = 1;
9863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
987f650675bSDave May }
988f650675bSDave May
PCReset_Telescope_dmda(PC pc)989d71ae5a4SJacob Faibussowitsch PetscErrorCode PCReset_Telescope_dmda(PC pc)
990d71ae5a4SJacob Faibussowitsch {
9911e07b27eSBarry Smith PC_Telescope sred = (PC_Telescope)pc->data;
9921e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx;
9931e07b27eSBarry Smith
9941e07b27eSBarry Smith PetscFunctionBegin;
9951e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
9969566063dSJacob Faibussowitsch PetscCall(VecDestroy(&ctx->xp));
9979566063dSJacob Faibussowitsch PetscCall(MatDestroy(&ctx->permutation));
9989566063dSJacob Faibussowitsch PetscCall(DMDestroy(&ctx->dmrepart));
9999566063dSJacob Faibussowitsch PetscCall(PetscFree3(ctx->range_i_re, ctx->range_j_re, ctx->range_k_re));
10009566063dSJacob Faibussowitsch PetscCall(PetscFree3(ctx->start_i_re, ctx->start_j_re, ctx->start_k_re));
10013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10021e07b27eSBarry Smith }
10031e07b27eSBarry Smith
DMView_DA_Short_3d(DM dm,PetscViewer v)100466976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_3d(DM dm, PetscViewer v)
1005d71ae5a4SJacob Faibussowitsch {
10061e07b27eSBarry Smith PetscInt M, N, P, m, n, p, ndof, nsw;
10071e07b27eSBarry Smith MPI_Comm comm;
10081e07b27eSBarry Smith PetscMPIInt size;
10091e07b27eSBarry Smith const char *prefix;
10101e07b27eSBarry Smith
10111e07b27eSBarry Smith PetscFunctionBegin;
10129566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)dm, &comm));
10139566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size));
10149566063dSJacob Faibussowitsch PetscCall(DMGetOptionsPrefix(dm, &prefix));
10159566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, &m, &n, &p, &ndof, &nsw, NULL, NULL, NULL, NULL));
10169566063dSJacob Faibussowitsch if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: (%s) %d MPI processes\n", prefix, size));
10179566063dSJacob Faibussowitsch else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: %d MPI processes\n", size));
101863a3b9bcSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(v, " M %" PetscInt_FMT " N %" PetscInt_FMT " P %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " p %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, P, m, n, p, ndof, nsw));
10193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10201e07b27eSBarry Smith }
10211e07b27eSBarry Smith
DMView_DA_Short_2d(DM dm,PetscViewer v)102266976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_2d(DM dm, PetscViewer v)
1023d71ae5a4SJacob Faibussowitsch {
10241e07b27eSBarry Smith PetscInt M, N, m, n, ndof, nsw;
10251e07b27eSBarry Smith MPI_Comm comm;
10261e07b27eSBarry Smith PetscMPIInt size;
10271e07b27eSBarry Smith const char *prefix;
10281e07b27eSBarry Smith
10291e07b27eSBarry Smith PetscFunctionBegin;
10309566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)dm, &comm));
10319566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size));
10329566063dSJacob Faibussowitsch PetscCall(DMGetOptionsPrefix(dm, &prefix));
10339566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, &m, &n, NULL, &ndof, &nsw, NULL, NULL, NULL, NULL));
10349566063dSJacob Faibussowitsch if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: (%s) %d MPI processes\n", prefix, size));
10359566063dSJacob Faibussowitsch else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: %d MPI processes\n", size));
103663a3b9bcSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(v, " M %" PetscInt_FMT " N %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, m, n, ndof, nsw));
10373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10381e07b27eSBarry Smith }
10391e07b27eSBarry Smith
DMView_DA_Short(DM dm,PetscViewer v)1040d71ae5a4SJacob Faibussowitsch PetscErrorCode DMView_DA_Short(DM dm, PetscViewer v)
1041d71ae5a4SJacob Faibussowitsch {
10421e07b27eSBarry Smith PetscInt dim;
10431e07b27eSBarry Smith
10441e07b27eSBarry Smith PetscFunctionBegin;
10459566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
10461e07b27eSBarry Smith switch (dim) {
1047d71ae5a4SJacob Faibussowitsch case 2:
1048d71ae5a4SJacob Faibussowitsch PetscCall(DMView_DA_Short_2d(dm, v));
1049d71ae5a4SJacob Faibussowitsch break;
1050d71ae5a4SJacob Faibussowitsch case 3:
1051d71ae5a4SJacob Faibussowitsch PetscCall(DMView_DA_Short_3d(dm, v));
1052d71ae5a4SJacob Faibussowitsch break;
10531e07b27eSBarry Smith }
10543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS);
10551e07b27eSBarry Smith }
1056