xref: /petsc/src/ksp/pc/impls/telescope/telescope_dmda.c (revision 66976f2f44dcc61d86a452a70219fb23b45d00f0)
11e07b27eSBarry Smith 
2120bdd93SDave May #include <petsc/private/matimpl.h>
31e07b27eSBarry Smith #include <petsc/private/pcimpl.h>
45e897e82SDave May #include <petsc/private/dmimpl.h>
51e07b27eSBarry Smith #include <petscksp.h> /*I "petscksp.h" I*/
61e07b27eSBarry Smith #include <petscdm.h>
71e07b27eSBarry Smith #include <petscdmda.h>
81e07b27eSBarry Smith 
9575a0592SBarry Smith #include "../src/ksp/pc/impls/telescope/telescope.h"
101e07b27eSBarry Smith 
11bf00f589SPatrick Sanan static PetscBool  cited      = PETSC_FALSE;
129371c9d4SSatish Balay static const char citation[] = "@inproceedings{MaySananRuppKnepleySmith2016,\n"
13bf00f589SPatrick Sanan                                "  title     = {Extreme-Scale Multigrid Components within PETSc},\n"
14bf00f589SPatrick Sanan                                "  author    = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n"
15bf00f589SPatrick Sanan                                "  booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n"
16bf00f589SPatrick Sanan                                "  series    = {PASC '16},\n"
17bf00f589SPatrick Sanan                                "  isbn      = {978-1-4503-4126-4},\n"
18bf00f589SPatrick Sanan                                "  location  = {Lausanne, Switzerland},\n"
19bf00f589SPatrick Sanan                                "  pages     = {5:1--5:12},\n"
20bf00f589SPatrick Sanan                                "  articleno = {5},\n"
21bf00f589SPatrick Sanan                                "  numpages  = {12},\n"
22a8d69d7bSBarry Smith                                "  url       = {https://doi.acm.org/10.1145/2929908.2929913},\n"
23bf00f589SPatrick Sanan                                "  doi       = {10.1145/2929908.2929913},\n"
24bf00f589SPatrick Sanan                                "  acmid     = {2929913},\n"
25bf00f589SPatrick Sanan                                "  publisher = {ACM},\n"
26bf00f589SPatrick Sanan                                "  address   = {New York, NY, USA},\n"
27bf00f589SPatrick Sanan                                "  keywords  = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n"
28bf00f589SPatrick Sanan                                "  year      = {2016}\n"
29bf00f589SPatrick Sanan                                "}\n";
30bf00f589SPatrick Sanan 
31d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineRankFromGlobalIJK(PetscInt dim, PetscInt i, PetscInt j, PetscInt k, PetscInt Mp, PetscInt Np, PetscInt Pp, PetscInt start_i[], PetscInt start_j[], PetscInt start_k[], PetscInt span_i[], PetscInt span_j[], PetscInt span_k[], PetscMPIInt *_pi, PetscMPIInt *_pj, PetscMPIInt *_pk, PetscMPIInt *rank_re)
32d71ae5a4SJacob Faibussowitsch {
331e07b27eSBarry Smith   PetscInt pi, pj, pk, n;
341e07b27eSBarry Smith 
351e07b27eSBarry Smith   PetscFunctionBegin;
36137d0469SJed Brown   *rank_re = -1;
37137d0469SJed Brown   if (_pi) *_pi = -1;
38137d0469SJed Brown   if (_pj) *_pj = -1;
39137d0469SJed Brown   if (_pk) *_pk = -1;
401e07b27eSBarry Smith   pi = pj = pk = -1;
411e07b27eSBarry Smith   if (_pi) {
421e07b27eSBarry Smith     for (n = 0; n < Mp; n++) {
431e07b27eSBarry Smith       if ((i >= start_i[n]) && (i < start_i[n] + span_i[n])) {
441e07b27eSBarry Smith         pi = n;
451e07b27eSBarry Smith         break;
461e07b27eSBarry Smith       }
471e07b27eSBarry Smith     }
4863a3b9bcSJacob Faibussowitsch     PetscCheck(pi != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pi cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Mp, i);
491e07b27eSBarry Smith     *_pi = pi;
501e07b27eSBarry Smith   }
511e07b27eSBarry Smith 
521e07b27eSBarry Smith   if (_pj) {
531e07b27eSBarry Smith     for (n = 0; n < Np; n++) {
541e07b27eSBarry Smith       if ((j >= start_j[n]) && (j < start_j[n] + span_j[n])) {
551e07b27eSBarry Smith         pj = n;
561e07b27eSBarry Smith         break;
571e07b27eSBarry Smith       }
581e07b27eSBarry Smith     }
5963a3b9bcSJacob Faibussowitsch     PetscCheck(pj != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pj cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Np, j);
601e07b27eSBarry Smith     *_pj = pj;
611e07b27eSBarry Smith   }
621e07b27eSBarry Smith 
631e07b27eSBarry Smith   if (_pk) {
641e07b27eSBarry Smith     for (n = 0; n < Pp; n++) {
651e07b27eSBarry Smith       if ((k >= start_k[n]) && (k < start_k[n] + span_k[n])) {
661e07b27eSBarry Smith         pk = n;
671e07b27eSBarry Smith         break;
681e07b27eSBarry Smith       }
691e07b27eSBarry Smith     }
7063a3b9bcSJacob Faibussowitsch     PetscCheck(pk != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pk cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Pp, k);
711e07b27eSBarry Smith     *_pk = pk;
721e07b27eSBarry Smith   }
731e07b27eSBarry Smith 
741e07b27eSBarry Smith   switch (dim) {
75d71ae5a4SJacob Faibussowitsch   case 1:
76d71ae5a4SJacob Faibussowitsch     *rank_re = pi;
77d71ae5a4SJacob Faibussowitsch     break;
78d71ae5a4SJacob Faibussowitsch   case 2:
79d71ae5a4SJacob Faibussowitsch     *rank_re = pi + pj * Mp;
80d71ae5a4SJacob Faibussowitsch     break;
81d71ae5a4SJacob Faibussowitsch   case 3:
82d71ae5a4SJacob Faibussowitsch     *rank_re = pi + pj * Mp + pk * (Mp * Np);
83d71ae5a4SJacob Faibussowitsch     break;
841e07b27eSBarry Smith   }
853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
861e07b27eSBarry Smith }
871e07b27eSBarry Smith 
88d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineGlobalS0(PetscInt dim, PetscMPIInt rank_re, PetscInt Mp_re, PetscInt Np_re, PetscInt Pp_re, PetscInt range_i_re[], PetscInt range_j_re[], PetscInt range_k_re[], PetscInt *s0)
89d71ae5a4SJacob Faibussowitsch {
90c6a0d831SBarry Smith   PetscInt i, j, k, start_IJK = 0;
911e07b27eSBarry Smith   PetscInt rank_ijk;
921e07b27eSBarry Smith 
931e07b27eSBarry Smith   PetscFunctionBegin;
941e07b27eSBarry Smith   switch (dim) {
951e07b27eSBarry Smith   case 1:
961e07b27eSBarry Smith     for (i = 0; i < Mp_re; i++) {
971e07b27eSBarry Smith       rank_ijk = i;
98ad540459SPierre Jolivet       if (rank_ijk < rank_re) start_IJK += range_i_re[i];
991e07b27eSBarry Smith     }
1001e07b27eSBarry Smith     break;
1011e07b27eSBarry Smith   case 2:
1021e07b27eSBarry Smith     for (j = 0; j < Np_re; j++) {
1031e07b27eSBarry Smith       for (i = 0; i < Mp_re; i++) {
1041e07b27eSBarry Smith         rank_ijk = i + j * Mp_re;
105ad540459SPierre Jolivet         if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j];
1061e07b27eSBarry Smith       }
1071e07b27eSBarry Smith     }
1081e07b27eSBarry Smith     break;
1091e07b27eSBarry Smith   case 3:
1101e07b27eSBarry Smith     for (k = 0; k < Pp_re; k++) {
1111e07b27eSBarry Smith       for (j = 0; j < Np_re; j++) {
1121e07b27eSBarry Smith         for (i = 0; i < Mp_re; i++) {
1131e07b27eSBarry Smith           rank_ijk = i + j * Mp_re + k * Mp_re * Np_re;
114ad540459SPierre Jolivet           if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j] * range_k_re[k];
1151e07b27eSBarry Smith         }
1161e07b27eSBarry Smith       }
1171e07b27eSBarry Smith     }
1181e07b27eSBarry Smith     break;
1191e07b27eSBarry Smith   }
1201e07b27eSBarry Smith   *s0 = start_IJK;
1213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1221e07b27eSBarry Smith }
1231e07b27eSBarry Smith 
124d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors2d(PC_Telescope sred, DM dm, DM subdm)
125d71ae5a4SJacob Faibussowitsch {
1261e07b27eSBarry Smith   DM         cdm;
1271e07b27eSBarry Smith   Vec        coor, coor_natural, perm_coors;
1281e07b27eSBarry Smith   PetscInt   i, j, si, sj, ni, nj, M, N, Ml, Nl, c, nidx;
1291e07b27eSBarry Smith   PetscInt  *fine_indices;
1301e07b27eSBarry Smith   IS         is_fine, is_local;
1311e07b27eSBarry Smith   VecScatter sctx;
1321e07b27eSBarry Smith 
1331e07b27eSBarry Smith   PetscFunctionBegin;
1349566063dSJacob Faibussowitsch   PetscCall(DMGetCoordinates(dm, &coor));
1353ba16761SJacob Faibussowitsch   if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
13648a46eb9SPierre Jolivet   if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0));
1371e07b27eSBarry Smith   /* Get the coordinate vector from the distributed array */
1389566063dSJacob Faibussowitsch   PetscCall(DMGetCoordinateDM(dm, &cdm));
1399566063dSJacob Faibussowitsch   PetscCall(DMDACreateNaturalVector(cdm, &coor_natural));
1401e07b27eSBarry Smith 
1419566063dSJacob Faibussowitsch   PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural));
1429566063dSJacob Faibussowitsch   PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural));
1431e07b27eSBarry Smith 
1441e07b27eSBarry Smith   /* get indices of the guys I want to grab */
1459566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
14657f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
1479566063dSJacob Faibussowitsch     PetscCall(DMDAGetCorners(subdm, &si, &sj, NULL, &ni, &nj, NULL));
14815dd08bcSBarry Smith     Ml = ni;
14915dd08bcSBarry Smith     Nl = nj;
1501e07b27eSBarry Smith   } else {
151c41e779fSDave May     si = sj = 0;
152c41e779fSDave May     ni = nj = 0;
1533ac26c5eSBarry Smith     Ml = Nl = 0;
1541e07b27eSBarry Smith   }
1551e07b27eSBarry Smith 
1569566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(Ml * Nl * 2, &fine_indices));
1571e07b27eSBarry Smith   c = 0;
15857f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
1591e07b27eSBarry Smith     for (j = sj; j < sj + nj; j++) {
1601e07b27eSBarry Smith       for (i = si; i < si + ni; i++) {
1611e07b27eSBarry Smith         nidx                = (i) + (j)*M;
1621e07b27eSBarry Smith         fine_indices[c]     = 2 * nidx;
1631e07b27eSBarry Smith         fine_indices[c + 1] = 2 * nidx + 1;
1641e07b27eSBarry Smith         c                   = c + 2;
1651e07b27eSBarry Smith       }
1661e07b27eSBarry Smith     }
16763a3b9bcSJacob Faibussowitsch     PetscCheck(c == Ml * Nl * 2, PETSC_COMM_SELF, PETSC_ERR_PLIB, "c %" PetscInt_FMT " should equal 2 * Ml %" PetscInt_FMT " * Nl %" PetscInt_FMT, c, Ml, Nl);
1681e07b27eSBarry Smith   }
1691e07b27eSBarry Smith 
1701e07b27eSBarry Smith   /* generate scatter */
1719566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * 2, fine_indices, PETSC_USE_POINTER, &is_fine));
1729566063dSJacob Faibussowitsch   PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * 2, 0, 1, &is_local));
1731e07b27eSBarry Smith 
1741e07b27eSBarry Smith   /* scatter */
1759566063dSJacob Faibussowitsch   PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors));
1769566063dSJacob Faibussowitsch   PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * 2));
1779566063dSJacob Faibussowitsch   PetscCall(VecSetType(perm_coors, VECSEQ));
1781e07b27eSBarry Smith 
1799566063dSJacob Faibussowitsch   PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx));
1809566063dSJacob Faibussowitsch   PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
1819566063dSJacob Faibussowitsch   PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
1821e07b27eSBarry Smith   /* access */
18357f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
1841e07b27eSBarry Smith     Vec                _coors;
1851e07b27eSBarry Smith     const PetscScalar *LA_perm;
1861e07b27eSBarry Smith     PetscScalar       *LA_coors;
1871e07b27eSBarry Smith 
1889566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinates(subdm, &_coors));
1899566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(perm_coors, &LA_perm));
1909566063dSJacob Faibussowitsch     PetscCall(VecGetArray(_coors, &LA_coors));
191ad540459SPierre Jolivet     for (i = 0; i < Ml * Nl * 2; i++) LA_coors[i] = LA_perm[i];
1929566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(_coors, &LA_coors));
1939566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm));
1941e07b27eSBarry Smith   }
1951e07b27eSBarry Smith 
1961e07b27eSBarry Smith   /* update local coords */
19757f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
1981e07b27eSBarry Smith     DM  _dmc;
1991e07b27eSBarry Smith     Vec _coors, _coors_local;
2009566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinateDM(subdm, &_dmc));
2019566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinates(subdm, &_coors));
2029566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local));
2039566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local));
2049566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local));
2051e07b27eSBarry Smith   }
2069566063dSJacob Faibussowitsch   PetscCall(VecScatterDestroy(&sctx));
2079566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&is_fine));
2089566063dSJacob Faibussowitsch   PetscCall(PetscFree(fine_indices));
2099566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&is_local));
2109566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&perm_coors));
2119566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&coor_natural));
2123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2131e07b27eSBarry Smith }
2141e07b27eSBarry Smith 
215d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors3d(PC_Telescope sred, DM dm, DM subdm)
216d71ae5a4SJacob Faibussowitsch {
2171e07b27eSBarry Smith   DM         cdm;
2181e07b27eSBarry Smith   Vec        coor, coor_natural, perm_coors;
2191e07b27eSBarry Smith   PetscInt   i, j, k, si, sj, sk, ni, nj, nk, M, N, P, Ml, Nl, Pl, c, nidx;
2201e07b27eSBarry Smith   PetscInt  *fine_indices;
2211e07b27eSBarry Smith   IS         is_fine, is_local;
2221e07b27eSBarry Smith   VecScatter sctx;
2231e07b27eSBarry Smith 
2241e07b27eSBarry Smith   PetscFunctionBegin;
2259566063dSJacob Faibussowitsch   PetscCall(DMGetCoordinates(dm, &coor));
2263ba16761SJacob Faibussowitsch   if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
2271e07b27eSBarry Smith 
22848a46eb9SPierre Jolivet   if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0));
2291e07b27eSBarry Smith 
2301e07b27eSBarry Smith   /* Get the coordinate vector from the distributed array */
2319566063dSJacob Faibussowitsch   PetscCall(DMGetCoordinateDM(dm, &cdm));
2329566063dSJacob Faibussowitsch   PetscCall(DMDACreateNaturalVector(cdm, &coor_natural));
2339566063dSJacob Faibussowitsch   PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural));
2349566063dSJacob Faibussowitsch   PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural));
2351e07b27eSBarry Smith 
2361e07b27eSBarry Smith   /* get indices of the guys I want to grab */
2379566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
2381e07b27eSBarry Smith 
23957f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
2409566063dSJacob Faibussowitsch     PetscCall(DMDAGetCorners(subdm, &si, &sj, &sk, &ni, &nj, &nk));
241553d0ae9SBarry Smith     Ml = ni;
242553d0ae9SBarry Smith     Nl = nj;
243553d0ae9SBarry Smith     Pl = nk;
2441e07b27eSBarry Smith   } else {
245c41e779fSDave May     si = sj = sk = 0;
246c41e779fSDave May     ni = nj = nk = 0;
2473ac26c5eSBarry Smith     Ml = Nl = Pl = 0;
2481e07b27eSBarry Smith   }
2491e07b27eSBarry Smith 
2509566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(Ml * Nl * Pl * 3, &fine_indices));
2511e07b27eSBarry Smith 
2521e07b27eSBarry Smith   c = 0;
25357f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
2541e07b27eSBarry Smith     for (k = sk; k < sk + nk; k++) {
2551e07b27eSBarry Smith       for (j = sj; j < sj + nj; j++) {
2561e07b27eSBarry Smith         for (i = si; i < si + ni; i++) {
2571e07b27eSBarry Smith           nidx                = (i) + (j)*M + (k)*M * N;
2581e07b27eSBarry Smith           fine_indices[c]     = 3 * nidx;
2591e07b27eSBarry Smith           fine_indices[c + 1] = 3 * nidx + 1;
2601e07b27eSBarry Smith           fine_indices[c + 2] = 3 * nidx + 2;
2611e07b27eSBarry Smith           c                   = c + 3;
2621e07b27eSBarry Smith         }
2631e07b27eSBarry Smith       }
2641e07b27eSBarry Smith     }
2651e07b27eSBarry Smith   }
2661e07b27eSBarry Smith 
2671e07b27eSBarry Smith   /* generate scatter */
2689566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * Pl * 3, fine_indices, PETSC_USE_POINTER, &is_fine));
2699566063dSJacob Faibussowitsch   PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * Pl * 3, 0, 1, &is_local));
2701e07b27eSBarry Smith 
2711e07b27eSBarry Smith   /* scatter */
2729566063dSJacob Faibussowitsch   PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors));
2739566063dSJacob Faibussowitsch   PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * Pl * 3));
2749566063dSJacob Faibussowitsch   PetscCall(VecSetType(perm_coors, VECSEQ));
2759566063dSJacob Faibussowitsch   PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx));
2769566063dSJacob Faibussowitsch   PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
2779566063dSJacob Faibussowitsch   PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD));
2781e07b27eSBarry Smith 
2791e07b27eSBarry Smith   /* access */
28057f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
2811e07b27eSBarry Smith     Vec                _coors;
2821e07b27eSBarry Smith     const PetscScalar *LA_perm;
2831e07b27eSBarry Smith     PetscScalar       *LA_coors;
2841e07b27eSBarry Smith 
2859566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinates(subdm, &_coors));
2869566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(perm_coors, &LA_perm));
2879566063dSJacob Faibussowitsch     PetscCall(VecGetArray(_coors, &LA_coors));
288ad540459SPierre Jolivet     for (i = 0; i < Ml * Nl * Pl * 3; i++) LA_coors[i] = LA_perm[i];
2899566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(_coors, &LA_coors));
2909566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm));
2911e07b27eSBarry Smith   }
2921e07b27eSBarry Smith 
2931e07b27eSBarry Smith   /* update local coords */
29457f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
2951e07b27eSBarry Smith     DM  _dmc;
2961e07b27eSBarry Smith     Vec _coors, _coors_local;
2971e07b27eSBarry Smith 
2989566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinateDM(subdm, &_dmc));
2999566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinates(subdm, &_coors));
3009566063dSJacob Faibussowitsch     PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local));
3019566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local));
3029566063dSJacob Faibussowitsch     PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local));
3031e07b27eSBarry Smith   }
3041e07b27eSBarry Smith 
3059566063dSJacob Faibussowitsch   PetscCall(VecScatterDestroy(&sctx));
3069566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&is_fine));
3079566063dSJacob Faibussowitsch   PetscCall(PetscFree(fine_indices));
3089566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&is_local));
3099566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&perm_coors));
3109566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&coor_natural));
3113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3121e07b27eSBarry Smith }
3131e07b27eSBarry Smith 
314d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
315d71ae5a4SJacob Faibussowitsch {
3161e07b27eSBarry Smith   PetscInt     dim;
3171e07b27eSBarry Smith   DM           dm, subdm;
3181e07b27eSBarry Smith   PetscSubcomm psubcomm;
3191e07b27eSBarry Smith   MPI_Comm     comm;
3201e07b27eSBarry Smith   Vec          coor;
3211e07b27eSBarry Smith 
3221e07b27eSBarry Smith   PetscFunctionBegin;
3239566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
3249566063dSJacob Faibussowitsch   PetscCall(DMGetCoordinates(dm, &coor));
3253ba16761SJacob Faibussowitsch   if (!coor) PetscFunctionReturn(PETSC_SUCCESS);
3261e07b27eSBarry Smith   psubcomm = sred->psubcomm;
3271e07b27eSBarry Smith   comm     = PetscSubcommParent(psubcomm);
3281e07b27eSBarry Smith   subdm    = ctx->dmrepart;
3291e07b27eSBarry Smith 
3309566063dSJacob Faibussowitsch   PetscCall(PetscInfo(pc, "PCTelescope: setting up the coordinates (DMDA)\n"));
3319566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
3321e07b27eSBarry Smith   switch (dim) {
333d71ae5a4SJacob Faibussowitsch   case 1:
334d71ae5a4SJacob Faibussowitsch     SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided");
335d71ae5a4SJacob Faibussowitsch   case 2:
336d71ae5a4SJacob Faibussowitsch     PetscCall(PCTelescopeSetUp_dmda_repart_coors2d(sred, dm, subdm));
337d71ae5a4SJacob Faibussowitsch     break;
338d71ae5a4SJacob Faibussowitsch   case 3:
339d71ae5a4SJacob Faibussowitsch     PetscCall(PCTelescopeSetUp_dmda_repart_coors3d(sred, dm, subdm));
340d71ae5a4SJacob Faibussowitsch     break;
3411e07b27eSBarry Smith   }
3423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3431e07b27eSBarry Smith }
3441e07b27eSBarry Smith 
3451e07b27eSBarry Smith /* setup repartitioned dm */
346*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
347d71ae5a4SJacob Faibussowitsch {
3481e07b27eSBarry Smith   DM                    dm;
3491e07b27eSBarry Smith   PetscInt              dim, nx, ny, nz, ndof, nsw, sum, k;
3501e07b27eSBarry Smith   DMBoundaryType        bx, by, bz;
3511e07b27eSBarry Smith   DMDAStencilType       stencil;
3521e07b27eSBarry Smith   const PetscInt       *_range_i_re;
3531e07b27eSBarry Smith   const PetscInt       *_range_j_re;
3541e07b27eSBarry Smith   const PetscInt       *_range_k_re;
3551e07b27eSBarry Smith   DMDAInterpolationType itype;
3561e07b27eSBarry Smith   PetscInt              refine_x, refine_y, refine_z;
3571e07b27eSBarry Smith   MPI_Comm              comm, subcomm;
3581e07b27eSBarry Smith   const char           *prefix;
3591e07b27eSBarry Smith 
3601e07b27eSBarry Smith   PetscFunctionBegin;
3611e07b27eSBarry Smith   comm    = PetscSubcommParent(sred->psubcomm);
3621e07b27eSBarry Smith   subcomm = PetscSubcommChild(sred->psubcomm);
3639566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
3641e07b27eSBarry Smith 
3659566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, &dim, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, &nsw, &bx, &by, &bz, &stencil));
3669566063dSJacob Faibussowitsch   PetscCall(DMDAGetInterpolationType(dm, &itype));
3679566063dSJacob Faibussowitsch   PetscCall(DMDAGetRefinementFactor(dm, &refine_x, &refine_y, &refine_z));
3681e07b27eSBarry Smith 
3691e07b27eSBarry Smith   ctx->dmrepart = NULL;
3701e07b27eSBarry Smith   _range_i_re = _range_j_re = _range_k_re = NULL;
3711e07b27eSBarry Smith   /* Create DMDA on the child communicator */
37257f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
3731e07b27eSBarry Smith     switch (dim) {
3741e07b27eSBarry Smith     case 1:
3759566063dSJacob Faibussowitsch       PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (1D)\n"));
3769566063dSJacob Faibussowitsch       /* PetscCall(DMDACreate1d(subcomm,bx,nx,ndof,nsw,NULL,&ctx->dmrepart)); */
3771e07b27eSBarry Smith       ny = nz = 1;
3781e07b27eSBarry Smith       by = bz = DM_BOUNDARY_NONE;
3791e07b27eSBarry Smith       break;
3801e07b27eSBarry Smith     case 2:
3819566063dSJacob Faibussowitsch       PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (2D)\n"));
3829566063dSJacob Faibussowitsch       /* PetscCall(DMDACreate2d(subcomm,bx,by,stencil,nx,ny, PETSC_DECIDE,PETSC_DECIDE,
3839566063dSJacob Faibussowitsch          ndof,nsw, NULL,NULL,&ctx->dmrepart)); */
3841e07b27eSBarry Smith       nz = 1;
3851e07b27eSBarry Smith       bz = DM_BOUNDARY_NONE;
3861e07b27eSBarry Smith       break;
3871e07b27eSBarry Smith     case 3:
3889566063dSJacob Faibussowitsch       PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (3D)\n"));
3899566063dSJacob Faibussowitsch       /* PetscCall(DMDACreate3d(subcomm,bx,by,bz,stencil,nx,ny,nz,
3909566063dSJacob Faibussowitsch          PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,NULL,&ctx->dmrepart)); */
3911e07b27eSBarry Smith       break;
3921e07b27eSBarry Smith     }
3931e07b27eSBarry Smith     /*
3941e07b27eSBarry Smith      The API DMDACreate1d(), DMDACreate2d(), DMDACreate3d() does not allow us to set/append
3951e07b27eSBarry Smith      a unique option prefix for the DM, thus I prefer to expose the contents of these API's here.
3961e07b27eSBarry Smith      This allows users to control the partitioning of the subDM.
3971e07b27eSBarry Smith     */
3989566063dSJacob Faibussowitsch     PetscCall(DMDACreate(subcomm, &ctx->dmrepart));
3991e07b27eSBarry Smith     /* Set unique option prefix name */
4009566063dSJacob Faibussowitsch     PetscCall(KSPGetOptionsPrefix(sred->ksp, &prefix));
4019566063dSJacob Faibussowitsch     PetscCall(DMSetOptionsPrefix(ctx->dmrepart, prefix));
4029566063dSJacob Faibussowitsch     PetscCall(DMAppendOptionsPrefix(ctx->dmrepart, "repart_"));
4031e07b27eSBarry Smith     /* standard setup from DMDACreate{1,2,3}d() */
4049566063dSJacob Faibussowitsch     PetscCall(DMSetDimension(ctx->dmrepart, dim));
4059566063dSJacob Faibussowitsch     PetscCall(DMDASetSizes(ctx->dmrepart, nx, ny, nz));
4069566063dSJacob Faibussowitsch     PetscCall(DMDASetNumProcs(ctx->dmrepart, PETSC_DECIDE, PETSC_DECIDE, PETSC_DECIDE));
4079566063dSJacob Faibussowitsch     PetscCall(DMDASetBoundaryType(ctx->dmrepart, bx, by, bz));
4089566063dSJacob Faibussowitsch     PetscCall(DMDASetDof(ctx->dmrepart, ndof));
4099566063dSJacob Faibussowitsch     PetscCall(DMDASetStencilType(ctx->dmrepart, stencil));
4109566063dSJacob Faibussowitsch     PetscCall(DMDASetStencilWidth(ctx->dmrepart, nsw));
4119566063dSJacob Faibussowitsch     PetscCall(DMDASetOwnershipRanges(ctx->dmrepart, NULL, NULL, NULL));
4129566063dSJacob Faibussowitsch     PetscCall(DMSetFromOptions(ctx->dmrepart));
4139566063dSJacob Faibussowitsch     PetscCall(DMSetUp(ctx->dmrepart));
4141e07b27eSBarry Smith     /* Set refinement factors and interpolation type from the partent */
4159566063dSJacob Faibussowitsch     PetscCall(DMDASetRefinementFactor(ctx->dmrepart, refine_x, refine_y, refine_z));
4169566063dSJacob Faibussowitsch     PetscCall(DMDASetInterpolationType(ctx->dmrepart, itype));
4171e07b27eSBarry Smith 
4189566063dSJacob Faibussowitsch     PetscCall(DMDAGetInfo(ctx->dmrepart, NULL, NULL, NULL, NULL, &ctx->Mp_re, &ctx->Np_re, &ctx->Pp_re, NULL, NULL, NULL, NULL, NULL, NULL));
4199566063dSJacob Faibussowitsch     PetscCall(DMDAGetOwnershipRanges(ctx->dmrepart, &_range_i_re, &_range_j_re, &_range_k_re));
4205e897e82SDave May 
4215e897e82SDave May     ctx->dmrepart->ops->creatematrix              = dm->ops->creatematrix;
4225e897e82SDave May     ctx->dmrepart->ops->createdomaindecomposition = dm->ops->createdomaindecomposition;
4231e07b27eSBarry Smith   }
4241e07b27eSBarry Smith 
4251e07b27eSBarry Smith   /* generate ranges for repartitioned dm */
4261e07b27eSBarry Smith   /* note - assume rank 0 always participates */
427071fcb05SBarry Smith   /* TODO: use a single MPI call */
4289566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(&ctx->Mp_re, 1, MPIU_INT, 0, comm));
4299566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(&ctx->Np_re, 1, MPIU_INT, 0, comm));
4309566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(&ctx->Pp_re, 1, MPIU_INT, 0, comm));
4311e07b27eSBarry Smith 
4329566063dSJacob Faibussowitsch   PetscCall(PetscCalloc3(ctx->Mp_re, &ctx->range_i_re, ctx->Np_re, &ctx->range_j_re, ctx->Pp_re, &ctx->range_k_re));
4331e07b27eSBarry Smith 
4349566063dSJacob Faibussowitsch   if (_range_i_re) PetscCall(PetscArraycpy(ctx->range_i_re, _range_i_re, ctx->Mp_re));
4359566063dSJacob Faibussowitsch   if (_range_j_re) PetscCall(PetscArraycpy(ctx->range_j_re, _range_j_re, ctx->Np_re));
4369566063dSJacob Faibussowitsch   if (_range_k_re) PetscCall(PetscArraycpy(ctx->range_k_re, _range_k_re, ctx->Pp_re));
4371e07b27eSBarry Smith 
438071fcb05SBarry Smith   /* TODO: use a single MPI call */
4399566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(ctx->range_i_re, ctx->Mp_re, MPIU_INT, 0, comm));
4409566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(ctx->range_j_re, ctx->Np_re, MPIU_INT, 0, comm));
4419566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Bcast(ctx->range_k_re, ctx->Pp_re, MPIU_INT, 0, comm));
4421e07b27eSBarry Smith 
4439566063dSJacob Faibussowitsch   PetscCall(PetscMalloc3(ctx->Mp_re, &ctx->start_i_re, ctx->Np_re, &ctx->start_j_re, ctx->Pp_re, &ctx->start_k_re));
4441e07b27eSBarry Smith 
4451e07b27eSBarry Smith   sum = 0;
4461e07b27eSBarry Smith   for (k = 0; k < ctx->Mp_re; k++) {
4471e07b27eSBarry Smith     ctx->start_i_re[k] = sum;
4481e07b27eSBarry Smith     sum += ctx->range_i_re[k];
4491e07b27eSBarry Smith   }
4501e07b27eSBarry Smith 
4511e07b27eSBarry Smith   sum = 0;
4521e07b27eSBarry Smith   for (k = 0; k < ctx->Np_re; k++) {
4531e07b27eSBarry Smith     ctx->start_j_re[k] = sum;
4541e07b27eSBarry Smith     sum += ctx->range_j_re[k];
4551e07b27eSBarry Smith   }
4561e07b27eSBarry Smith 
4571e07b27eSBarry Smith   sum = 0;
4581e07b27eSBarry Smith   for (k = 0; k < ctx->Pp_re; k++) {
4591e07b27eSBarry Smith     ctx->start_k_re[k] = sum;
4601e07b27eSBarry Smith     sum += ctx->range_k_re[k];
4611e07b27eSBarry Smith   }
4621e07b27eSBarry Smith 
463ba1c3560SDave May   /* attach repartitioned dm to child ksp */
464ba1c3560SDave May   {
465ba1c3560SDave May     PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *);
466ba1c3560SDave May     void *dmksp_ctx;
467ba1c3560SDave May 
4689566063dSJacob Faibussowitsch     PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx));
469ba1c3560SDave May 
4701e07b27eSBarry Smith     /* attach dm to ksp on sub communicator */
47157f12427SDave May     if (PCTelescope_isActiveRank(sred)) {
4729566063dSJacob Faibussowitsch       PetscCall(KSPSetDM(sred->ksp, ctx->dmrepart));
473ba1c3560SDave May 
474c5db1f53SDave May       if (!dmksp_func || sred->ignore_kspcomputeoperators) {
4759566063dSJacob Faibussowitsch         PetscCall(KSPSetDMActive(sred->ksp, PETSC_FALSE));
476ba1c3560SDave May       } else {
477ba1c3560SDave May         /* sub ksp inherits dmksp_func and context provided by user */
4789566063dSJacob Faibussowitsch         PetscCall(KSPSetComputeOperators(sred->ksp, dmksp_func, dmksp_ctx));
4799566063dSJacob Faibussowitsch         PetscCall(KSPSetDMActive(sred->ksp, PETSC_TRUE));
480ba1c3560SDave May       }
481ba1c3560SDave May     }
4821e07b27eSBarry Smith   }
4833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4841e07b27eSBarry Smith }
4851e07b27eSBarry Smith 
486*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_3d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
487d71ae5a4SJacob Faibussowitsch {
4881e07b27eSBarry Smith   DM       dm;
4891e07b27eSBarry Smith   MPI_Comm comm;
4901e07b27eSBarry Smith   Mat      Pscalar, P;
4911e07b27eSBarry Smith   PetscInt ndof;
4921e07b27eSBarry Smith   PetscInt i, j, k, location, startI[3], endI[3], lenI[3], nx, ny, nz;
4931e07b27eSBarry Smith   PetscInt sr, er, Mr;
4941e07b27eSBarry Smith   Vec      V;
4951e07b27eSBarry Smith 
4961e07b27eSBarry Smith   PetscFunctionBegin;
4979566063dSJacob Faibussowitsch   PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-3D)\n"));
4989566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
4991e07b27eSBarry Smith 
5009566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
5019566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL));
5021e07b27eSBarry Smith 
5039566063dSJacob Faibussowitsch   PetscCall(DMGetGlobalVector(dm, &V));
5049566063dSJacob Faibussowitsch   PetscCall(VecGetSize(V, &Mr));
5059566063dSJacob Faibussowitsch   PetscCall(VecGetOwnershipRange(V, &sr, &er));
5069566063dSJacob Faibussowitsch   PetscCall(DMRestoreGlobalVector(dm, &V));
5071e07b27eSBarry Smith   sr = sr / ndof;
5081e07b27eSBarry Smith   er = er / ndof;
5091e07b27eSBarry Smith   Mr = Mr / ndof;
5101e07b27eSBarry Smith 
5119566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, &Pscalar));
5129566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(Pscalar, (er - sr), (er - sr), Mr, Mr));
5139566063dSJacob Faibussowitsch   PetscCall(MatSetType(Pscalar, MATAIJ));
5149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL));
5159566063dSJacob Faibussowitsch   PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL));
5161e07b27eSBarry Smith 
5179566063dSJacob Faibussowitsch   PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], &lenI[2]));
5189566063dSJacob Faibussowitsch   PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], &startI[2], &endI[0], &endI[1], &endI[2]));
5191e07b27eSBarry Smith   endI[0] += startI[0];
5201e07b27eSBarry Smith   endI[1] += startI[1];
5211e07b27eSBarry Smith   endI[2] += startI[2];
5221e07b27eSBarry Smith 
5231e07b27eSBarry Smith   for (k = startI[2]; k < endI[2]; k++) {
5241e07b27eSBarry Smith     for (j = startI[1]; j < endI[1]; j++) {
5251e07b27eSBarry Smith       for (i = startI[0]; i < endI[0]; i++) {
5261e07b27eSBarry Smith         PetscMPIInt rank_ijk_re, rank_reI[3];
5271e07b27eSBarry Smith         PetscInt    s0_re;
528c6a0d831SBarry Smith         PetscInt    ii, jj, kk, local_ijk_re, mapped_ijk;
5291e07b27eSBarry Smith         PetscInt    lenI_re[3];
5301e07b27eSBarry Smith 
5311e07b27eSBarry Smith         location = (i - startI[0]) + (j - startI[1]) * lenI[0] + (k - startI[2]) * lenI[0] * lenI[1];
5329371c9d4SSatish Balay         PetscCall(_DMDADetermineRankFromGlobalIJK(3, i, j, k, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], &rank_reI[2], &rank_ijk_re));
5339566063dSJacob Faibussowitsch         PetscCall(_DMDADetermineGlobalS0(3, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re));
5341e07b27eSBarry Smith         ii = i - ctx->start_i_re[rank_reI[0]];
53508401ef6SPierre Jolivet         PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error ii");
5361e07b27eSBarry Smith         jj = j - ctx->start_j_re[rank_reI[1]];
53708401ef6SPierre Jolivet         PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error jj");
5381e07b27eSBarry Smith         kk = k - ctx->start_k_re[rank_reI[2]];
53908401ef6SPierre Jolivet         PetscCheck(kk >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error kk");
5401e07b27eSBarry Smith         lenI_re[0]   = ctx->range_i_re[rank_reI[0]];
5411e07b27eSBarry Smith         lenI_re[1]   = ctx->range_j_re[rank_reI[1]];
5421e07b27eSBarry Smith         lenI_re[2]   = ctx->range_k_re[rank_reI[2]];
5431e07b27eSBarry Smith         local_ijk_re = ii + jj * lenI_re[0] + kk * lenI_re[0] * lenI_re[1];
5441e07b27eSBarry Smith         mapped_ijk   = s0_re + local_ijk_re;
5459566063dSJacob Faibussowitsch         PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES));
5461e07b27eSBarry Smith       }
5471e07b27eSBarry Smith     }
5481e07b27eSBarry Smith   }
5499566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY));
5509566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY));
5519566063dSJacob Faibussowitsch   PetscCall(MatCreateMAIJ(Pscalar, ndof, &P));
5529566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&Pscalar));
5531e07b27eSBarry Smith   ctx->permutation = P;
5543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5551e07b27eSBarry Smith }
5561e07b27eSBarry Smith 
557*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_2d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
558d71ae5a4SJacob Faibussowitsch {
5591e07b27eSBarry Smith   DM       dm;
5601e07b27eSBarry Smith   MPI_Comm comm;
5611e07b27eSBarry Smith   Mat      Pscalar, P;
5621e07b27eSBarry Smith   PetscInt ndof;
5631e07b27eSBarry Smith   PetscInt i, j, location, startI[2], endI[2], lenI[2], nx, ny, nz;
5641e07b27eSBarry Smith   PetscInt sr, er, Mr;
5651e07b27eSBarry Smith   Vec      V;
5661e07b27eSBarry Smith 
5671e07b27eSBarry Smith   PetscFunctionBegin;
5689566063dSJacob Faibussowitsch   PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-2D)\n"));
5699566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
5709566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
5719566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL));
5729566063dSJacob Faibussowitsch   PetscCall(DMGetGlobalVector(dm, &V));
5739566063dSJacob Faibussowitsch   PetscCall(VecGetSize(V, &Mr));
5749566063dSJacob Faibussowitsch   PetscCall(VecGetOwnershipRange(V, &sr, &er));
5759566063dSJacob Faibussowitsch   PetscCall(DMRestoreGlobalVector(dm, &V));
5761e07b27eSBarry Smith   sr = sr / ndof;
5771e07b27eSBarry Smith   er = er / ndof;
5781e07b27eSBarry Smith   Mr = Mr / ndof;
5791e07b27eSBarry Smith 
5809566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, &Pscalar));
5819566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(Pscalar, (er - sr), (er - sr), Mr, Mr));
5829566063dSJacob Faibussowitsch   PetscCall(MatSetType(Pscalar, MATAIJ));
5839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL));
5849566063dSJacob Faibussowitsch   PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL));
5851e07b27eSBarry Smith 
5869566063dSJacob Faibussowitsch   PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], NULL));
5879566063dSJacob Faibussowitsch   PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], NULL, &endI[0], &endI[1], NULL));
5881e07b27eSBarry Smith   endI[0] += startI[0];
5891e07b27eSBarry Smith   endI[1] += startI[1];
5901e07b27eSBarry Smith 
5911e07b27eSBarry Smith   for (j = startI[1]; j < endI[1]; j++) {
5921e07b27eSBarry Smith     for (i = startI[0]; i < endI[0]; i++) {
5931e07b27eSBarry Smith       PetscMPIInt rank_ijk_re, rank_reI[3];
5941e07b27eSBarry Smith       PetscInt    s0_re;
595c6a0d831SBarry Smith       PetscInt    ii, jj, local_ijk_re, mapped_ijk;
5961e07b27eSBarry Smith       PetscInt    lenI_re[3];
5971e07b27eSBarry Smith 
5981e07b27eSBarry Smith       location = (i - startI[0]) + (j - startI[1]) * lenI[0];
5999371c9d4SSatish Balay       PetscCall(_DMDADetermineRankFromGlobalIJK(2, i, j, 0, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], NULL, &rank_ijk_re));
6001e07b27eSBarry Smith 
6019566063dSJacob Faibussowitsch       PetscCall(_DMDADetermineGlobalS0(2, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re));
6021e07b27eSBarry Smith 
6031e07b27eSBarry Smith       ii = i - ctx->start_i_re[rank_reI[0]];
60408401ef6SPierre Jolivet       PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error ii");
6051e07b27eSBarry Smith       jj = j - ctx->start_j_re[rank_reI[1]];
60608401ef6SPierre Jolivet       PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error jj");
6071e07b27eSBarry Smith 
6081e07b27eSBarry Smith       lenI_re[0]   = ctx->range_i_re[rank_reI[0]];
6091e07b27eSBarry Smith       lenI_re[1]   = ctx->range_j_re[rank_reI[1]];
6101e07b27eSBarry Smith       local_ijk_re = ii + jj * lenI_re[0];
6111e07b27eSBarry Smith       mapped_ijk   = s0_re + local_ijk_re;
6129566063dSJacob Faibussowitsch       PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES));
6131e07b27eSBarry Smith     }
6141e07b27eSBarry Smith   }
6159566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY));
6169566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY));
6179566063dSJacob Faibussowitsch   PetscCall(MatCreateMAIJ(Pscalar, ndof, &P));
6189566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&Pscalar));
6191e07b27eSBarry Smith   ctx->permutation = P;
6203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6211e07b27eSBarry Smith }
6221e07b27eSBarry Smith 
623*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_scatters(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx)
624d71ae5a4SJacob Faibussowitsch {
6251e07b27eSBarry Smith   Vec        xred, yred, xtmp, x, xp;
6261e07b27eSBarry Smith   VecScatter scatter;
6271e07b27eSBarry Smith   IS         isin;
6281e07b27eSBarry Smith   Mat        B;
6291e07b27eSBarry Smith   PetscInt   m, bs, st, ed;
6301e07b27eSBarry Smith   MPI_Comm   comm;
6311e07b27eSBarry Smith 
6321e07b27eSBarry Smith   PetscFunctionBegin;
6339566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
6349566063dSJacob Faibussowitsch   PetscCall(PCGetOperators(pc, NULL, &B));
6359566063dSJacob Faibussowitsch   PetscCall(MatCreateVecs(B, &x, NULL));
6369566063dSJacob Faibussowitsch   PetscCall(MatGetBlockSize(B, &bs));
6379566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(x, &xp));
6383ac26c5eSBarry Smith   m    = 0;
6391e07b27eSBarry Smith   xred = NULL;
6401e07b27eSBarry Smith   yred = NULL;
64157f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
6429566063dSJacob Faibussowitsch     PetscCall(DMCreateGlobalVector(ctx->dmrepart, &xred));
6439566063dSJacob Faibussowitsch     PetscCall(VecDuplicate(xred, &yred));
6449566063dSJacob Faibussowitsch     PetscCall(VecGetOwnershipRange(xred, &st, &ed));
6459566063dSJacob Faibussowitsch     PetscCall(ISCreateStride(comm, ed - st, st, 1, &isin));
6469566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(xred, &m));
6471e07b27eSBarry Smith   } else {
6489566063dSJacob Faibussowitsch     PetscCall(VecGetOwnershipRange(x, &st, &ed));
6499566063dSJacob Faibussowitsch     PetscCall(ISCreateStride(comm, 0, st, 1, &isin));
6501e07b27eSBarry Smith   }
6519566063dSJacob Faibussowitsch   PetscCall(ISSetBlockSize(isin, bs));
6529566063dSJacob Faibussowitsch   PetscCall(VecCreate(comm, &xtmp));
6539566063dSJacob Faibussowitsch   PetscCall(VecSetSizes(xtmp, m, PETSC_DECIDE));
6549566063dSJacob Faibussowitsch   PetscCall(VecSetBlockSize(xtmp, bs));
6559566063dSJacob Faibussowitsch   PetscCall(VecSetType(xtmp, ((PetscObject)x)->type_name));
6569566063dSJacob Faibussowitsch   PetscCall(VecScatterCreate(x, isin, xtmp, NULL, &scatter));
6571e07b27eSBarry Smith   sred->xred    = xred;
6581e07b27eSBarry Smith   sred->yred    = yred;
6591e07b27eSBarry Smith   sred->isin    = isin;
6601e07b27eSBarry Smith   sred->scatter = scatter;
6611e07b27eSBarry Smith   sred->xtmp    = xtmp;
6621e07b27eSBarry Smith 
6631e07b27eSBarry Smith   ctx->xp = xp;
6649566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&x));
6653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6661e07b27eSBarry Smith }
6671e07b27eSBarry Smith 
668d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeSetUp_dmda(PC pc, PC_Telescope sred)
669d71ae5a4SJacob Faibussowitsch {
6701e07b27eSBarry Smith   PC_Telescope_DMDACtx *ctx;
6711e07b27eSBarry Smith   PetscInt              dim;
6721e07b27eSBarry Smith   DM                    dm;
6731e07b27eSBarry Smith   MPI_Comm              comm;
6741e07b27eSBarry Smith 
6751e07b27eSBarry Smith   PetscFunctionBegin;
6769566063dSJacob Faibussowitsch   PetscCall(PetscInfo(pc, "PCTelescope: setup (DMDA)\n"));
6779566063dSJacob Faibussowitsch   PetscCall(PetscNew(&ctx));
6781e07b27eSBarry Smith   sred->dm_ctx = (void *)ctx;
6791e07b27eSBarry Smith 
6809566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
6819566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
6829566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
6831e07b27eSBarry Smith 
6843ba16761SJacob Faibussowitsch   PetscCall(PCTelescopeSetUp_dmda_repart(pc, sred, ctx));
6853ba16761SJacob Faibussowitsch   PetscCall(PCTelescopeSetUp_dmda_repart_coors(pc, sred, ctx));
6861e07b27eSBarry Smith   switch (dim) {
687d71ae5a4SJacob Faibussowitsch   case 1:
688d71ae5a4SJacob Faibussowitsch     SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided");
689d71ae5a4SJacob Faibussowitsch   case 2:
690d71ae5a4SJacob Faibussowitsch     PetscCall(PCTelescopeSetUp_dmda_permutation_2d(pc, sred, ctx));
691d71ae5a4SJacob Faibussowitsch     break;
692d71ae5a4SJacob Faibussowitsch   case 3:
693d71ae5a4SJacob Faibussowitsch     PetscCall(PCTelescopeSetUp_dmda_permutation_3d(pc, sred, ctx));
694d71ae5a4SJacob Faibussowitsch     break;
6951e07b27eSBarry Smith   }
6969566063dSJacob Faibussowitsch   PetscCall(PCTelescopeSetUp_dmda_scatters(pc, sred, ctx));
6973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6981e07b27eSBarry Smith }
6991e07b27eSBarry Smith 
700*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeMatCreate_dmda_dmactivefalse(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A)
701d71ae5a4SJacob Faibussowitsch {
7021e07b27eSBarry Smith   PC_Telescope_DMDACtx *ctx;
7031e07b27eSBarry Smith   MPI_Comm              comm, subcomm;
7041e07b27eSBarry Smith   Mat                   Bperm, Bred, B, P;
7051e07b27eSBarry Smith   PetscInt              nr, nc;
7061e07b27eSBarry Smith   IS                    isrow, iscol;
7071e07b27eSBarry Smith   Mat                   Blocal, *_Blocal;
7081e07b27eSBarry Smith 
7091e07b27eSBarry Smith   PetscFunctionBegin;
7109566063dSJacob Faibussowitsch   PetscCall(PetscInfo(pc, "PCTelescope: updating the redundant preconditioned operator (DMDA)\n"));
7119566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)pc, &comm));
7121e07b27eSBarry Smith   subcomm = PetscSubcommChild(sred->psubcomm);
7131e07b27eSBarry Smith   ctx     = (PC_Telescope_DMDACtx *)sred->dm_ctx;
7141e07b27eSBarry Smith 
7159566063dSJacob Faibussowitsch   PetscCall(PCGetOperators(pc, NULL, &B));
7169566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &nr, &nc));
7171e07b27eSBarry Smith 
7181e07b27eSBarry Smith   P = ctx->permutation;
7199566063dSJacob Faibussowitsch   PetscCall(MatPtAP(B, P, MAT_INITIAL_MATRIX, 1.1, &Bperm));
7201e07b27eSBarry Smith 
7211e07b27eSBarry Smith   /* Get submatrices */
7221e07b27eSBarry Smith   isrow = sred->isin;
7239566063dSJacob Faibussowitsch   PetscCall(ISCreateStride(comm, nc, 0, 1, &iscol));
7241e07b27eSBarry Smith 
7259566063dSJacob Faibussowitsch   PetscCall(MatCreateSubMatrices(Bperm, 1, &isrow, &iscol, MAT_INITIAL_MATRIX, &_Blocal));
7261e07b27eSBarry Smith   Blocal = *_Blocal;
7271e07b27eSBarry Smith   Bred   = NULL;
72857f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
7291e07b27eSBarry Smith     PetscInt mm;
7301e07b27eSBarry Smith 
731ad540459SPierre Jolivet     if (reuse != MAT_INITIAL_MATRIX) Bred = *A;
7329566063dSJacob Faibussowitsch     PetscCall(MatGetSize(Blocal, &mm, NULL));
7339566063dSJacob Faibussowitsch     /* PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,PETSC_DECIDE,reuse,&Bred)); */
7349566063dSJacob Faibussowitsch     PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm, Blocal, mm, reuse, &Bred));
7351e07b27eSBarry Smith   }
7361e07b27eSBarry Smith   *A = Bred;
7371e07b27eSBarry Smith 
7389566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&iscol));
7399566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&Bperm));
7409566063dSJacob Faibussowitsch   PetscCall(MatDestroyMatrices(1, &_Blocal));
7413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7421e07b27eSBarry Smith }
7431e07b27eSBarry Smith 
744d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatCreate_dmda(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A)
745d71ae5a4SJacob Faibussowitsch {
746ba1c3560SDave May   DM dm;
747ba1c3560SDave May   PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *);
748ba1c3560SDave May   void *dmksp_ctx;
749ba1c3560SDave May 
750ba1c3560SDave May   PetscFunctionBegin;
7519566063dSJacob Faibussowitsch   PetscCall(PCGetDM(pc, &dm));
7529566063dSJacob Faibussowitsch   PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx));
753dc9ee9fdSDave May   /* We assume that dmksp_func = NULL, is equivalent to dmActive = PETSC_FALSE */
7547c5279cbSDave May   if (dmksp_func && !sred->ignore_kspcomputeoperators) {
755ba1c3560SDave May     DM  dmrepart;
75628323a89SDave May     Mat Ak;
757ba1c3560SDave May 
758ba1c3560SDave May     *A = NULL;
75957f12427SDave May     if (PCTelescope_isActiveRank(sred)) {
7609566063dSJacob Faibussowitsch       PetscCall(KSPGetDM(sred->ksp, &dmrepart));
761ba1c3560SDave May       if (reuse == MAT_INITIAL_MATRIX) {
7629566063dSJacob Faibussowitsch         PetscCall(DMCreateMatrix(dmrepart, &Ak));
763ba1c3560SDave May         *A = Ak;
764ba1c3560SDave May       } else if (reuse == MAT_REUSE_MATRIX) {
765ba1c3560SDave May         Ak = *A;
766ba1c3560SDave May       }
7675c5dbb1cSDave May       /*
7685c5dbb1cSDave May        There is no need to explicitly assemble the operator now,
7695c5dbb1cSDave May        the sub-KSP will call the method provided to KSPSetComputeOperators() during KSPSetUp()
7705c5dbb1cSDave May       */
771ba1c3560SDave May     }
772ba1c3560SDave May   } else {
7739566063dSJacob Faibussowitsch     PetscCall(PCTelescopeMatCreate_dmda_dmactivefalse(pc, sred, reuse, A));
774ba1c3560SDave May   }
7753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
776ba1c3560SDave May }
777ba1c3560SDave May 
778*66976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc, PC_Telescope sred, MatNullSpace nullspace, MatNullSpace *sub_nullspace)
779d71ae5a4SJacob Faibussowitsch {
7801e07b27eSBarry Smith   PetscBool             has_const;
781a947c41eSDave May   PetscInt              i, k, n = 0;
7821e07b27eSBarry Smith   const Vec            *vecs;
783c41e779fSDave May   Vec                  *sub_vecs = NULL;
7841e07b27eSBarry Smith   MPI_Comm              subcomm;
7851e07b27eSBarry Smith   PC_Telescope_DMDACtx *ctx;
7861e07b27eSBarry Smith 
7871e07b27eSBarry Smith   PetscFunctionBegin;
7881e07b27eSBarry Smith   ctx     = (PC_Telescope_DMDACtx *)sred->dm_ctx;
7891e07b27eSBarry Smith   subcomm = PetscSubcommChild(sred->psubcomm);
7909566063dSJacob Faibussowitsch   PetscCall(MatNullSpaceGetVecs(nullspace, &has_const, &n, &vecs));
7911e07b27eSBarry Smith 
79257f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
7931e07b27eSBarry Smith     /* create new vectors */
79448a46eb9SPierre Jolivet     if (n) PetscCall(VecDuplicateVecs(sred->xred, n, &sub_vecs));
7951e07b27eSBarry Smith   }
7961e07b27eSBarry Smith 
7971e07b27eSBarry Smith   /* copy entries */
7981e07b27eSBarry Smith   for (k = 0; k < n; k++) {
7991e07b27eSBarry Smith     const PetscScalar *x_array;
8001e07b27eSBarry Smith     PetscScalar       *LA_sub_vec;
80113c30530SDave May     PetscInt           st, ed;
8021e07b27eSBarry Smith 
8031e07b27eSBarry Smith     /* permute vector into ordering associated with re-partitioned dmda */
8049566063dSJacob Faibussowitsch     PetscCall(MatMultTranspose(ctx->permutation, vecs[k], ctx->xp));
8051e07b27eSBarry Smith 
8061e07b27eSBarry Smith     /* pull in vector x->xtmp */
8079566063dSJacob Faibussowitsch     PetscCall(VecScatterBegin(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD));
8089566063dSJacob Faibussowitsch     PetscCall(VecScatterEnd(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD));
8091e07b27eSBarry Smith 
810392968a1SPatrick Sanan     /* copy vector entries into xred */
8119566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(sred->xtmp, &x_array));
812ea2b237eSDave May     if (sub_vecs) {
813ea2b237eSDave May       if (sub_vecs[k]) {
8149566063dSJacob Faibussowitsch         PetscCall(VecGetOwnershipRange(sub_vecs[k], &st, &ed));
8159566063dSJacob Faibussowitsch         PetscCall(VecGetArray(sub_vecs[k], &LA_sub_vec));
816ad540459SPierre Jolivet         for (i = 0; i < ed - st; i++) LA_sub_vec[i] = x_array[i];
8179566063dSJacob Faibussowitsch         PetscCall(VecRestoreArray(sub_vecs[k], &LA_sub_vec));
8181e07b27eSBarry Smith       }
819ea2b237eSDave May     }
8209566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(sred->xtmp, &x_array));
8211e07b27eSBarry Smith   }
8221e07b27eSBarry Smith 
82357f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
824d8b9d5b7SPatrick Sanan     /* create new (near) nullspace for redundant object */
8259566063dSJacob Faibussowitsch     PetscCall(MatNullSpaceCreate(subcomm, has_const, n, sub_vecs, sub_nullspace));
8269566063dSJacob Faibussowitsch     PetscCall(VecDestroyVecs(n, &sub_vecs));
82728b400f6SJacob Faibussowitsch     PetscCheck(!nullspace->remove, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope");
82828b400f6SJacob Faibussowitsch     PetscCheck(!nullspace->rmctx, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope");
829d8b9d5b7SPatrick Sanan   }
8303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
831392968a1SPatrick Sanan }
832392968a1SPatrick Sanan 
833d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatNullSpaceCreate_dmda(PC pc, PC_Telescope sred, Mat sub_mat)
834d71ae5a4SJacob Faibussowitsch {
835392968a1SPatrick Sanan   Mat B;
836392968a1SPatrick Sanan 
837392968a1SPatrick Sanan   PetscFunctionBegin;
8389566063dSJacob Faibussowitsch   PetscCall(PCGetOperators(pc, NULL, &B));
839392968a1SPatrick Sanan   {
840392968a1SPatrick Sanan     MatNullSpace nullspace, sub_nullspace;
8419566063dSJacob Faibussowitsch     PetscCall(MatGetNullSpace(B, &nullspace));
842392968a1SPatrick Sanan     if (nullspace) {
8439566063dSJacob Faibussowitsch       PetscCall(PetscInfo(pc, "PCTelescope: generating nullspace (DMDA)\n"));
8449566063dSJacob Faibussowitsch       PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nullspace, &sub_nullspace));
84557f12427SDave May       if (PCTelescope_isActiveRank(sred)) {
8469566063dSJacob Faibussowitsch         PetscCall(MatSetNullSpace(sub_mat, sub_nullspace));
8479566063dSJacob Faibussowitsch         PetscCall(MatNullSpaceDestroy(&sub_nullspace));
8481e07b27eSBarry Smith       }
849392968a1SPatrick Sanan     }
850392968a1SPatrick Sanan   }
851392968a1SPatrick Sanan   {
852392968a1SPatrick Sanan     MatNullSpace nearnullspace, sub_nearnullspace;
8539566063dSJacob Faibussowitsch     PetscCall(MatGetNearNullSpace(B, &nearnullspace));
854392968a1SPatrick Sanan     if (nearnullspace) {
8559566063dSJacob Faibussowitsch       PetscCall(PetscInfo(pc, "PCTelescope: generating near nullspace (DMDA)\n"));
8569566063dSJacob Faibussowitsch       PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nearnullspace, &sub_nearnullspace));
85757f12427SDave May       if (PCTelescope_isActiveRank(sred)) {
8589566063dSJacob Faibussowitsch         PetscCall(MatSetNearNullSpace(sub_mat, sub_nearnullspace));
8599566063dSJacob Faibussowitsch         PetscCall(MatNullSpaceDestroy(&sub_nearnullspace));
860392968a1SPatrick Sanan       }
861392968a1SPatrick Sanan     }
862392968a1SPatrick Sanan   }
8633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
8641e07b27eSBarry Smith }
8651e07b27eSBarry Smith 
866d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApply_Telescope_dmda(PC pc, Vec x, Vec y)
867d71ae5a4SJacob Faibussowitsch {
8681e07b27eSBarry Smith   PC_Telescope          sred = (PC_Telescope)pc->data;
8691e07b27eSBarry Smith   Mat                   perm;
8701e07b27eSBarry Smith   Vec                   xtmp, xp, xred, yred;
87113c30530SDave May   PetscInt              i, st, ed;
8721e07b27eSBarry Smith   VecScatter            scatter;
8731e07b27eSBarry Smith   PetscScalar          *array;
8741e07b27eSBarry Smith   const PetscScalar    *x_array;
8751e07b27eSBarry Smith   PC_Telescope_DMDACtx *ctx;
8761e07b27eSBarry Smith 
8771e07b27eSBarry Smith   ctx     = (PC_Telescope_DMDACtx *)sred->dm_ctx;
8781e07b27eSBarry Smith   xtmp    = sred->xtmp;
8791e07b27eSBarry Smith   scatter = sred->scatter;
8801e07b27eSBarry Smith   xred    = sred->xred;
8811e07b27eSBarry Smith   yred    = sred->yred;
8821e07b27eSBarry Smith   perm    = ctx->permutation;
8831e07b27eSBarry Smith   xp      = ctx->xp;
8841e07b27eSBarry Smith 
8851e07b27eSBarry Smith   PetscFunctionBegin;
8869566063dSJacob Faibussowitsch   PetscCall(PetscCitationsRegister(citation, &cited));
88714c9fce5SDave May 
8881e07b27eSBarry Smith   /* permute vector into ordering associated with re-partitioned dmda */
8899566063dSJacob Faibussowitsch   PetscCall(MatMultTranspose(perm, x, xp));
8901e07b27eSBarry Smith 
8911e07b27eSBarry Smith   /* pull in vector x->xtmp */
8929566063dSJacob Faibussowitsch   PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
8939566063dSJacob Faibussowitsch   PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
8941e07b27eSBarry Smith 
895a5b23f4aSJose E. Roman   /* copy vector entries into xred */
8969566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xtmp, &x_array));
8971e07b27eSBarry Smith   if (xred) {
8981e07b27eSBarry Smith     PetscScalar *LA_xred;
8999566063dSJacob Faibussowitsch     PetscCall(VecGetOwnershipRange(xred, &st, &ed));
9001e07b27eSBarry Smith 
9019566063dSJacob Faibussowitsch     PetscCall(VecGetArray(xred, &LA_xred));
902ad540459SPierre Jolivet     for (i = 0; i < ed - st; i++) LA_xred[i] = x_array[i];
9039566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xred, &LA_xred));
9041e07b27eSBarry Smith   }
9059566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xtmp, &x_array));
9061e07b27eSBarry Smith 
9071e07b27eSBarry Smith   /* solve */
90857f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
9099566063dSJacob Faibussowitsch     PetscCall(KSPSolve(sred->ksp, xred, yred));
9109566063dSJacob Faibussowitsch     PetscCall(KSPCheckSolve(sred->ksp, pc, yred));
9111e07b27eSBarry Smith   }
9121e07b27eSBarry Smith 
9131e07b27eSBarry Smith   /* return vector */
9149566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xtmp, &array));
9151e07b27eSBarry Smith   if (yred) {
9161e07b27eSBarry Smith     const PetscScalar *LA_yred;
9179566063dSJacob Faibussowitsch     PetscCall(VecGetOwnershipRange(yred, &st, &ed));
9189566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(yred, &LA_yred));
919ad540459SPierre Jolivet     for (i = 0; i < ed - st; i++) array[i] = LA_yred[i];
9209566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(yred, &LA_yred));
9211e07b27eSBarry Smith   }
9229566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xtmp, &array));
9239566063dSJacob Faibussowitsch   PetscCall(VecScatterBegin(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE));
9249566063dSJacob Faibussowitsch   PetscCall(VecScatterEnd(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE));
9259566063dSJacob Faibussowitsch   PetscCall(MatMult(perm, xp, y));
9263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
9271e07b27eSBarry Smith }
9281e07b27eSBarry Smith 
929d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApplyRichardson_Telescope_dmda(PC pc, Vec x, Vec y, Vec w, PetscReal rtol, PetscReal abstol, PetscReal dtol, PetscInt its, PetscBool zeroguess, PetscInt *outits, PCRichardsonConvergedReason *reason)
930d71ae5a4SJacob Faibussowitsch {
931f650675bSDave May   PC_Telescope          sred = (PC_Telescope)pc->data;
932f650675bSDave May   Mat                   perm;
933a1d91a28SDave May   Vec                   xtmp, xp, yred;
934f650675bSDave May   PetscInt              i, st, ed;
935f650675bSDave May   VecScatter            scatter;
936f650675bSDave May   const PetscScalar    *x_array;
937c41e779fSDave May   PetscBool             default_init_guess_value = PETSC_FALSE;
938f650675bSDave May   PC_Telescope_DMDACtx *ctx;
939f650675bSDave May 
94057f12427SDave May   PetscFunctionBegin;
941f650675bSDave May   ctx     = (PC_Telescope_DMDACtx *)sred->dm_ctx;
942f650675bSDave May   xtmp    = sred->xtmp;
943f650675bSDave May   scatter = sred->scatter;
944f650675bSDave May   yred    = sred->yred;
945f650675bSDave May   perm    = ctx->permutation;
946f650675bSDave May   xp      = ctx->xp;
947f650675bSDave May 
94808401ef6SPierre Jolivet   PetscCheck(its <= 1, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "PCApplyRichardson_Telescope_dmda only supports max_it = 1");
949f650675bSDave May   *reason = (PCRichardsonConvergedReason)0;
950f650675bSDave May 
951f650675bSDave May   if (!zeroguess) {
9529566063dSJacob Faibussowitsch     PetscCall(PetscInfo(pc, "PCTelescopeDMDA: Scattering y for non-zero-initial guess\n"));
953f650675bSDave May     /* permute vector into ordering associated with re-partitioned dmda */
9549566063dSJacob Faibussowitsch     PetscCall(MatMultTranspose(perm, y, xp));
955f650675bSDave May 
956f650675bSDave May     /* pull in vector x->xtmp */
9579566063dSJacob Faibussowitsch     PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
9589566063dSJacob Faibussowitsch     PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD));
959f650675bSDave May 
960a5b23f4aSJose E. Roman     /* copy vector entries into xred */
9619566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(xtmp, &x_array));
962f650675bSDave May     if (yred) {
963f650675bSDave May       PetscScalar *LA_yred;
9649566063dSJacob Faibussowitsch       PetscCall(VecGetOwnershipRange(yred, &st, &ed));
9659566063dSJacob Faibussowitsch       PetscCall(VecGetArray(yred, &LA_yred));
966ad540459SPierre Jolivet       for (i = 0; i < ed - st; i++) LA_yred[i] = x_array[i];
9679566063dSJacob Faibussowitsch       PetscCall(VecRestoreArray(yred, &LA_yred));
968f650675bSDave May     }
9699566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(xtmp, &x_array));
970f650675bSDave May   }
971f650675bSDave May 
97257f12427SDave May   if (PCTelescope_isActiveRank(sred)) {
9739566063dSJacob Faibussowitsch     PetscCall(KSPGetInitialGuessNonzero(sred->ksp, &default_init_guess_value));
9749566063dSJacob Faibussowitsch     if (!zeroguess) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, PETSC_TRUE));
975f650675bSDave May   }
976f650675bSDave May 
9779566063dSJacob Faibussowitsch   PetscCall(PCApply_Telescope_dmda(pc, x, y));
978f650675bSDave May 
97948a46eb9SPierre Jolivet   if (PCTelescope_isActiveRank(sred)) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, default_init_guess_value));
980f650675bSDave May 
981f650675bSDave May   if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS;
982f650675bSDave May   *outits = 1;
9833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
984f650675bSDave May }
985f650675bSDave May 
986d71ae5a4SJacob Faibussowitsch PetscErrorCode PCReset_Telescope_dmda(PC pc)
987d71ae5a4SJacob Faibussowitsch {
9881e07b27eSBarry Smith   PC_Telescope          sred = (PC_Telescope)pc->data;
9891e07b27eSBarry Smith   PC_Telescope_DMDACtx *ctx;
9901e07b27eSBarry Smith 
9911e07b27eSBarry Smith   PetscFunctionBegin;
9921e07b27eSBarry Smith   ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx;
9939566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&ctx->xp));
9949566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&ctx->permutation));
9959566063dSJacob Faibussowitsch   PetscCall(DMDestroy(&ctx->dmrepart));
9969566063dSJacob Faibussowitsch   PetscCall(PetscFree3(ctx->range_i_re, ctx->range_j_re, ctx->range_k_re));
9979566063dSJacob Faibussowitsch   PetscCall(PetscFree3(ctx->start_i_re, ctx->start_j_re, ctx->start_k_re));
9983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
9991e07b27eSBarry Smith }
10001e07b27eSBarry Smith 
1001*66976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_3d(DM dm, PetscViewer v)
1002d71ae5a4SJacob Faibussowitsch {
10031e07b27eSBarry Smith   PetscInt    M, N, P, m, n, p, ndof, nsw;
10041e07b27eSBarry Smith   MPI_Comm    comm;
10051e07b27eSBarry Smith   PetscMPIInt size;
10061e07b27eSBarry Smith   const char *prefix;
10071e07b27eSBarry Smith 
10081e07b27eSBarry Smith   PetscFunctionBegin;
10099566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)dm, &comm));
10109566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(comm, &size));
10119566063dSJacob Faibussowitsch   PetscCall(DMGetOptionsPrefix(dm, &prefix));
10129566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, &m, &n, &p, &ndof, &nsw, NULL, NULL, NULL, NULL));
10139566063dSJacob Faibussowitsch   if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object:    (%s)    %d MPI processes\n", prefix, size));
10149566063dSJacob Faibussowitsch   else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object:    %d MPI processes\n", size));
101563a3b9bcSJacob Faibussowitsch   PetscCall(PetscViewerASCIIPrintf(v, "  M %" PetscInt_FMT " N %" PetscInt_FMT " P %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " p %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, P, m, n, p, ndof, nsw));
10163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
10171e07b27eSBarry Smith }
10181e07b27eSBarry Smith 
1019*66976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_2d(DM dm, PetscViewer v)
1020d71ae5a4SJacob Faibussowitsch {
10211e07b27eSBarry Smith   PetscInt    M, N, m, n, ndof, nsw;
10221e07b27eSBarry Smith   MPI_Comm    comm;
10231e07b27eSBarry Smith   PetscMPIInt size;
10241e07b27eSBarry Smith   const char *prefix;
10251e07b27eSBarry Smith 
10261e07b27eSBarry Smith   PetscFunctionBegin;
10279566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)dm, &comm));
10289566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(comm, &size));
10299566063dSJacob Faibussowitsch   PetscCall(DMGetOptionsPrefix(dm, &prefix));
10309566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, &m, &n, NULL, &ndof, &nsw, NULL, NULL, NULL, NULL));
10319566063dSJacob Faibussowitsch   if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object:    (%s)    %d MPI processes\n", prefix, size));
10329566063dSJacob Faibussowitsch   else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object:    %d MPI processes\n", size));
103363a3b9bcSJacob Faibussowitsch   PetscCall(PetscViewerASCIIPrintf(v, "  M %" PetscInt_FMT " N %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, m, n, ndof, nsw));
10343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
10351e07b27eSBarry Smith }
10361e07b27eSBarry Smith 
1037d71ae5a4SJacob Faibussowitsch PetscErrorCode DMView_DA_Short(DM dm, PetscViewer v)
1038d71ae5a4SJacob Faibussowitsch {
10391e07b27eSBarry Smith   PetscInt dim;
10401e07b27eSBarry Smith 
10411e07b27eSBarry Smith   PetscFunctionBegin;
10429566063dSJacob Faibussowitsch   PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL));
10431e07b27eSBarry Smith   switch (dim) {
1044d71ae5a4SJacob Faibussowitsch   case 2:
1045d71ae5a4SJacob Faibussowitsch     PetscCall(DMView_DA_Short_2d(dm, v));
1046d71ae5a4SJacob Faibussowitsch     break;
1047d71ae5a4SJacob Faibussowitsch   case 3:
1048d71ae5a4SJacob Faibussowitsch     PetscCall(DMView_DA_Short_3d(dm, v));
1049d71ae5a4SJacob Faibussowitsch     break;
10501e07b27eSBarry Smith   }
10513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
10521e07b27eSBarry Smith }
1053