1120bdd93SDave May #include <petsc/private/matimpl.h> 21e07b27eSBarry Smith #include <petsc/private/pcimpl.h> 35e897e82SDave May #include <petsc/private/dmimpl.h> 41e07b27eSBarry Smith #include <petscksp.h> /*I "petscksp.h" I*/ 51e07b27eSBarry Smith #include <petscdm.h> 61e07b27eSBarry Smith #include <petscdmda.h> 71e07b27eSBarry Smith 8575a0592SBarry Smith #include "../src/ksp/pc/impls/telescope/telescope.h" 91e07b27eSBarry Smith 10bf00f589SPatrick Sanan static PetscBool cited = PETSC_FALSE; 119371c9d4SSatish Balay static const char citation[] = "@inproceedings{MaySananRuppKnepleySmith2016,\n" 12bf00f589SPatrick Sanan " title = {Extreme-Scale Multigrid Components within PETSc},\n" 13bf00f589SPatrick Sanan " author = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n" 14bf00f589SPatrick Sanan " booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n" 15bf00f589SPatrick Sanan " series = {PASC '16},\n" 16bf00f589SPatrick Sanan " isbn = {978-1-4503-4126-4},\n" 17bf00f589SPatrick Sanan " location = {Lausanne, Switzerland},\n" 18bf00f589SPatrick Sanan " pages = {5:1--5:12},\n" 19bf00f589SPatrick Sanan " articleno = {5},\n" 20bf00f589SPatrick Sanan " numpages = {12},\n" 21a8d69d7bSBarry Smith " url = {https://doi.acm.org/10.1145/2929908.2929913},\n" 22bf00f589SPatrick Sanan " doi = {10.1145/2929908.2929913},\n" 23bf00f589SPatrick Sanan " acmid = {2929913},\n" 24bf00f589SPatrick Sanan " publisher = {ACM},\n" 25bf00f589SPatrick Sanan " address = {New York, NY, USA},\n" 26bf00f589SPatrick Sanan " keywords = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n" 27bf00f589SPatrick Sanan " year = {2016}\n" 28bf00f589SPatrick Sanan "}\n"; 29bf00f589SPatrick Sanan 30d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineRankFromGlobalIJK(PetscInt dim, PetscInt i, PetscInt j, PetscInt k, PetscInt Mp, PetscInt Np, PetscInt Pp, PetscInt start_i[], PetscInt start_j[], PetscInt start_k[], PetscInt span_i[], PetscInt span_j[], PetscInt span_k[], PetscMPIInt *_pi, PetscMPIInt *_pj, PetscMPIInt *_pk, PetscMPIInt *rank_re) 31d71ae5a4SJacob Faibussowitsch { 321e07b27eSBarry Smith PetscInt pi, pj, pk, n; 331e07b27eSBarry Smith 341e07b27eSBarry Smith PetscFunctionBegin; 35137d0469SJed Brown *rank_re = -1; 36137d0469SJed Brown if (_pi) *_pi = -1; 37137d0469SJed Brown if (_pj) *_pj = -1; 38137d0469SJed Brown if (_pk) *_pk = -1; 391e07b27eSBarry Smith pi = pj = pk = -1; 401e07b27eSBarry Smith if (_pi) { 411e07b27eSBarry Smith for (n = 0; n < Mp; n++) { 421e07b27eSBarry Smith if ((i >= start_i[n]) && (i < start_i[n] + span_i[n])) { 431e07b27eSBarry Smith pi = n; 441e07b27eSBarry Smith break; 451e07b27eSBarry Smith } 461e07b27eSBarry Smith } 4763a3b9bcSJacob Faibussowitsch PetscCheck(pi != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pi cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Mp, i); 48835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi, _pi)); 491e07b27eSBarry Smith } 501e07b27eSBarry Smith 511e07b27eSBarry Smith if (_pj) { 521e07b27eSBarry Smith for (n = 0; n < Np; n++) { 531e07b27eSBarry Smith if ((j >= start_j[n]) && (j < start_j[n] + span_j[n])) { 541e07b27eSBarry Smith pj = n; 551e07b27eSBarry Smith break; 561e07b27eSBarry Smith } 571e07b27eSBarry Smith } 5863a3b9bcSJacob Faibussowitsch PetscCheck(pj != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pj cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Np, j); 59835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pj, _pj)); 601e07b27eSBarry Smith } 611e07b27eSBarry Smith 621e07b27eSBarry Smith if (_pk) { 631e07b27eSBarry Smith for (n = 0; n < Pp; n++) { 641e07b27eSBarry Smith if ((k >= start_k[n]) && (k < start_k[n] + span_k[n])) { 651e07b27eSBarry Smith pk = n; 661e07b27eSBarry Smith break; 671e07b27eSBarry Smith } 681e07b27eSBarry Smith } 6963a3b9bcSJacob Faibussowitsch PetscCheck(pk != -1, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmda-ijk] pk cannot be determined : range %" PetscInt_FMT ", val %" PetscInt_FMT, Pp, k); 70835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pk, _pk)); 711e07b27eSBarry Smith } 721e07b27eSBarry Smith 731e07b27eSBarry Smith switch (dim) { 74d71ae5a4SJacob Faibussowitsch case 1: 75835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi, rank_re)); 76d71ae5a4SJacob Faibussowitsch break; 77d71ae5a4SJacob Faibussowitsch case 2: 78835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi + pj * Mp, rank_re)); 79d71ae5a4SJacob Faibussowitsch break; 80d71ae5a4SJacob Faibussowitsch case 3: 81835f2295SStefano Zampini PetscCall(PetscMPIIntCast(pi + pj * Mp + pk * (Mp * Np), rank_re)); 82d71ae5a4SJacob Faibussowitsch break; 831e07b27eSBarry Smith } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 851e07b27eSBarry Smith } 861e07b27eSBarry Smith 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode _DMDADetermineGlobalS0(PetscInt dim, PetscMPIInt rank_re, PetscInt Mp_re, PetscInt Np_re, PetscInt Pp_re, PetscInt range_i_re[], PetscInt range_j_re[], PetscInt range_k_re[], PetscInt *s0) 88d71ae5a4SJacob Faibussowitsch { 89c6a0d831SBarry Smith PetscInt i, j, k, start_IJK = 0; 901e07b27eSBarry Smith PetscInt rank_ijk; 911e07b27eSBarry Smith 921e07b27eSBarry Smith PetscFunctionBegin; 931e07b27eSBarry Smith switch (dim) { 941e07b27eSBarry Smith case 1: 951e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) { 961e07b27eSBarry Smith rank_ijk = i; 97ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i]; 981e07b27eSBarry Smith } 991e07b27eSBarry Smith break; 1001e07b27eSBarry Smith case 2: 1011e07b27eSBarry Smith for (j = 0; j < Np_re; j++) { 1021e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) { 1031e07b27eSBarry Smith rank_ijk = i + j * Mp_re; 104ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j]; 1051e07b27eSBarry Smith } 1061e07b27eSBarry Smith } 1071e07b27eSBarry Smith break; 1081e07b27eSBarry Smith case 3: 1091e07b27eSBarry Smith for (k = 0; k < Pp_re; k++) { 1101e07b27eSBarry Smith for (j = 0; j < Np_re; j++) { 1111e07b27eSBarry Smith for (i = 0; i < Mp_re; i++) { 1121e07b27eSBarry Smith rank_ijk = i + j * Mp_re + k * Mp_re * Np_re; 113ad540459SPierre Jolivet if (rank_ijk < rank_re) start_IJK += range_i_re[i] * range_j_re[j] * range_k_re[k]; 1141e07b27eSBarry Smith } 1151e07b27eSBarry Smith } 1161e07b27eSBarry Smith } 1171e07b27eSBarry Smith break; 1181e07b27eSBarry Smith } 1191e07b27eSBarry Smith *s0 = start_IJK; 1203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1211e07b27eSBarry Smith } 1221e07b27eSBarry Smith 123d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors2d(PC_Telescope sred, DM dm, DM subdm) 124d71ae5a4SJacob Faibussowitsch { 1251e07b27eSBarry Smith DM cdm; 1261e07b27eSBarry Smith Vec coor, coor_natural, perm_coors; 1271e07b27eSBarry Smith PetscInt i, j, si, sj, ni, nj, M, N, Ml, Nl, c, nidx; 1281e07b27eSBarry Smith PetscInt *fine_indices; 1291e07b27eSBarry Smith IS is_fine, is_local; 1301e07b27eSBarry Smith VecScatter sctx; 1311e07b27eSBarry Smith 1321e07b27eSBarry Smith PetscFunctionBegin; 1339566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor)); 1343ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS); 13548a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0)); 1361e07b27eSBarry Smith /* Get the coordinate vector from the distributed array */ 1379566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(dm, &cdm)); 1389566063dSJacob Faibussowitsch PetscCall(DMDACreateNaturalVector(cdm, &coor_natural)); 1391e07b27eSBarry Smith 1409566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural)); 1419566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural)); 1421e07b27eSBarry Smith 1431e07b27eSBarry Smith /* get indices of the guys I want to grab */ 1449566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL)); 14557f12427SDave May if (PCTelescope_isActiveRank(sred)) { 1469566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(subdm, &si, &sj, NULL, &ni, &nj, NULL)); 14715dd08bcSBarry Smith Ml = ni; 14815dd08bcSBarry Smith Nl = nj; 1491e07b27eSBarry Smith } else { 150c41e779fSDave May si = sj = 0; 151c41e779fSDave May ni = nj = 0; 1523ac26c5eSBarry Smith Ml = Nl = 0; 1531e07b27eSBarry Smith } 1541e07b27eSBarry Smith 1559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Ml * Nl * 2, &fine_indices)); 1561e07b27eSBarry Smith c = 0; 15757f12427SDave May if (PCTelescope_isActiveRank(sred)) { 1581e07b27eSBarry Smith for (j = sj; j < sj + nj; j++) { 1591e07b27eSBarry Smith for (i = si; i < si + ni; i++) { 1601e07b27eSBarry Smith nidx = (i) + (j)*M; 1611e07b27eSBarry Smith fine_indices[c] = 2 * nidx; 1621e07b27eSBarry Smith fine_indices[c + 1] = 2 * nidx + 1; 1631e07b27eSBarry Smith c = c + 2; 1641e07b27eSBarry Smith } 1651e07b27eSBarry Smith } 16663a3b9bcSJacob Faibussowitsch PetscCheck(c == Ml * Nl * 2, PETSC_COMM_SELF, PETSC_ERR_PLIB, "c %" PetscInt_FMT " should equal 2 * Ml %" PetscInt_FMT " * Nl %" PetscInt_FMT, c, Ml, Nl); 1671e07b27eSBarry Smith } 1681e07b27eSBarry Smith 1691e07b27eSBarry Smith /* generate scatter */ 1709566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * 2, fine_indices, PETSC_USE_POINTER, &is_fine)); 1719566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * 2, 0, 1, &is_local)); 1721e07b27eSBarry Smith 1731e07b27eSBarry Smith /* scatter */ 1749566063dSJacob Faibussowitsch PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors)); 1759566063dSJacob Faibussowitsch PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * 2)); 1769566063dSJacob Faibussowitsch PetscCall(VecSetType(perm_coors, VECSEQ)); 1771e07b27eSBarry Smith 1789566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx)); 1799566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD)); 1809566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD)); 1811e07b27eSBarry Smith /* access */ 18257f12427SDave May if (PCTelescope_isActiveRank(sred)) { 1831e07b27eSBarry Smith Vec _coors; 1841e07b27eSBarry Smith const PetscScalar *LA_perm; 1851e07b27eSBarry Smith PetscScalar *LA_coors; 1861e07b27eSBarry Smith 1879566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors)); 1889566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(perm_coors, &LA_perm)); 1899566063dSJacob Faibussowitsch PetscCall(VecGetArray(_coors, &LA_coors)); 190ad540459SPierre Jolivet for (i = 0; i < Ml * Nl * 2; i++) LA_coors[i] = LA_perm[i]; 1919566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(_coors, &LA_coors)); 1929566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm)); 1931e07b27eSBarry Smith } 1941e07b27eSBarry Smith 1951e07b27eSBarry Smith /* update local coords */ 19657f12427SDave May if (PCTelescope_isActiveRank(sred)) { 1971e07b27eSBarry Smith DM _dmc; 1981e07b27eSBarry Smith Vec _coors, _coors_local; 1999566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(subdm, &_dmc)); 2009566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors)); 2019566063dSJacob Faibussowitsch PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local)); 2029566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local)); 2039566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local)); 2041e07b27eSBarry Smith } 2059566063dSJacob Faibussowitsch PetscCall(VecScatterDestroy(&sctx)); 2069566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_fine)); 2079566063dSJacob Faibussowitsch PetscCall(PetscFree(fine_indices)); 2089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_local)); 2099566063dSJacob Faibussowitsch PetscCall(VecDestroy(&perm_coors)); 2109566063dSJacob Faibussowitsch PetscCall(VecDestroy(&coor_natural)); 2113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2121e07b27eSBarry Smith } 2131e07b27eSBarry Smith 214d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors3d(PC_Telescope sred, DM dm, DM subdm) 215d71ae5a4SJacob Faibussowitsch { 2161e07b27eSBarry Smith DM cdm; 2171e07b27eSBarry Smith Vec coor, coor_natural, perm_coors; 2181e07b27eSBarry Smith PetscInt i, j, k, si, sj, sk, ni, nj, nk, M, N, P, Ml, Nl, Pl, c, nidx; 2191e07b27eSBarry Smith PetscInt *fine_indices; 2201e07b27eSBarry Smith IS is_fine, is_local; 2211e07b27eSBarry Smith VecScatter sctx; 2221e07b27eSBarry Smith 2231e07b27eSBarry Smith PetscFunctionBegin; 2249566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor)); 2253ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS); 2261e07b27eSBarry Smith 22748a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(DMDASetUniformCoordinates(subdm, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0)); 2281e07b27eSBarry Smith 2291e07b27eSBarry Smith /* Get the coordinate vector from the distributed array */ 2309566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(dm, &cdm)); 2319566063dSJacob Faibussowitsch PetscCall(DMDACreateNaturalVector(cdm, &coor_natural)); 2329566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalBegin(cdm, coor, INSERT_VALUES, coor_natural)); 2339566063dSJacob Faibussowitsch PetscCall(DMDAGlobalToNaturalEnd(cdm, coor, INSERT_VALUES, coor_natural)); 2341e07b27eSBarry Smith 2351e07b27eSBarry Smith /* get indices of the guys I want to grab */ 2369566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL)); 2371e07b27eSBarry Smith 23857f12427SDave May if (PCTelescope_isActiveRank(sred)) { 2399566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(subdm, &si, &sj, &sk, &ni, &nj, &nk)); 240553d0ae9SBarry Smith Ml = ni; 241553d0ae9SBarry Smith Nl = nj; 242553d0ae9SBarry Smith Pl = nk; 2431e07b27eSBarry Smith } else { 244c41e779fSDave May si = sj = sk = 0; 245c41e779fSDave May ni = nj = nk = 0; 2463ac26c5eSBarry Smith Ml = Nl = Pl = 0; 2471e07b27eSBarry Smith } 2481e07b27eSBarry Smith 2499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Ml * Nl * Pl * 3, &fine_indices)); 2501e07b27eSBarry Smith 2511e07b27eSBarry Smith c = 0; 25257f12427SDave May if (PCTelescope_isActiveRank(sred)) { 2531e07b27eSBarry Smith for (k = sk; k < sk + nk; k++) { 2541e07b27eSBarry Smith for (j = sj; j < sj + nj; j++) { 2551e07b27eSBarry Smith for (i = si; i < si + ni; i++) { 2561e07b27eSBarry Smith nidx = (i) + (j)*M + (k)*M * N; 2571e07b27eSBarry Smith fine_indices[c] = 3 * nidx; 2581e07b27eSBarry Smith fine_indices[c + 1] = 3 * nidx + 1; 2591e07b27eSBarry Smith fine_indices[c + 2] = 3 * nidx + 2; 2601e07b27eSBarry Smith c = c + 3; 2611e07b27eSBarry Smith } 2621e07b27eSBarry Smith } 2631e07b27eSBarry Smith } 2641e07b27eSBarry Smith } 2651e07b27eSBarry Smith 2661e07b27eSBarry Smith /* generate scatter */ 2679566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)dm), Ml * Nl * Pl * 3, fine_indices, PETSC_USE_POINTER, &is_fine)); 2689566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, Ml * Nl * Pl * 3, 0, 1, &is_local)); 2691e07b27eSBarry Smith 2701e07b27eSBarry Smith /* scatter */ 2719566063dSJacob Faibussowitsch PetscCall(VecCreate(PETSC_COMM_SELF, &perm_coors)); 2729566063dSJacob Faibussowitsch PetscCall(VecSetSizes(perm_coors, PETSC_DECIDE, Ml * Nl * Pl * 3)); 2739566063dSJacob Faibussowitsch PetscCall(VecSetType(perm_coors, VECSEQ)); 2749566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(coor_natural, is_fine, perm_coors, is_local, &sctx)); 2759566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD)); 2769566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sctx, coor_natural, perm_coors, INSERT_VALUES, SCATTER_FORWARD)); 2771e07b27eSBarry Smith 2781e07b27eSBarry Smith /* access */ 27957f12427SDave May if (PCTelescope_isActiveRank(sred)) { 2801e07b27eSBarry Smith Vec _coors; 2811e07b27eSBarry Smith const PetscScalar *LA_perm; 2821e07b27eSBarry Smith PetscScalar *LA_coors; 2831e07b27eSBarry Smith 2849566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors)); 2859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(perm_coors, &LA_perm)); 2869566063dSJacob Faibussowitsch PetscCall(VecGetArray(_coors, &LA_coors)); 287ad540459SPierre Jolivet for (i = 0; i < Ml * Nl * Pl * 3; i++) LA_coors[i] = LA_perm[i]; 2889566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(_coors, &LA_coors)); 2899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(perm_coors, &LA_perm)); 2901e07b27eSBarry Smith } 2911e07b27eSBarry Smith 2921e07b27eSBarry Smith /* update local coords */ 29357f12427SDave May if (PCTelescope_isActiveRank(sred)) { 2941e07b27eSBarry Smith DM _dmc; 2951e07b27eSBarry Smith Vec _coors, _coors_local; 2961e07b27eSBarry Smith 2979566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDM(subdm, &_dmc)); 2989566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(subdm, &_coors)); 2999566063dSJacob Faibussowitsch PetscCall(DMGetCoordinatesLocal(subdm, &_coors_local)); 3009566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalBegin(_dmc, _coors, INSERT_VALUES, _coors_local)); 3019566063dSJacob Faibussowitsch PetscCall(DMGlobalToLocalEnd(_dmc, _coors, INSERT_VALUES, _coors_local)); 3021e07b27eSBarry Smith } 3031e07b27eSBarry Smith 3049566063dSJacob Faibussowitsch PetscCall(VecScatterDestroy(&sctx)); 3059566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_fine)); 3069566063dSJacob Faibussowitsch PetscCall(PetscFree(fine_indices)); 3079566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is_local)); 3089566063dSJacob Faibussowitsch PetscCall(VecDestroy(&perm_coors)); 3099566063dSJacob Faibussowitsch PetscCall(VecDestroy(&coor_natural)); 3103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3111e07b27eSBarry Smith } 3121e07b27eSBarry Smith 313d71ae5a4SJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx) 314d71ae5a4SJacob Faibussowitsch { 3151e07b27eSBarry Smith PetscInt dim; 3161e07b27eSBarry Smith DM dm, subdm; 3171e07b27eSBarry Smith PetscSubcomm psubcomm; 3181e07b27eSBarry Smith MPI_Comm comm; 3191e07b27eSBarry Smith Vec coor; 3201e07b27eSBarry Smith 3211e07b27eSBarry Smith PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 3239566063dSJacob Faibussowitsch PetscCall(DMGetCoordinates(dm, &coor)); 3243ba16761SJacob Faibussowitsch if (!coor) PetscFunctionReturn(PETSC_SUCCESS); 3251e07b27eSBarry Smith psubcomm = sred->psubcomm; 3261e07b27eSBarry Smith comm = PetscSubcommParent(psubcomm); 3271e07b27eSBarry Smith subdm = ctx->dmrepart; 3281e07b27eSBarry Smith 3299566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the coordinates (DMDA)\n")); 3309566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL)); 3311e07b27eSBarry Smith switch (dim) { 332d71ae5a4SJacob Faibussowitsch case 1: 333d71ae5a4SJacob Faibussowitsch SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided"); 334d71ae5a4SJacob Faibussowitsch case 2: 335d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors2d(sred, dm, subdm)); 336d71ae5a4SJacob Faibussowitsch break; 337d71ae5a4SJacob Faibussowitsch case 3: 338d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors3d(sred, dm, subdm)); 339d71ae5a4SJacob Faibussowitsch break; 3401e07b27eSBarry Smith } 3413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3421e07b27eSBarry Smith } 3431e07b27eSBarry Smith 3441e07b27eSBarry Smith /* setup repartitioned dm */ 34566976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_repart(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx) 346d71ae5a4SJacob Faibussowitsch { 3471e07b27eSBarry Smith DM dm; 3481e07b27eSBarry Smith PetscInt dim, nx, ny, nz, ndof, nsw, sum, k; 3491e07b27eSBarry Smith DMBoundaryType bx, by, bz; 3501e07b27eSBarry Smith DMDAStencilType stencil; 3511e07b27eSBarry Smith const PetscInt *_range_i_re; 3521e07b27eSBarry Smith const PetscInt *_range_j_re; 3531e07b27eSBarry Smith const PetscInt *_range_k_re; 3541e07b27eSBarry Smith DMDAInterpolationType itype; 3551e07b27eSBarry Smith PetscInt refine_x, refine_y, refine_z; 3561e07b27eSBarry Smith MPI_Comm comm, subcomm; 3571e07b27eSBarry Smith const char *prefix; 358835f2295SStefano Zampini PetscMPIInt ni; 3591e07b27eSBarry Smith 3601e07b27eSBarry Smith PetscFunctionBegin; 3611e07b27eSBarry Smith comm = PetscSubcommParent(sred->psubcomm); 3621e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm); 3639566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 3641e07b27eSBarry Smith 3659566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, &nsw, &bx, &by, &bz, &stencil)); 3669566063dSJacob Faibussowitsch PetscCall(DMDAGetInterpolationType(dm, &itype)); 3679566063dSJacob Faibussowitsch PetscCall(DMDAGetRefinementFactor(dm, &refine_x, &refine_y, &refine_z)); 3681e07b27eSBarry Smith 3691e07b27eSBarry Smith ctx->dmrepart = NULL; 3701e07b27eSBarry Smith _range_i_re = _range_j_re = _range_k_re = NULL; 3711e07b27eSBarry Smith /* Create DMDA on the child communicator */ 37257f12427SDave May if (PCTelescope_isActiveRank(sred)) { 3731e07b27eSBarry Smith switch (dim) { 3741e07b27eSBarry Smith case 1: 3759566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (1D)\n")); 3769566063dSJacob Faibussowitsch /* PetscCall(DMDACreate1d(subcomm,bx,nx,ndof,nsw,NULL,&ctx->dmrepart)); */ 3771e07b27eSBarry Smith ny = nz = 1; 3781e07b27eSBarry Smith by = bz = DM_BOUNDARY_NONE; 3791e07b27eSBarry Smith break; 3801e07b27eSBarry Smith case 2: 3819566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (2D)\n")); 3829566063dSJacob Faibussowitsch /* PetscCall(DMDACreate2d(subcomm,bx,by,stencil,nx,ny, PETSC_DECIDE,PETSC_DECIDE, 3839566063dSJacob Faibussowitsch ndof,nsw, NULL,NULL,&ctx->dmrepart)); */ 3841e07b27eSBarry Smith nz = 1; 3851e07b27eSBarry Smith bz = DM_BOUNDARY_NONE; 3861e07b27eSBarry Smith break; 3871e07b27eSBarry Smith case 3: 3889566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the DMDA on comm subset (3D)\n")); 3899566063dSJacob Faibussowitsch /* PetscCall(DMDACreate3d(subcomm,bx,by,bz,stencil,nx,ny,nz, 3909566063dSJacob Faibussowitsch PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,NULL,&ctx->dmrepart)); */ 3911e07b27eSBarry Smith break; 3921e07b27eSBarry Smith } 3931e07b27eSBarry Smith /* 3941e07b27eSBarry Smith The API DMDACreate1d(), DMDACreate2d(), DMDACreate3d() does not allow us to set/append 3951e07b27eSBarry Smith a unique option prefix for the DM, thus I prefer to expose the contents of these API's here. 3961e07b27eSBarry Smith This allows users to control the partitioning of the subDM. 3971e07b27eSBarry Smith */ 3989566063dSJacob Faibussowitsch PetscCall(DMDACreate(subcomm, &ctx->dmrepart)); 3991e07b27eSBarry Smith /* Set unique option prefix name */ 4009566063dSJacob Faibussowitsch PetscCall(KSPGetOptionsPrefix(sred->ksp, &prefix)); 4019566063dSJacob Faibussowitsch PetscCall(DMSetOptionsPrefix(ctx->dmrepart, prefix)); 4029566063dSJacob Faibussowitsch PetscCall(DMAppendOptionsPrefix(ctx->dmrepart, "repart_")); 4031e07b27eSBarry Smith /* standard setup from DMDACreate{1,2,3}d() */ 4049566063dSJacob Faibussowitsch PetscCall(DMSetDimension(ctx->dmrepart, dim)); 4059566063dSJacob Faibussowitsch PetscCall(DMDASetSizes(ctx->dmrepart, nx, ny, nz)); 4069566063dSJacob Faibussowitsch PetscCall(DMDASetNumProcs(ctx->dmrepart, PETSC_DECIDE, PETSC_DECIDE, PETSC_DECIDE)); 4079566063dSJacob Faibussowitsch PetscCall(DMDASetBoundaryType(ctx->dmrepart, bx, by, bz)); 4089566063dSJacob Faibussowitsch PetscCall(DMDASetDof(ctx->dmrepart, ndof)); 4099566063dSJacob Faibussowitsch PetscCall(DMDASetStencilType(ctx->dmrepart, stencil)); 4109566063dSJacob Faibussowitsch PetscCall(DMDASetStencilWidth(ctx->dmrepart, nsw)); 4119566063dSJacob Faibussowitsch PetscCall(DMDASetOwnershipRanges(ctx->dmrepart, NULL, NULL, NULL)); 4129566063dSJacob Faibussowitsch PetscCall(DMSetFromOptions(ctx->dmrepart)); 4139566063dSJacob Faibussowitsch PetscCall(DMSetUp(ctx->dmrepart)); 4141e07b27eSBarry Smith /* Set refinement factors and interpolation type from the partent */ 4159566063dSJacob Faibussowitsch PetscCall(DMDASetRefinementFactor(ctx->dmrepart, refine_x, refine_y, refine_z)); 4169566063dSJacob Faibussowitsch PetscCall(DMDASetInterpolationType(ctx->dmrepart, itype)); 4171e07b27eSBarry Smith 4189566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(ctx->dmrepart, NULL, NULL, NULL, NULL, &ctx->Mp_re, &ctx->Np_re, &ctx->Pp_re, NULL, NULL, NULL, NULL, NULL, NULL)); 4199566063dSJacob Faibussowitsch PetscCall(DMDAGetOwnershipRanges(ctx->dmrepart, &_range_i_re, &_range_j_re, &_range_k_re)); 4205e897e82SDave May 4215e897e82SDave May ctx->dmrepart->ops->creatematrix = dm->ops->creatematrix; 4225e897e82SDave May ctx->dmrepart->ops->createdomaindecomposition = dm->ops->createdomaindecomposition; 4231e07b27eSBarry Smith } 4241e07b27eSBarry Smith 4251e07b27eSBarry Smith /* generate ranges for repartitioned dm */ 4261e07b27eSBarry Smith /* note - assume rank 0 always participates */ 427071fcb05SBarry Smith /* TODO: use a single MPI call */ 4289566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Mp_re, 1, MPIU_INT, 0, comm)); 4299566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Np_re, 1, MPIU_INT, 0, comm)); 4309566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&ctx->Pp_re, 1, MPIU_INT, 0, comm)); 4311e07b27eSBarry Smith 4329566063dSJacob Faibussowitsch PetscCall(PetscCalloc3(ctx->Mp_re, &ctx->range_i_re, ctx->Np_re, &ctx->range_j_re, ctx->Pp_re, &ctx->range_k_re)); 4331e07b27eSBarry Smith 4349566063dSJacob Faibussowitsch if (_range_i_re) PetscCall(PetscArraycpy(ctx->range_i_re, _range_i_re, ctx->Mp_re)); 4359566063dSJacob Faibussowitsch if (_range_j_re) PetscCall(PetscArraycpy(ctx->range_j_re, _range_j_re, ctx->Np_re)); 4369566063dSJacob Faibussowitsch if (_range_k_re) PetscCall(PetscArraycpy(ctx->range_k_re, _range_k_re, ctx->Pp_re)); 4371e07b27eSBarry Smith 438071fcb05SBarry Smith /* TODO: use a single MPI call */ 439835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Mp_re, &ni)); 440835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_i_re, ni, MPIU_INT, 0, comm)); 441835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Np_re, &ni)); 442835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_j_re, ni, MPIU_INT, 0, comm)); 443835f2295SStefano Zampini PetscCall(PetscMPIIntCast(ctx->Pp_re, &ni)); 444835f2295SStefano Zampini PetscCallMPI(MPI_Bcast(ctx->range_k_re, ni, MPIU_INT, 0, comm)); 4451e07b27eSBarry Smith 4469566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(ctx->Mp_re, &ctx->start_i_re, ctx->Np_re, &ctx->start_j_re, ctx->Pp_re, &ctx->start_k_re)); 4471e07b27eSBarry Smith 4481e07b27eSBarry Smith sum = 0; 4491e07b27eSBarry Smith for (k = 0; k < ctx->Mp_re; k++) { 4501e07b27eSBarry Smith ctx->start_i_re[k] = sum; 4511e07b27eSBarry Smith sum += ctx->range_i_re[k]; 4521e07b27eSBarry Smith } 4531e07b27eSBarry Smith 4541e07b27eSBarry Smith sum = 0; 4551e07b27eSBarry Smith for (k = 0; k < ctx->Np_re; k++) { 4561e07b27eSBarry Smith ctx->start_j_re[k] = sum; 4571e07b27eSBarry Smith sum += ctx->range_j_re[k]; 4581e07b27eSBarry Smith } 4591e07b27eSBarry Smith 4601e07b27eSBarry Smith sum = 0; 4611e07b27eSBarry Smith for (k = 0; k < ctx->Pp_re; k++) { 4621e07b27eSBarry Smith ctx->start_k_re[k] = sum; 4631e07b27eSBarry Smith sum += ctx->range_k_re[k]; 4641e07b27eSBarry Smith } 4651e07b27eSBarry Smith 466ba1c3560SDave May /* attach repartitioned dm to child ksp */ 467ba1c3560SDave May { 468ba1c3560SDave May PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *); 469ba1c3560SDave May void *dmksp_ctx; 470ba1c3560SDave May 4719566063dSJacob Faibussowitsch PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx)); 472ba1c3560SDave May 4731e07b27eSBarry Smith /* attach dm to ksp on sub communicator */ 47457f12427SDave May if (PCTelescope_isActiveRank(sred)) { 4759566063dSJacob Faibussowitsch PetscCall(KSPSetDM(sred->ksp, ctx->dmrepart)); 476ba1c3560SDave May 477c5db1f53SDave May if (!dmksp_func || sred->ignore_kspcomputeoperators) { 478*bf0c7fc2SBarry Smith PetscCall(KSPSetDMActive(sred->ksp, KSP_DMACTIVE_ALL, PETSC_FALSE)); 479ba1c3560SDave May } else { 480ba1c3560SDave May /* sub ksp inherits dmksp_func and context provided by user */ 4819566063dSJacob Faibussowitsch PetscCall(KSPSetComputeOperators(sred->ksp, dmksp_func, dmksp_ctx)); 482*bf0c7fc2SBarry Smith PetscCall(KSPSetDMActive(sred->ksp, KSP_DMACTIVE_ALL, PETSC_TRUE)); 483ba1c3560SDave May } 484ba1c3560SDave May } 4851e07b27eSBarry Smith } 4863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4871e07b27eSBarry Smith } 4881e07b27eSBarry Smith 48966976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_3d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx) 490d71ae5a4SJacob Faibussowitsch { 4911e07b27eSBarry Smith DM dm; 4921e07b27eSBarry Smith MPI_Comm comm; 4931e07b27eSBarry Smith Mat Pscalar, P; 4941e07b27eSBarry Smith PetscInt ndof; 4951e07b27eSBarry Smith PetscInt i, j, k, location, startI[3], endI[3], lenI[3], nx, ny, nz; 4961e07b27eSBarry Smith PetscInt sr, er, Mr; 4971e07b27eSBarry Smith Vec V; 4981e07b27eSBarry Smith 4991e07b27eSBarry Smith PetscFunctionBegin; 5009566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-3D)\n")); 5019566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 5021e07b27eSBarry Smith 5039566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 5049566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL)); 5051e07b27eSBarry Smith 5069566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(dm, &V)); 5079566063dSJacob Faibussowitsch PetscCall(VecGetSize(V, &Mr)); 5089566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(V, &sr, &er)); 5099566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(dm, &V)); 5101e07b27eSBarry Smith sr = sr / ndof; 5111e07b27eSBarry Smith er = er / ndof; 5121e07b27eSBarry Smith Mr = Mr / ndof; 5131e07b27eSBarry Smith 5149566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &Pscalar)); 51557508eceSPierre Jolivet PetscCall(MatSetSizes(Pscalar, er - sr, er - sr, Mr, Mr)); 5169566063dSJacob Faibussowitsch PetscCall(MatSetType(Pscalar, MATAIJ)); 5179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL)); 5189566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL)); 5191e07b27eSBarry Smith 5209566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], &lenI[2])); 5219566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], &startI[2], &endI[0], &endI[1], &endI[2])); 5221e07b27eSBarry Smith endI[0] += startI[0]; 5231e07b27eSBarry Smith endI[1] += startI[1]; 5241e07b27eSBarry Smith endI[2] += startI[2]; 5251e07b27eSBarry Smith 5261e07b27eSBarry Smith for (k = startI[2]; k < endI[2]; k++) { 5271e07b27eSBarry Smith for (j = startI[1]; j < endI[1]; j++) { 5281e07b27eSBarry Smith for (i = startI[0]; i < endI[0]; i++) { 5291e07b27eSBarry Smith PetscMPIInt rank_ijk_re, rank_reI[3]; 5301e07b27eSBarry Smith PetscInt s0_re; 531c6a0d831SBarry Smith PetscInt ii, jj, kk, local_ijk_re, mapped_ijk; 5321e07b27eSBarry Smith PetscInt lenI_re[3]; 5331e07b27eSBarry Smith 5341e07b27eSBarry Smith location = (i - startI[0]) + (j - startI[1]) * lenI[0] + (k - startI[2]) * lenI[0] * lenI[1]; 5359371c9d4SSatish Balay PetscCall(_DMDADetermineRankFromGlobalIJK(3, i, j, k, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], &rank_reI[2], &rank_ijk_re)); 5369566063dSJacob Faibussowitsch PetscCall(_DMDADetermineGlobalS0(3, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re)); 5371e07b27eSBarry Smith ii = i - ctx->start_i_re[rank_reI[0]]; 53808401ef6SPierre Jolivet PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error ii"); 5391e07b27eSBarry Smith jj = j - ctx->start_j_re[rank_reI[1]]; 54008401ef6SPierre Jolivet PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error jj"); 5411e07b27eSBarry Smith kk = k - ctx->start_k_re[rank_reI[2]]; 54208401ef6SPierre Jolivet PetscCheck(kk >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm3d] index error kk"); 5431e07b27eSBarry Smith lenI_re[0] = ctx->range_i_re[rank_reI[0]]; 5441e07b27eSBarry Smith lenI_re[1] = ctx->range_j_re[rank_reI[1]]; 5451e07b27eSBarry Smith lenI_re[2] = ctx->range_k_re[rank_reI[2]]; 5461e07b27eSBarry Smith local_ijk_re = ii + jj * lenI_re[0] + kk * lenI_re[0] * lenI_re[1]; 5471e07b27eSBarry Smith mapped_ijk = s0_re + local_ijk_re; 5489566063dSJacob Faibussowitsch PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES)); 5491e07b27eSBarry Smith } 5501e07b27eSBarry Smith } 5511e07b27eSBarry Smith } 5529566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY)); 5539566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY)); 5549566063dSJacob Faibussowitsch PetscCall(MatCreateMAIJ(Pscalar, ndof, &P)); 5559566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Pscalar)); 5561e07b27eSBarry Smith ctx->permutation = P; 5573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5581e07b27eSBarry Smith } 5591e07b27eSBarry Smith 56066976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_permutation_2d(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx) 561d71ae5a4SJacob Faibussowitsch { 5621e07b27eSBarry Smith DM dm; 5631e07b27eSBarry Smith MPI_Comm comm; 5641e07b27eSBarry Smith Mat Pscalar, P; 5651e07b27eSBarry Smith PetscInt ndof; 5661e07b27eSBarry Smith PetscInt i, j, location, startI[2], endI[2], lenI[2], nx, ny, nz; 5671e07b27eSBarry Smith PetscInt sr, er, Mr; 5681e07b27eSBarry Smith Vec V; 5691e07b27eSBarry Smith 5701e07b27eSBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setting up the permutation matrix (DMDA-2D)\n")); 5729566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 5739566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 5749566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &nx, &ny, &nz, NULL, NULL, NULL, &ndof, NULL, NULL, NULL, NULL, NULL)); 5759566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(dm, &V)); 5769566063dSJacob Faibussowitsch PetscCall(VecGetSize(V, &Mr)); 5779566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(V, &sr, &er)); 5789566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(dm, &V)); 5791e07b27eSBarry Smith sr = sr / ndof; 5801e07b27eSBarry Smith er = er / ndof; 5811e07b27eSBarry Smith Mr = Mr / ndof; 5821e07b27eSBarry Smith 5839566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &Pscalar)); 58457508eceSPierre Jolivet PetscCall(MatSetSizes(Pscalar, er - sr, er - sr, Mr, Mr)); 5859566063dSJacob Faibussowitsch PetscCall(MatSetType(Pscalar, MATAIJ)); 5869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(Pscalar, 1, NULL)); 5879566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(Pscalar, 1, NULL, 1, NULL)); 5881e07b27eSBarry Smith 5899566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, NULL, NULL, NULL, &lenI[0], &lenI[1], NULL)); 5909566063dSJacob Faibussowitsch PetscCall(DMDAGetCorners(dm, &startI[0], &startI[1], NULL, &endI[0], &endI[1], NULL)); 5911e07b27eSBarry Smith endI[0] += startI[0]; 5921e07b27eSBarry Smith endI[1] += startI[1]; 5931e07b27eSBarry Smith 5941e07b27eSBarry Smith for (j = startI[1]; j < endI[1]; j++) { 5951e07b27eSBarry Smith for (i = startI[0]; i < endI[0]; i++) { 5961e07b27eSBarry Smith PetscMPIInt rank_ijk_re, rank_reI[3]; 5971e07b27eSBarry Smith PetscInt s0_re; 598c6a0d831SBarry Smith PetscInt ii, jj, local_ijk_re, mapped_ijk; 5991e07b27eSBarry Smith PetscInt lenI_re[3]; 6001e07b27eSBarry Smith 6011e07b27eSBarry Smith location = (i - startI[0]) + (j - startI[1]) * lenI[0]; 6029371c9d4SSatish Balay PetscCall(_DMDADetermineRankFromGlobalIJK(2, i, j, 0, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->start_i_re, ctx->start_j_re, ctx->start_k_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &rank_reI[0], &rank_reI[1], NULL, &rank_ijk_re)); 6031e07b27eSBarry Smith 6049566063dSJacob Faibussowitsch PetscCall(_DMDADetermineGlobalS0(2, rank_ijk_re, ctx->Mp_re, ctx->Np_re, ctx->Pp_re, ctx->range_i_re, ctx->range_j_re, ctx->range_k_re, &s0_re)); 6051e07b27eSBarry Smith 6061e07b27eSBarry Smith ii = i - ctx->start_i_re[rank_reI[0]]; 60708401ef6SPierre Jolivet PetscCheck(ii >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error ii"); 6081e07b27eSBarry Smith jj = j - ctx->start_j_re[rank_reI[1]]; 60908401ef6SPierre Jolivet PetscCheck(jj >= 0, PETSC_COMM_SELF, PETSC_ERR_USER, "[dmdarepart-perm2d] index error jj"); 6101e07b27eSBarry Smith 6111e07b27eSBarry Smith lenI_re[0] = ctx->range_i_re[rank_reI[0]]; 6121e07b27eSBarry Smith lenI_re[1] = ctx->range_j_re[rank_reI[1]]; 6131e07b27eSBarry Smith local_ijk_re = ii + jj * lenI_re[0]; 6141e07b27eSBarry Smith mapped_ijk = s0_re + local_ijk_re; 6159566063dSJacob Faibussowitsch PetscCall(MatSetValue(Pscalar, sr + location, mapped_ijk, 1.0, INSERT_VALUES)); 6161e07b27eSBarry Smith } 6171e07b27eSBarry Smith } 6189566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Pscalar, MAT_FINAL_ASSEMBLY)); 6199566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Pscalar, MAT_FINAL_ASSEMBLY)); 6209566063dSJacob Faibussowitsch PetscCall(MatCreateMAIJ(Pscalar, ndof, &P)); 6219566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Pscalar)); 6221e07b27eSBarry Smith ctx->permutation = P; 6233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6241e07b27eSBarry Smith } 6251e07b27eSBarry Smith 62666976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSetUp_dmda_scatters(PC pc, PC_Telescope sred, PC_Telescope_DMDACtx *ctx) 627d71ae5a4SJacob Faibussowitsch { 6281e07b27eSBarry Smith Vec xred, yred, xtmp, x, xp; 6291e07b27eSBarry Smith VecScatter scatter; 6301e07b27eSBarry Smith IS isin; 6311e07b27eSBarry Smith Mat B; 6321e07b27eSBarry Smith PetscInt m, bs, st, ed; 6331e07b27eSBarry Smith MPI_Comm comm; 6341e07b27eSBarry Smith 6351e07b27eSBarry Smith PetscFunctionBegin; 6369566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 6379566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B)); 6389566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(B, &x, NULL)); 6399566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(B, &bs)); 6409566063dSJacob Faibussowitsch PetscCall(VecDuplicate(x, &xp)); 6413ac26c5eSBarry Smith m = 0; 6421e07b27eSBarry Smith xred = NULL; 6431e07b27eSBarry Smith yred = NULL; 64457f12427SDave May if (PCTelescope_isActiveRank(sred)) { 6459566063dSJacob Faibussowitsch PetscCall(DMCreateGlobalVector(ctx->dmrepart, &xred)); 6469566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xred, &yred)); 6479566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(xred, &st, &ed)); 6489566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, ed - st, st, 1, &isin)); 6499566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(xred, &m)); 6501e07b27eSBarry Smith } else { 6519566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(x, &st, &ed)); 6529566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, 0, st, 1, &isin)); 6531e07b27eSBarry Smith } 6549566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isin, bs)); 6559566063dSJacob Faibussowitsch PetscCall(VecCreate(comm, &xtmp)); 6569566063dSJacob Faibussowitsch PetscCall(VecSetSizes(xtmp, m, PETSC_DECIDE)); 6579566063dSJacob Faibussowitsch PetscCall(VecSetBlockSize(xtmp, bs)); 6589566063dSJacob Faibussowitsch PetscCall(VecSetType(xtmp, ((PetscObject)x)->type_name)); 6599566063dSJacob Faibussowitsch PetscCall(VecScatterCreate(x, isin, xtmp, NULL, &scatter)); 6601e07b27eSBarry Smith sred->xred = xred; 6611e07b27eSBarry Smith sred->yred = yred; 6621e07b27eSBarry Smith sred->isin = isin; 6631e07b27eSBarry Smith sred->scatter = scatter; 6641e07b27eSBarry Smith sred->xtmp = xtmp; 6651e07b27eSBarry Smith 6661e07b27eSBarry Smith ctx->xp = xp; 6679566063dSJacob Faibussowitsch PetscCall(VecDestroy(&x)); 6683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6691e07b27eSBarry Smith } 6701e07b27eSBarry Smith 671d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeSetUp_dmda(PC pc, PC_Telescope sred) 672d71ae5a4SJacob Faibussowitsch { 6731e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx; 6741e07b27eSBarry Smith PetscInt dim; 6751e07b27eSBarry Smith DM dm; 6761e07b27eSBarry Smith MPI_Comm comm; 6771e07b27eSBarry Smith 6781e07b27eSBarry Smith PetscFunctionBegin; 6799566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: setup (DMDA)\n")); 6809566063dSJacob Faibussowitsch PetscCall(PetscNew(&ctx)); 6811e07b27eSBarry Smith sred->dm_ctx = (void *)ctx; 6821e07b27eSBarry Smith 6839566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 6849566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 6859566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL)); 6861e07b27eSBarry Smith 6873ba16761SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart(pc, sred, ctx)); 6883ba16761SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_repart_coors(pc, sred, ctx)); 6891e07b27eSBarry Smith switch (dim) { 690d71ae5a4SJacob Faibussowitsch case 1: 691d71ae5a4SJacob Faibussowitsch SETERRQ(comm, PETSC_ERR_SUP, "Telescope: DMDA (1D) repartitioning not provided"); 692d71ae5a4SJacob Faibussowitsch case 2: 693d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_permutation_2d(pc, sred, ctx)); 694d71ae5a4SJacob Faibussowitsch break; 695d71ae5a4SJacob Faibussowitsch case 3: 696d71ae5a4SJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_permutation_3d(pc, sred, ctx)); 697d71ae5a4SJacob Faibussowitsch break; 6981e07b27eSBarry Smith } 6999566063dSJacob Faibussowitsch PetscCall(PCTelescopeSetUp_dmda_scatters(pc, sred, ctx)); 7003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7011e07b27eSBarry Smith } 7021e07b27eSBarry Smith 70366976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeMatCreate_dmda_dmactivefalse(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A) 704d71ae5a4SJacob Faibussowitsch { 7051e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx; 7061e07b27eSBarry Smith MPI_Comm comm, subcomm; 7071e07b27eSBarry Smith Mat Bperm, Bred, B, P; 7081e07b27eSBarry Smith PetscInt nr, nc; 7091e07b27eSBarry Smith IS isrow, iscol; 7101e07b27eSBarry Smith Mat Blocal, *_Blocal; 7111e07b27eSBarry Smith 7121e07b27eSBarry Smith PetscFunctionBegin; 7139566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: updating the redundant preconditioned operator (DMDA)\n")); 7149566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)pc, &comm)); 7151e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm); 7161e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx; 7171e07b27eSBarry Smith 7189566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B)); 7199566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &nr, &nc)); 7201e07b27eSBarry Smith 7211e07b27eSBarry Smith P = ctx->permutation; 7229566063dSJacob Faibussowitsch PetscCall(MatPtAP(B, P, MAT_INITIAL_MATRIX, 1.1, &Bperm)); 7231e07b27eSBarry Smith 7241e07b27eSBarry Smith /* Get submatrices */ 7251e07b27eSBarry Smith isrow = sred->isin; 7269566063dSJacob Faibussowitsch PetscCall(ISCreateStride(comm, nc, 0, 1, &iscol)); 7271e07b27eSBarry Smith 7289566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(Bperm, 1, &isrow, &iscol, MAT_INITIAL_MATRIX, &_Blocal)); 7291e07b27eSBarry Smith Blocal = *_Blocal; 7301e07b27eSBarry Smith Bred = NULL; 73157f12427SDave May if (PCTelescope_isActiveRank(sred)) { 7321e07b27eSBarry Smith PetscInt mm; 7331e07b27eSBarry Smith 734ad540459SPierre Jolivet if (reuse != MAT_INITIAL_MATRIX) Bred = *A; 7359566063dSJacob Faibussowitsch PetscCall(MatGetSize(Blocal, &mm, NULL)); 7369566063dSJacob Faibussowitsch /* PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,PETSC_DECIDE,reuse,&Bred)); */ 7379566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat(subcomm, Blocal, mm, reuse, &Bred)); 7381e07b27eSBarry Smith } 7391e07b27eSBarry Smith *A = Bred; 7401e07b27eSBarry Smith 7419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&iscol)); 7429566063dSJacob Faibussowitsch PetscCall(MatDestroy(&Bperm)); 7439566063dSJacob Faibussowitsch PetscCall(MatDestroyMatrices(1, &_Blocal)); 7443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7451e07b27eSBarry Smith } 7461e07b27eSBarry Smith 747d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatCreate_dmda(PC pc, PC_Telescope sred, MatReuse reuse, Mat *A) 748d71ae5a4SJacob Faibussowitsch { 749ba1c3560SDave May DM dm; 750ba1c3560SDave May PetscErrorCode (*dmksp_func)(KSP, Mat, Mat, void *); 751ba1c3560SDave May void *dmksp_ctx; 752ba1c3560SDave May 753ba1c3560SDave May PetscFunctionBegin; 7549566063dSJacob Faibussowitsch PetscCall(PCGetDM(pc, &dm)); 7559566063dSJacob Faibussowitsch PetscCall(DMKSPGetComputeOperators(dm, &dmksp_func, &dmksp_ctx)); 756dc9ee9fdSDave May /* We assume that dmksp_func = NULL, is equivalent to dmActive = PETSC_FALSE */ 7577c5279cbSDave May if (dmksp_func && !sred->ignore_kspcomputeoperators) { 758ba1c3560SDave May DM dmrepart; 75928323a89SDave May Mat Ak; 760ba1c3560SDave May 761ba1c3560SDave May *A = NULL; 76257f12427SDave May if (PCTelescope_isActiveRank(sred)) { 7639566063dSJacob Faibussowitsch PetscCall(KSPGetDM(sred->ksp, &dmrepart)); 764ba1c3560SDave May if (reuse == MAT_INITIAL_MATRIX) { 7659566063dSJacob Faibussowitsch PetscCall(DMCreateMatrix(dmrepart, &Ak)); 766ba1c3560SDave May *A = Ak; 767ba1c3560SDave May } else if (reuse == MAT_REUSE_MATRIX) { 768ba1c3560SDave May Ak = *A; 769ba1c3560SDave May } 7705c5dbb1cSDave May /* 7715c5dbb1cSDave May There is no need to explicitly assemble the operator now, 7725c5dbb1cSDave May the sub-KSP will call the method provided to KSPSetComputeOperators() during KSPSetUp() 7735c5dbb1cSDave May */ 774ba1c3560SDave May } 775ba1c3560SDave May } else { 7769566063dSJacob Faibussowitsch PetscCall(PCTelescopeMatCreate_dmda_dmactivefalse(pc, sred, reuse, A)); 777ba1c3560SDave May } 7783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 779ba1c3560SDave May } 780ba1c3560SDave May 78166976f2fSJacob Faibussowitsch static PetscErrorCode PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc, PC_Telescope sred, MatNullSpace nullspace, MatNullSpace *sub_nullspace) 782d71ae5a4SJacob Faibussowitsch { 7831e07b27eSBarry Smith PetscBool has_const; 784a947c41eSDave May PetscInt i, k, n = 0; 7851e07b27eSBarry Smith const Vec *vecs; 786c41e779fSDave May Vec *sub_vecs = NULL; 7871e07b27eSBarry Smith MPI_Comm subcomm; 7881e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx; 7891e07b27eSBarry Smith 7901e07b27eSBarry Smith PetscFunctionBegin; 7911e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx; 7921e07b27eSBarry Smith subcomm = PetscSubcommChild(sred->psubcomm); 7939566063dSJacob Faibussowitsch PetscCall(MatNullSpaceGetVecs(nullspace, &has_const, &n, &vecs)); 7941e07b27eSBarry Smith 79557f12427SDave May if (PCTelescope_isActiveRank(sred)) { 7961e07b27eSBarry Smith /* create new vectors */ 79748a46eb9SPierre Jolivet if (n) PetscCall(VecDuplicateVecs(sred->xred, n, &sub_vecs)); 7981e07b27eSBarry Smith } 7991e07b27eSBarry Smith 8001e07b27eSBarry Smith /* copy entries */ 8011e07b27eSBarry Smith for (k = 0; k < n; k++) { 8021e07b27eSBarry Smith const PetscScalar *x_array; 8031e07b27eSBarry Smith PetscScalar *LA_sub_vec; 80413c30530SDave May PetscInt st, ed; 8051e07b27eSBarry Smith 8061e07b27eSBarry Smith /* permute vector into ordering associated with re-partitioned dmda */ 8079566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(ctx->permutation, vecs[k], ctx->xp)); 8081e07b27eSBarry Smith 8091e07b27eSBarry Smith /* pull in vector x->xtmp */ 8109566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD)); 8119566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(sred->scatter, ctx->xp, sred->xtmp, INSERT_VALUES, SCATTER_FORWARD)); 8121e07b27eSBarry Smith 813392968a1SPatrick Sanan /* copy vector entries into xred */ 8149566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(sred->xtmp, &x_array)); 815ea2b237eSDave May if (sub_vecs) { 816ea2b237eSDave May if (sub_vecs[k]) { 8179566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(sub_vecs[k], &st, &ed)); 8189566063dSJacob Faibussowitsch PetscCall(VecGetArray(sub_vecs[k], &LA_sub_vec)); 819ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_sub_vec[i] = x_array[i]; 8209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(sub_vecs[k], &LA_sub_vec)); 8211e07b27eSBarry Smith } 822ea2b237eSDave May } 8239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(sred->xtmp, &x_array)); 8241e07b27eSBarry Smith } 8251e07b27eSBarry Smith 82657f12427SDave May if (PCTelescope_isActiveRank(sred)) { 827d8b9d5b7SPatrick Sanan /* create new (near) nullspace for redundant object */ 8289566063dSJacob Faibussowitsch PetscCall(MatNullSpaceCreate(subcomm, has_const, n, sub_vecs, sub_nullspace)); 8299566063dSJacob Faibussowitsch PetscCall(VecDestroyVecs(n, &sub_vecs)); 83028b400f6SJacob Faibussowitsch PetscCheck(!nullspace->remove, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope"); 83128b400f6SJacob Faibussowitsch PetscCheck(!nullspace->rmctx, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope"); 832d8b9d5b7SPatrick Sanan } 8333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 834392968a1SPatrick Sanan } 835392968a1SPatrick Sanan 836d71ae5a4SJacob Faibussowitsch PetscErrorCode PCTelescopeMatNullSpaceCreate_dmda(PC pc, PC_Telescope sred, Mat sub_mat) 837d71ae5a4SJacob Faibussowitsch { 838392968a1SPatrick Sanan Mat B; 839392968a1SPatrick Sanan 840392968a1SPatrick Sanan PetscFunctionBegin; 8419566063dSJacob Faibussowitsch PetscCall(PCGetOperators(pc, NULL, &B)); 842392968a1SPatrick Sanan { 843392968a1SPatrick Sanan MatNullSpace nullspace, sub_nullspace; 8449566063dSJacob Faibussowitsch PetscCall(MatGetNullSpace(B, &nullspace)); 845392968a1SPatrick Sanan if (nullspace) { 8469566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: generating nullspace (DMDA)\n")); 8479566063dSJacob Faibussowitsch PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nullspace, &sub_nullspace)); 84857f12427SDave May if (PCTelescope_isActiveRank(sred)) { 8499566063dSJacob Faibussowitsch PetscCall(MatSetNullSpace(sub_mat, sub_nullspace)); 8509566063dSJacob Faibussowitsch PetscCall(MatNullSpaceDestroy(&sub_nullspace)); 8511e07b27eSBarry Smith } 852392968a1SPatrick Sanan } 853392968a1SPatrick Sanan } 854392968a1SPatrick Sanan { 855392968a1SPatrick Sanan MatNullSpace nearnullspace, sub_nearnullspace; 8569566063dSJacob Faibussowitsch PetscCall(MatGetNearNullSpace(B, &nearnullspace)); 857392968a1SPatrick Sanan if (nearnullspace) { 8589566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescope: generating near nullspace (DMDA)\n")); 8599566063dSJacob Faibussowitsch PetscCall(PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc, sred, nearnullspace, &sub_nearnullspace)); 86057f12427SDave May if (PCTelescope_isActiveRank(sred)) { 8619566063dSJacob Faibussowitsch PetscCall(MatSetNearNullSpace(sub_mat, sub_nearnullspace)); 8629566063dSJacob Faibussowitsch PetscCall(MatNullSpaceDestroy(&sub_nearnullspace)); 863392968a1SPatrick Sanan } 864392968a1SPatrick Sanan } 865392968a1SPatrick Sanan } 8663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8671e07b27eSBarry Smith } 8681e07b27eSBarry Smith 869d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApply_Telescope_dmda(PC pc, Vec x, Vec y) 870d71ae5a4SJacob Faibussowitsch { 8711e07b27eSBarry Smith PC_Telescope sred = (PC_Telescope)pc->data; 8721e07b27eSBarry Smith Mat perm; 8731e07b27eSBarry Smith Vec xtmp, xp, xred, yred; 87413c30530SDave May PetscInt i, st, ed; 8751e07b27eSBarry Smith VecScatter scatter; 8761e07b27eSBarry Smith PetscScalar *array; 8771e07b27eSBarry Smith const PetscScalar *x_array; 8781e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx; 8791e07b27eSBarry Smith 8801e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx; 8811e07b27eSBarry Smith xtmp = sred->xtmp; 8821e07b27eSBarry Smith scatter = sred->scatter; 8831e07b27eSBarry Smith xred = sred->xred; 8841e07b27eSBarry Smith yred = sred->yred; 8851e07b27eSBarry Smith perm = ctx->permutation; 8861e07b27eSBarry Smith xp = ctx->xp; 8871e07b27eSBarry Smith 8881e07b27eSBarry Smith PetscFunctionBegin; 8899566063dSJacob Faibussowitsch PetscCall(PetscCitationsRegister(citation, &cited)); 89014c9fce5SDave May 8911e07b27eSBarry Smith /* permute vector into ordering associated with re-partitioned dmda */ 8929566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(perm, x, xp)); 8931e07b27eSBarry Smith 8941e07b27eSBarry Smith /* pull in vector x->xtmp */ 8959566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD)); 8969566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD)); 8971e07b27eSBarry Smith 898a5b23f4aSJose E. Roman /* copy vector entries into xred */ 8999566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xtmp, &x_array)); 9001e07b27eSBarry Smith if (xred) { 9011e07b27eSBarry Smith PetscScalar *LA_xred; 9029566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(xred, &st, &ed)); 9031e07b27eSBarry Smith 9049566063dSJacob Faibussowitsch PetscCall(VecGetArray(xred, &LA_xred)); 905ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_xred[i] = x_array[i]; 9069566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xred, &LA_xred)); 9071e07b27eSBarry Smith } 9089566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xtmp, &x_array)); 9091e07b27eSBarry Smith 9101e07b27eSBarry Smith /* solve */ 91157f12427SDave May if (PCTelescope_isActiveRank(sred)) { 9129566063dSJacob Faibussowitsch PetscCall(KSPSolve(sred->ksp, xred, yred)); 9139566063dSJacob Faibussowitsch PetscCall(KSPCheckSolve(sred->ksp, pc, yred)); 9141e07b27eSBarry Smith } 9151e07b27eSBarry Smith 9161e07b27eSBarry Smith /* return vector */ 9179566063dSJacob Faibussowitsch PetscCall(VecGetArray(xtmp, &array)); 9181e07b27eSBarry Smith if (yred) { 9191e07b27eSBarry Smith const PetscScalar *LA_yred; 9209566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(yred, &st, &ed)); 9219566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(yred, &LA_yred)); 922ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) array[i] = LA_yred[i]; 9239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(yred, &LA_yred)); 9241e07b27eSBarry Smith } 9259566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xtmp, &array)); 9269566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE)); 9279566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xtmp, xp, INSERT_VALUES, SCATTER_REVERSE)); 9289566063dSJacob Faibussowitsch PetscCall(MatMult(perm, xp, y)); 9293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 9301e07b27eSBarry Smith } 9311e07b27eSBarry Smith 932d71ae5a4SJacob Faibussowitsch PetscErrorCode PCApplyRichardson_Telescope_dmda(PC pc, Vec x, Vec y, Vec w, PetscReal rtol, PetscReal abstol, PetscReal dtol, PetscInt its, PetscBool zeroguess, PetscInt *outits, PCRichardsonConvergedReason *reason) 933d71ae5a4SJacob Faibussowitsch { 934f650675bSDave May PC_Telescope sred = (PC_Telescope)pc->data; 935f650675bSDave May Mat perm; 936a1d91a28SDave May Vec xtmp, xp, yred; 937f650675bSDave May PetscInt i, st, ed; 938f650675bSDave May VecScatter scatter; 939f650675bSDave May const PetscScalar *x_array; 940c41e779fSDave May PetscBool default_init_guess_value = PETSC_FALSE; 941f650675bSDave May PC_Telescope_DMDACtx *ctx; 942f650675bSDave May 94357f12427SDave May PetscFunctionBegin; 944f650675bSDave May ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx; 945f650675bSDave May xtmp = sred->xtmp; 946f650675bSDave May scatter = sred->scatter; 947f650675bSDave May yred = sred->yred; 948f650675bSDave May perm = ctx->permutation; 949f650675bSDave May xp = ctx->xp; 950f650675bSDave May 95108401ef6SPierre Jolivet PetscCheck(its <= 1, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "PCApplyRichardson_Telescope_dmda only supports max_it = 1"); 952f650675bSDave May *reason = (PCRichardsonConvergedReason)0; 953f650675bSDave May 954f650675bSDave May if (!zeroguess) { 9559566063dSJacob Faibussowitsch PetscCall(PetscInfo(pc, "PCTelescopeDMDA: Scattering y for non-zero-initial guess\n")); 956f650675bSDave May /* permute vector into ordering associated with re-partitioned dmda */ 9579566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(perm, y, xp)); 958f650675bSDave May 959f650675bSDave May /* pull in vector x->xtmp */ 9609566063dSJacob Faibussowitsch PetscCall(VecScatterBegin(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD)); 9619566063dSJacob Faibussowitsch PetscCall(VecScatterEnd(scatter, xp, xtmp, INSERT_VALUES, SCATTER_FORWARD)); 962f650675bSDave May 963a5b23f4aSJose E. Roman /* copy vector entries into xred */ 9649566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xtmp, &x_array)); 965f650675bSDave May if (yred) { 966f650675bSDave May PetscScalar *LA_yred; 9679566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(yred, &st, &ed)); 9689566063dSJacob Faibussowitsch PetscCall(VecGetArray(yred, &LA_yred)); 969ad540459SPierre Jolivet for (i = 0; i < ed - st; i++) LA_yred[i] = x_array[i]; 9709566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yred, &LA_yred)); 971f650675bSDave May } 9729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xtmp, &x_array)); 973f650675bSDave May } 974f650675bSDave May 97557f12427SDave May if (PCTelescope_isActiveRank(sred)) { 9769566063dSJacob Faibussowitsch PetscCall(KSPGetInitialGuessNonzero(sred->ksp, &default_init_guess_value)); 9779566063dSJacob Faibussowitsch if (!zeroguess) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, PETSC_TRUE)); 978f650675bSDave May } 979f650675bSDave May 9809566063dSJacob Faibussowitsch PetscCall(PCApply_Telescope_dmda(pc, x, y)); 981f650675bSDave May 98248a46eb9SPierre Jolivet if (PCTelescope_isActiveRank(sred)) PetscCall(KSPSetInitialGuessNonzero(sred->ksp, default_init_guess_value)); 983f650675bSDave May 984f650675bSDave May if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS; 985f650675bSDave May *outits = 1; 9863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 987f650675bSDave May } 988f650675bSDave May 989d71ae5a4SJacob Faibussowitsch PetscErrorCode PCReset_Telescope_dmda(PC pc) 990d71ae5a4SJacob Faibussowitsch { 9911e07b27eSBarry Smith PC_Telescope sred = (PC_Telescope)pc->data; 9921e07b27eSBarry Smith PC_Telescope_DMDACtx *ctx; 9931e07b27eSBarry Smith 9941e07b27eSBarry Smith PetscFunctionBegin; 9951e07b27eSBarry Smith ctx = (PC_Telescope_DMDACtx *)sred->dm_ctx; 9969566063dSJacob Faibussowitsch PetscCall(VecDestroy(&ctx->xp)); 9979566063dSJacob Faibussowitsch PetscCall(MatDestroy(&ctx->permutation)); 9989566063dSJacob Faibussowitsch PetscCall(DMDestroy(&ctx->dmrepart)); 9999566063dSJacob Faibussowitsch PetscCall(PetscFree3(ctx->range_i_re, ctx->range_j_re, ctx->range_k_re)); 10009566063dSJacob Faibussowitsch PetscCall(PetscFree3(ctx->start_i_re, ctx->start_j_re, ctx->start_k_re)); 10013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10021e07b27eSBarry Smith } 10031e07b27eSBarry Smith 100466976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_3d(DM dm, PetscViewer v) 1005d71ae5a4SJacob Faibussowitsch { 10061e07b27eSBarry Smith PetscInt M, N, P, m, n, p, ndof, nsw; 10071e07b27eSBarry Smith MPI_Comm comm; 10081e07b27eSBarry Smith PetscMPIInt size; 10091e07b27eSBarry Smith const char *prefix; 10101e07b27eSBarry Smith 10111e07b27eSBarry Smith PetscFunctionBegin; 10129566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)dm, &comm)); 10139566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 10149566063dSJacob Faibussowitsch PetscCall(DMGetOptionsPrefix(dm, &prefix)); 10159566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, &P, &m, &n, &p, &ndof, &nsw, NULL, NULL, NULL, NULL)); 10169566063dSJacob Faibussowitsch if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: (%s) %d MPI processes\n", prefix, size)); 10179566063dSJacob Faibussowitsch else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: %d MPI processes\n", size)); 101863a3b9bcSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(v, " M %" PetscInt_FMT " N %" PetscInt_FMT " P %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " p %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, P, m, n, p, ndof, nsw)); 10193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10201e07b27eSBarry Smith } 10211e07b27eSBarry Smith 102266976f2fSJacob Faibussowitsch static PetscErrorCode DMView_DA_Short_2d(DM dm, PetscViewer v) 1023d71ae5a4SJacob Faibussowitsch { 10241e07b27eSBarry Smith PetscInt M, N, m, n, ndof, nsw; 10251e07b27eSBarry Smith MPI_Comm comm; 10261e07b27eSBarry Smith PetscMPIInt size; 10271e07b27eSBarry Smith const char *prefix; 10281e07b27eSBarry Smith 10291e07b27eSBarry Smith PetscFunctionBegin; 10309566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)dm, &comm)); 10319566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 10329566063dSJacob Faibussowitsch PetscCall(DMGetOptionsPrefix(dm, &prefix)); 10339566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, NULL, &M, &N, NULL, &m, &n, NULL, &ndof, &nsw, NULL, NULL, NULL, NULL)); 10349566063dSJacob Faibussowitsch if (prefix) PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: (%s) %d MPI processes\n", prefix, size)); 10359566063dSJacob Faibussowitsch else PetscCall(PetscViewerASCIIPrintf(v, "DMDA Object: %d MPI processes\n", size)); 103663a3b9bcSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(v, " M %" PetscInt_FMT " N %" PetscInt_FMT " m %" PetscInt_FMT " n %" PetscInt_FMT " dof %" PetscInt_FMT " overlap %" PetscInt_FMT "\n", M, N, m, n, ndof, nsw)); 10373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10381e07b27eSBarry Smith } 10391e07b27eSBarry Smith 1040d71ae5a4SJacob Faibussowitsch PetscErrorCode DMView_DA_Short(DM dm, PetscViewer v) 1041d71ae5a4SJacob Faibussowitsch { 10421e07b27eSBarry Smith PetscInt dim; 10431e07b27eSBarry Smith 10441e07b27eSBarry Smith PetscFunctionBegin; 10459566063dSJacob Faibussowitsch PetscCall(DMDAGetInfo(dm, &dim, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL)); 10461e07b27eSBarry Smith switch (dim) { 1047d71ae5a4SJacob Faibussowitsch case 2: 1048d71ae5a4SJacob Faibussowitsch PetscCall(DMView_DA_Short_2d(dm, v)); 1049d71ae5a4SJacob Faibussowitsch break; 1050d71ae5a4SJacob Faibussowitsch case 3: 1051d71ae5a4SJacob Faibussowitsch PetscCall(DMView_DA_Short_3d(dm, v)); 1052d71ae5a4SJacob Faibussowitsch break; 10531e07b27eSBarry Smith } 10543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10551e07b27eSBarry Smith } 1056