1 2 3 #include <petsc/private/matimpl.h> 4 #include <petsc/private/pcimpl.h> 5 #include <petsc/private/dmimpl.h> 6 #include <petscksp.h> /*I "petscksp.h" I*/ 7 #include <petscdm.h> 8 #include <petscdmda.h> 9 10 #include "../src/ksp/pc/impls/telescope/telescope.h" 11 12 static PetscBool cited = PETSC_FALSE; 13 static const char citation[] = 14 "@inproceedings{MaySananRuppKnepleySmith2016,\n" 15 " title = {Extreme-Scale Multigrid Components within PETSc},\n" 16 " author = {Dave A. May and Patrick Sanan and Karl Rupp and Matthew G. Knepley and Barry F. Smith},\n" 17 " booktitle = {Proceedings of the Platform for Advanced Scientific Computing Conference},\n" 18 " series = {PASC '16},\n" 19 " isbn = {978-1-4503-4126-4},\n" 20 " location = {Lausanne, Switzerland},\n" 21 " pages = {5:1--5:12},\n" 22 " articleno = {5},\n" 23 " numpages = {12},\n" 24 " url = {http://doi.acm.org/10.1145/2929908.2929913},\n" 25 " doi = {10.1145/2929908.2929913},\n" 26 " acmid = {2929913},\n" 27 " publisher = {ACM},\n" 28 " address = {New York, NY, USA},\n" 29 " keywords = {GPU, HPC, agglomeration, coarse-level solver, multigrid, parallel computing, preconditioning},\n" 30 " year = {2016}\n" 31 "}\n"; 32 33 static PetscErrorCode _DMDADetermineRankFromGlobalIJK(PetscInt dim,PetscInt i,PetscInt j,PetscInt k, 34 PetscInt Mp,PetscInt Np,PetscInt Pp, 35 PetscInt start_i[],PetscInt start_j[],PetscInt start_k[], 36 PetscInt span_i[],PetscInt span_j[],PetscInt span_k[], 37 PetscMPIInt *_pi,PetscMPIInt *_pj,PetscMPIInt *_pk,PetscMPIInt *rank_re) 38 { 39 PetscInt pi,pj,pk,n; 40 41 PetscFunctionBegin; 42 *rank_re = -1; 43 if (_pi) *_pi = -1; 44 if (_pj) *_pj = -1; 45 if (_pk) *_pk = -1; 46 pi = pj = pk = -1; 47 if (_pi) { 48 for (n=0; n<Mp; n++) { 49 if ( (i >= start_i[n]) && (i < start_i[n]+span_i[n]) ) { 50 pi = n; 51 break; 52 } 53 } 54 if (pi == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pi cannot be determined : range %D, val %D",Mp,i); 55 *_pi = pi; 56 } 57 58 if (_pj) { 59 for (n=0; n<Np; n++) { 60 if ( (j >= start_j[n]) && (j < start_j[n]+span_j[n]) ) { 61 pj = n; 62 break; 63 } 64 } 65 if (pj == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pj cannot be determined : range %D, val %D",Np,j); 66 *_pj = pj; 67 } 68 69 if (_pk) { 70 for (n=0; n<Pp; n++) { 71 if ( (k >= start_k[n]) && (k < start_k[n]+span_k[n]) ) { 72 pk = n; 73 break; 74 } 75 } 76 if (pk == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmda-ijk] pk cannot be determined : range %D, val %D",Pp,k); 77 *_pk = pk; 78 } 79 80 switch (dim) { 81 case 1: 82 *rank_re = pi; 83 break; 84 case 2: 85 *rank_re = pi + pj * Mp; 86 break; 87 case 3: 88 *rank_re = pi + pj * Mp + pk * (Mp*Np); 89 break; 90 } 91 PetscFunctionReturn(0); 92 } 93 94 static PetscErrorCode _DMDADetermineGlobalS0(PetscInt dim,PetscMPIInt rank_re,PetscInt Mp_re,PetscInt Np_re,PetscInt Pp_re, 95 PetscInt range_i_re[],PetscInt range_j_re[],PetscInt range_k_re[],PetscInt *s0) 96 { 97 PetscInt i,j,k,start_IJK = 0; 98 PetscInt rank_ijk; 99 100 PetscFunctionBegin; 101 switch (dim) { 102 case 1: 103 for (i=0; i<Mp_re; i++) { 104 rank_ijk = i; 105 if (rank_ijk < rank_re) { 106 start_IJK += range_i_re[i]; 107 } 108 } 109 break; 110 case 2: 111 for (j=0; j<Np_re; j++) { 112 for (i=0; i<Mp_re; i++) { 113 rank_ijk = i + j*Mp_re; 114 if (rank_ijk < rank_re) { 115 start_IJK += range_i_re[i]*range_j_re[j]; 116 } 117 } 118 } 119 break; 120 case 3: 121 for (k=0; k<Pp_re; k++) { 122 for (j=0; j<Np_re; j++) { 123 for (i=0; i<Mp_re; i++) { 124 rank_ijk = i + j*Mp_re + k*Mp_re*Np_re; 125 if (rank_ijk < rank_re) { 126 start_IJK += range_i_re[i]*range_j_re[j]*range_k_re[k]; 127 } 128 } 129 } 130 } 131 break; 132 } 133 *s0 = start_IJK; 134 PetscFunctionReturn(0); 135 } 136 137 static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors2d(PC_Telescope sred,DM dm,DM subdm) 138 { 139 PetscErrorCode ierr; 140 DM cdm; 141 Vec coor,coor_natural,perm_coors; 142 PetscInt i,j,si,sj,ni,nj,M,N,Ml,Nl,c,nidx; 143 PetscInt *fine_indices; 144 IS is_fine,is_local; 145 VecScatter sctx; 146 147 PetscFunctionBegin; 148 ierr = DMGetCoordinates(dm,&coor);CHKERRQ(ierr); 149 if (!coor) return(0); 150 if (PCTelescope_isActiveRank(sred)) { 151 ierr = DMDASetUniformCoordinates(subdm,0.0,1.0,0.0,1.0,0.0,1.0);CHKERRQ(ierr); 152 } 153 /* Get the coordinate vector from the distributed array */ 154 ierr = DMGetCoordinateDM(dm,&cdm);CHKERRQ(ierr); 155 ierr = DMDACreateNaturalVector(cdm,&coor_natural);CHKERRQ(ierr); 156 157 ierr = DMDAGlobalToNaturalBegin(cdm,coor,INSERT_VALUES,coor_natural);CHKERRQ(ierr); 158 ierr = DMDAGlobalToNaturalEnd(cdm,coor,INSERT_VALUES,coor_natural);CHKERRQ(ierr); 159 160 /* get indices of the guys I want to grab */ 161 ierr = DMDAGetInfo(dm,NULL,&M,&N,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 162 if (PCTelescope_isActiveRank(sred)) { 163 ierr = DMDAGetCorners(subdm,&si,&sj,NULL,&ni,&nj,NULL);CHKERRQ(ierr); 164 Ml = ni; 165 Nl = nj; 166 } else { 167 si = sj = 0; 168 ni = nj = 0; 169 Ml = Nl = 0; 170 } 171 172 ierr = PetscMalloc1(Ml*Nl*2,&fine_indices);CHKERRQ(ierr); 173 c = 0; 174 if (PCTelescope_isActiveRank(sred)) { 175 for (j=sj; j<sj+nj; j++) { 176 for (i=si; i<si+ni; i++) { 177 nidx = (i) + (j)*M; 178 fine_indices[c ] = 2 * nidx ; 179 fine_indices[c+1] = 2 * nidx + 1 ; 180 c = c + 2; 181 } 182 } 183 if (c != Ml*Nl*2) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"c %D should equal 2 * Ml %D * Nl %D",c,Ml,Nl); 184 } 185 186 /* generate scatter */ 187 ierr = ISCreateGeneral(PetscObjectComm((PetscObject)dm),Ml*Nl*2,fine_indices,PETSC_USE_POINTER,&is_fine);CHKERRQ(ierr); 188 ierr = ISCreateStride(PETSC_COMM_SELF,Ml*Nl*2,0,1,&is_local);CHKERRQ(ierr); 189 190 /* scatter */ 191 ierr = VecCreate(PETSC_COMM_SELF,&perm_coors);CHKERRQ(ierr); 192 ierr = VecSetSizes(perm_coors,PETSC_DECIDE,Ml*Nl*2);CHKERRQ(ierr); 193 ierr = VecSetType(perm_coors,VECSEQ);CHKERRQ(ierr); 194 195 ierr = VecScatterCreate(coor_natural,is_fine,perm_coors,is_local,&sctx);CHKERRQ(ierr); 196 ierr = VecScatterBegin(sctx,coor_natural,perm_coors,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 197 ierr = VecScatterEnd( sctx,coor_natural,perm_coors,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 198 /* access */ 199 if (PCTelescope_isActiveRank(sred)) { 200 Vec _coors; 201 const PetscScalar *LA_perm; 202 PetscScalar *LA_coors; 203 204 ierr = DMGetCoordinates(subdm,&_coors);CHKERRQ(ierr); 205 ierr = VecGetArrayRead(perm_coors,&LA_perm);CHKERRQ(ierr); 206 ierr = VecGetArray(_coors,&LA_coors);CHKERRQ(ierr); 207 for (i=0; i<Ml*Nl*2; i++) { 208 LA_coors[i] = LA_perm[i]; 209 } 210 ierr = VecRestoreArray(_coors,&LA_coors);CHKERRQ(ierr); 211 ierr = VecRestoreArrayRead(perm_coors,&LA_perm);CHKERRQ(ierr); 212 } 213 214 /* update local coords */ 215 if (PCTelescope_isActiveRank(sred)) { 216 DM _dmc; 217 Vec _coors,_coors_local; 218 ierr = DMGetCoordinateDM(subdm,&_dmc);CHKERRQ(ierr); 219 ierr = DMGetCoordinates(subdm,&_coors);CHKERRQ(ierr); 220 ierr = DMGetCoordinatesLocal(subdm,&_coors_local);CHKERRQ(ierr); 221 ierr = DMGlobalToLocalBegin(_dmc,_coors,INSERT_VALUES,_coors_local);CHKERRQ(ierr); 222 ierr = DMGlobalToLocalEnd(_dmc,_coors,INSERT_VALUES,_coors_local);CHKERRQ(ierr); 223 } 224 ierr = VecScatterDestroy(&sctx);CHKERRQ(ierr); 225 ierr = ISDestroy(&is_fine);CHKERRQ(ierr); 226 ierr = PetscFree(fine_indices);CHKERRQ(ierr); 227 ierr = ISDestroy(&is_local);CHKERRQ(ierr); 228 ierr = VecDestroy(&perm_coors);CHKERRQ(ierr); 229 ierr = VecDestroy(&coor_natural);CHKERRQ(ierr); 230 PetscFunctionReturn(0); 231 } 232 233 static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors3d(PC_Telescope sred,DM dm,DM subdm) 234 { 235 PetscErrorCode ierr; 236 DM cdm; 237 Vec coor,coor_natural,perm_coors; 238 PetscInt i,j,k,si,sj,sk,ni,nj,nk,M,N,P,Ml,Nl,Pl,c,nidx; 239 PetscInt *fine_indices; 240 IS is_fine,is_local; 241 VecScatter sctx; 242 243 PetscFunctionBegin; 244 ierr = DMGetCoordinates(dm,&coor);CHKERRQ(ierr); 245 if (!coor) PetscFunctionReturn(0); 246 247 if (PCTelescope_isActiveRank(sred)) { 248 ierr = DMDASetUniformCoordinates(subdm,0.0,1.0,0.0,1.0,0.0,1.0);CHKERRQ(ierr); 249 } 250 251 /* Get the coordinate vector from the distributed array */ 252 ierr = DMGetCoordinateDM(dm,&cdm);CHKERRQ(ierr); 253 ierr = DMDACreateNaturalVector(cdm,&coor_natural);CHKERRQ(ierr); 254 ierr = DMDAGlobalToNaturalBegin(cdm,coor,INSERT_VALUES,coor_natural);CHKERRQ(ierr); 255 ierr = DMDAGlobalToNaturalEnd(cdm,coor,INSERT_VALUES,coor_natural);CHKERRQ(ierr); 256 257 /* get indices of the guys I want to grab */ 258 ierr = DMDAGetInfo(dm,NULL,&M,&N,&P,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 259 260 if (PCTelescope_isActiveRank(sred)) { 261 ierr = DMDAGetCorners(subdm,&si,&sj,&sk,&ni,&nj,&nk);CHKERRQ(ierr); 262 Ml = ni; 263 Nl = nj; 264 Pl = nk; 265 } else { 266 si = sj = sk = 0; 267 ni = nj = nk = 0; 268 Ml = Nl = Pl = 0; 269 } 270 271 ierr = PetscMalloc1(Ml*Nl*Pl*3,&fine_indices);CHKERRQ(ierr); 272 273 c = 0; 274 if (PCTelescope_isActiveRank(sred)) { 275 for (k=sk; k<sk+nk; k++) { 276 for (j=sj; j<sj+nj; j++) { 277 for (i=si; i<si+ni; i++) { 278 nidx = (i) + (j)*M + (k)*M*N; 279 fine_indices[c ] = 3 * nidx ; 280 fine_indices[c+1] = 3 * nidx + 1 ; 281 fine_indices[c+2] = 3 * nidx + 2 ; 282 c = c + 3; 283 } 284 } 285 } 286 } 287 288 /* generate scatter */ 289 ierr = ISCreateGeneral(PetscObjectComm((PetscObject)dm),Ml*Nl*Pl*3,fine_indices,PETSC_USE_POINTER,&is_fine);CHKERRQ(ierr); 290 ierr = ISCreateStride(PETSC_COMM_SELF,Ml*Nl*Pl*3,0,1,&is_local);CHKERRQ(ierr); 291 292 /* scatter */ 293 ierr = VecCreate(PETSC_COMM_SELF,&perm_coors);CHKERRQ(ierr); 294 ierr = VecSetSizes(perm_coors,PETSC_DECIDE,Ml*Nl*Pl*3);CHKERRQ(ierr); 295 ierr = VecSetType(perm_coors,VECSEQ);CHKERRQ(ierr); 296 ierr = VecScatterCreate(coor_natural,is_fine,perm_coors,is_local,&sctx);CHKERRQ(ierr); 297 ierr = VecScatterBegin(sctx,coor_natural,perm_coors,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 298 ierr = VecScatterEnd( sctx,coor_natural,perm_coors,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 299 300 /* access */ 301 if (PCTelescope_isActiveRank(sred)) { 302 Vec _coors; 303 const PetscScalar *LA_perm; 304 PetscScalar *LA_coors; 305 306 ierr = DMGetCoordinates(subdm,&_coors);CHKERRQ(ierr); 307 ierr = VecGetArrayRead(perm_coors,&LA_perm);CHKERRQ(ierr); 308 ierr = VecGetArray(_coors,&LA_coors);CHKERRQ(ierr); 309 for (i=0; i<Ml*Nl*Pl*3; i++) { 310 LA_coors[i] = LA_perm[i]; 311 } 312 ierr = VecRestoreArray(_coors,&LA_coors);CHKERRQ(ierr); 313 ierr = VecRestoreArrayRead(perm_coors,&LA_perm);CHKERRQ(ierr); 314 } 315 316 /* update local coords */ 317 if (PCTelescope_isActiveRank(sred)) { 318 DM _dmc; 319 Vec _coors,_coors_local; 320 321 ierr = DMGetCoordinateDM(subdm,&_dmc);CHKERRQ(ierr); 322 ierr = DMGetCoordinates(subdm,&_coors);CHKERRQ(ierr); 323 ierr = DMGetCoordinatesLocal(subdm,&_coors_local);CHKERRQ(ierr); 324 ierr = DMGlobalToLocalBegin(_dmc,_coors,INSERT_VALUES,_coors_local);CHKERRQ(ierr); 325 ierr = DMGlobalToLocalEnd(_dmc,_coors,INSERT_VALUES,_coors_local);CHKERRQ(ierr); 326 } 327 328 ierr = VecScatterDestroy(&sctx);CHKERRQ(ierr); 329 ierr = ISDestroy(&is_fine);CHKERRQ(ierr); 330 ierr = PetscFree(fine_indices);CHKERRQ(ierr); 331 ierr = ISDestroy(&is_local);CHKERRQ(ierr); 332 ierr = VecDestroy(&perm_coors);CHKERRQ(ierr); 333 ierr = VecDestroy(&coor_natural);CHKERRQ(ierr); 334 PetscFunctionReturn(0); 335 } 336 337 static PetscErrorCode PCTelescopeSetUp_dmda_repart_coors(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) 338 { 339 PetscInt dim; 340 DM dm,subdm; 341 PetscSubcomm psubcomm; 342 MPI_Comm comm; 343 Vec coor; 344 PetscErrorCode ierr; 345 346 PetscFunctionBegin; 347 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 348 ierr = DMGetCoordinates(dm,&coor);CHKERRQ(ierr); 349 if (!coor) PetscFunctionReturn(0); 350 psubcomm = sred->psubcomm; 351 comm = PetscSubcommParent(psubcomm); 352 subdm = ctx->dmrepart; 353 354 ierr = PetscInfo(pc,"PCTelescope: setting up the coordinates (DMDA)\n");CHKERRQ(ierr); 355 ierr = DMDAGetInfo(dm,&dim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 356 switch (dim) { 357 case 1: SETERRQ(comm,PETSC_ERR_SUP,"Telescope: DMDA (1D) repartitioning not provided"); 358 break; 359 case 2: ierr = PCTelescopeSetUp_dmda_repart_coors2d(sred,dm,subdm);CHKERRQ(ierr); 360 break; 361 case 3: ierr = PCTelescopeSetUp_dmda_repart_coors3d(sred,dm,subdm);CHKERRQ(ierr); 362 break; 363 } 364 PetscFunctionReturn(0); 365 } 366 367 /* setup repartitioned dm */ 368 PetscErrorCode PCTelescopeSetUp_dmda_repart(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) 369 { 370 PetscErrorCode ierr; 371 DM dm; 372 PetscInt dim,nx,ny,nz,ndof,nsw,sum,k; 373 DMBoundaryType bx,by,bz; 374 DMDAStencilType stencil; 375 const PetscInt *_range_i_re; 376 const PetscInt *_range_j_re; 377 const PetscInt *_range_k_re; 378 DMDAInterpolationType itype; 379 PetscInt refine_x,refine_y,refine_z; 380 MPI_Comm comm,subcomm; 381 const char *prefix; 382 383 PetscFunctionBegin; 384 comm = PetscSubcommParent(sred->psubcomm); 385 subcomm = PetscSubcommChild(sred->psubcomm); 386 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 387 388 ierr = DMDAGetInfo(dm,&dim,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,&nsw,&bx,&by,&bz,&stencil);CHKERRQ(ierr); 389 ierr = DMDAGetInterpolationType(dm,&itype);CHKERRQ(ierr); 390 ierr = DMDAGetRefinementFactor(dm,&refine_x,&refine_y,&refine_z);CHKERRQ(ierr); 391 392 ctx->dmrepart = NULL; 393 _range_i_re = _range_j_re = _range_k_re = NULL; 394 /* Create DMDA on the child communicator */ 395 if (PCTelescope_isActiveRank(sred)) { 396 switch (dim) { 397 case 1: 398 ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (1D)\n");CHKERRQ(ierr); 399 /*ierr = DMDACreate1d(subcomm,bx,nx,ndof,nsw,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ 400 ny = nz = 1; 401 by = bz = DM_BOUNDARY_NONE; 402 break; 403 case 2: 404 ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (2D)\n");CHKERRQ(ierr); 405 /*ierr = DMDACreate2d(subcomm,bx,by,stencil,nx,ny, PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ 406 nz = 1; 407 bz = DM_BOUNDARY_NONE; 408 break; 409 case 3: 410 ierr = PetscInfo(pc,"PCTelescope: setting up the DMDA on comm subset (3D)\n");CHKERRQ(ierr); 411 /*ierr = DMDACreate3d(subcomm,bx,by,bz,stencil,nx,ny,nz, PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE, ndof,nsw, NULL,NULL,NULL,&ctx->dmrepart);CHKERRQ(ierr);*/ 412 break; 413 } 414 /* 415 The API DMDACreate1d(), DMDACreate2d(), DMDACreate3d() does not allow us to set/append 416 a unique option prefix for the DM, thus I prefer to expose the contents of these API's here. 417 This allows users to control the partitioning of the subDM. 418 */ 419 ierr = DMDACreate(subcomm,&ctx->dmrepart);CHKERRQ(ierr); 420 /* Set unique option prefix name */ 421 ierr = KSPGetOptionsPrefix(sred->ksp,&prefix);CHKERRQ(ierr); 422 ierr = DMSetOptionsPrefix(ctx->dmrepart,prefix);CHKERRQ(ierr); 423 ierr = DMAppendOptionsPrefix(ctx->dmrepart,"repart_");CHKERRQ(ierr); 424 /* standard setup from DMDACreate{1,2,3}d() */ 425 ierr = DMSetDimension(ctx->dmrepart,dim);CHKERRQ(ierr); 426 ierr = DMDASetSizes(ctx->dmrepart,nx,ny,nz);CHKERRQ(ierr); 427 ierr = DMDASetNumProcs(ctx->dmrepart,PETSC_DECIDE,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 428 ierr = DMDASetBoundaryType(ctx->dmrepart,bx,by,bz);CHKERRQ(ierr); 429 ierr = DMDASetDof(ctx->dmrepart,ndof);CHKERRQ(ierr); 430 ierr = DMDASetStencilType(ctx->dmrepart,stencil);CHKERRQ(ierr); 431 ierr = DMDASetStencilWidth(ctx->dmrepart,nsw);CHKERRQ(ierr); 432 ierr = DMDASetOwnershipRanges(ctx->dmrepart,NULL,NULL,NULL);CHKERRQ(ierr); 433 ierr = DMSetFromOptions(ctx->dmrepart);CHKERRQ(ierr); 434 ierr = DMSetUp(ctx->dmrepart);CHKERRQ(ierr); 435 /* Set refinement factors and interpolation type from the partent */ 436 ierr = DMDASetRefinementFactor(ctx->dmrepart,refine_x,refine_y,refine_z);CHKERRQ(ierr); 437 ierr = DMDASetInterpolationType(ctx->dmrepart,itype);CHKERRQ(ierr); 438 439 ierr = DMDAGetInfo(ctx->dmrepart,NULL,NULL,NULL,NULL,&ctx->Mp_re,&ctx->Np_re,&ctx->Pp_re,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 440 ierr = DMDAGetOwnershipRanges(ctx->dmrepart,&_range_i_re,&_range_j_re,&_range_k_re);CHKERRQ(ierr); 441 442 ctx->dmrepart->ops->creatematrix = dm->ops->creatematrix; 443 ctx->dmrepart->ops->createdomaindecomposition = dm->ops->createdomaindecomposition; 444 } 445 446 /* generate ranges for repartitioned dm */ 447 /* note - assume rank 0 always participates */ 448 ierr = MPI_Bcast(&ctx->Mp_re,1,MPIU_INT,0,comm);CHKERRQ(ierr); 449 ierr = MPI_Bcast(&ctx->Np_re,1,MPIU_INT,0,comm);CHKERRQ(ierr); 450 ierr = MPI_Bcast(&ctx->Pp_re,1,MPIU_INT,0,comm);CHKERRQ(ierr); 451 452 ierr = PetscCalloc1(ctx->Mp_re,&ctx->range_i_re);CHKERRQ(ierr); 453 ierr = PetscCalloc1(ctx->Np_re,&ctx->range_j_re);CHKERRQ(ierr); 454 ierr = PetscCalloc1(ctx->Pp_re,&ctx->range_k_re);CHKERRQ(ierr); 455 456 if (_range_i_re) {ierr = PetscMemcpy(ctx->range_i_re,_range_i_re,sizeof(PetscInt)*ctx->Mp_re);CHKERRQ(ierr);} 457 if (_range_j_re) {ierr = PetscMemcpy(ctx->range_j_re,_range_j_re,sizeof(PetscInt)*ctx->Np_re);CHKERRQ(ierr);} 458 if (_range_k_re) {ierr = PetscMemcpy(ctx->range_k_re,_range_k_re,sizeof(PetscInt)*ctx->Pp_re);CHKERRQ(ierr);} 459 460 ierr = MPI_Bcast(ctx->range_i_re,ctx->Mp_re,MPIU_INT,0,comm);CHKERRQ(ierr); 461 ierr = MPI_Bcast(ctx->range_j_re,ctx->Np_re,MPIU_INT,0,comm);CHKERRQ(ierr); 462 ierr = MPI_Bcast(ctx->range_k_re,ctx->Pp_re,MPIU_INT,0,comm);CHKERRQ(ierr); 463 464 ierr = PetscMalloc1(ctx->Mp_re,&ctx->start_i_re);CHKERRQ(ierr); 465 ierr = PetscMalloc1(ctx->Np_re,&ctx->start_j_re);CHKERRQ(ierr); 466 ierr = PetscMalloc1(ctx->Pp_re,&ctx->start_k_re);CHKERRQ(ierr); 467 468 sum = 0; 469 for (k=0; k<ctx->Mp_re; k++) { 470 ctx->start_i_re[k] = sum; 471 sum += ctx->range_i_re[k]; 472 } 473 474 sum = 0; 475 for (k=0; k<ctx->Np_re; k++) { 476 ctx->start_j_re[k] = sum; 477 sum += ctx->range_j_re[k]; 478 } 479 480 sum = 0; 481 for (k=0; k<ctx->Pp_re; k++) { 482 ctx->start_k_re[k] = sum; 483 sum += ctx->range_k_re[k]; 484 } 485 486 /* attach repartitioned dm to child ksp */ 487 { 488 PetscErrorCode (*dmksp_func)(KSP,Mat,Mat,void*); 489 void *dmksp_ctx; 490 491 ierr = DMKSPGetComputeOperators(dm,&dmksp_func,&dmksp_ctx);CHKERRQ(ierr); 492 493 /* attach dm to ksp on sub communicator */ 494 if (PCTelescope_isActiveRank(sred)) { 495 ierr = KSPSetDM(sred->ksp,ctx->dmrepart);CHKERRQ(ierr); 496 497 if (!dmksp_func || sred->ignore_kspcomputeoperators) { 498 ierr = KSPSetDMActive(sred->ksp,PETSC_FALSE);CHKERRQ(ierr); 499 } else { 500 /* sub ksp inherits dmksp_func and context provided by user */ 501 ierr = KSPSetComputeOperators(sred->ksp,dmksp_func,dmksp_ctx);CHKERRQ(ierr); 502 ierr = KSPSetDMActive(sred->ksp,PETSC_TRUE);CHKERRQ(ierr); 503 } 504 } 505 } 506 PetscFunctionReturn(0); 507 } 508 509 PetscErrorCode PCTelescopeSetUp_dmda_permutation_3d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) 510 { 511 PetscErrorCode ierr; 512 DM dm; 513 MPI_Comm comm; 514 Mat Pscalar,P; 515 PetscInt ndof; 516 PetscInt i,j,k,location,startI[3],endI[3],lenI[3],nx,ny,nz; 517 PetscInt sr,er,Mr; 518 Vec V; 519 520 PetscFunctionBegin; 521 ierr = PetscInfo(pc,"PCTelescope: setting up the permutation matrix (DMDA-3D)\n");CHKERRQ(ierr); 522 ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 523 524 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 525 ierr = DMDAGetInfo(dm,NULL,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 526 527 ierr = DMGetGlobalVector(dm,&V);CHKERRQ(ierr); 528 ierr = VecGetSize(V,&Mr);CHKERRQ(ierr); 529 ierr = VecGetOwnershipRange(V,&sr,&er);CHKERRQ(ierr); 530 ierr = DMRestoreGlobalVector(dm,&V);CHKERRQ(ierr); 531 sr = sr / ndof; 532 er = er / ndof; 533 Mr = Mr / ndof; 534 535 ierr = MatCreate(comm,&Pscalar);CHKERRQ(ierr); 536 ierr = MatSetSizes(Pscalar,(er-sr),(er-sr),Mr,Mr);CHKERRQ(ierr); 537 ierr = MatSetType(Pscalar,MATAIJ);CHKERRQ(ierr); 538 ierr = MatSeqAIJSetPreallocation(Pscalar,1,NULL);CHKERRQ(ierr); 539 ierr = MatMPIAIJSetPreallocation(Pscalar,1,NULL,1,NULL);CHKERRQ(ierr); 540 541 ierr = DMDAGetCorners(dm,NULL,NULL,NULL,&lenI[0],&lenI[1],&lenI[2]);CHKERRQ(ierr); 542 ierr = DMDAGetCorners(dm,&startI[0],&startI[1],&startI[2],&endI[0],&endI[1],&endI[2]);CHKERRQ(ierr); 543 endI[0] += startI[0]; 544 endI[1] += startI[1]; 545 endI[2] += startI[2]; 546 547 for (k=startI[2]; k<endI[2]; k++) { 548 for (j=startI[1]; j<endI[1]; j++) { 549 for (i=startI[0]; i<endI[0]; i++) { 550 PetscMPIInt rank_ijk_re,rank_reI[3]; 551 PetscInt s0_re; 552 PetscInt ii,jj,kk,local_ijk_re,mapped_ijk; 553 PetscInt lenI_re[3]; 554 555 location = (i - startI[0]) + (j - startI[1])*lenI[0] + (k - startI[2])*lenI[0]*lenI[1]; 556 ierr = _DMDADetermineRankFromGlobalIJK(3,i,j,k, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, 557 ctx->start_i_re,ctx->start_j_re,ctx->start_k_re, 558 ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, 559 &rank_reI[0],&rank_reI[1],&rank_reI[2],&rank_ijk_re);CHKERRQ(ierr); 560 ierr = _DMDADetermineGlobalS0(3,rank_ijk_re, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, &s0_re);CHKERRQ(ierr); 561 ii = i - ctx->start_i_re[ rank_reI[0] ]; 562 if (ii < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error ii"); 563 jj = j - ctx->start_j_re[ rank_reI[1] ]; 564 if (jj < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error jj"); 565 kk = k - ctx->start_k_re[ rank_reI[2] ]; 566 if (kk < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm3d] index error kk"); 567 lenI_re[0] = ctx->range_i_re[ rank_reI[0] ]; 568 lenI_re[1] = ctx->range_j_re[ rank_reI[1] ]; 569 lenI_re[2] = ctx->range_k_re[ rank_reI[2] ]; 570 local_ijk_re = ii + jj * lenI_re[0] + kk * lenI_re[0] * lenI_re[1]; 571 mapped_ijk = s0_re + local_ijk_re; 572 ierr = MatSetValue(Pscalar,sr+location,mapped_ijk,1.0,INSERT_VALUES);CHKERRQ(ierr); 573 } 574 } 575 } 576 ierr = MatAssemblyBegin(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 577 ierr = MatAssemblyEnd(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 578 ierr = MatCreateMAIJ(Pscalar,ndof,&P);CHKERRQ(ierr); 579 ierr = MatDestroy(&Pscalar);CHKERRQ(ierr); 580 ctx->permutation = P; 581 PetscFunctionReturn(0); 582 } 583 584 PetscErrorCode PCTelescopeSetUp_dmda_permutation_2d(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) 585 { 586 PetscErrorCode ierr; 587 DM dm; 588 MPI_Comm comm; 589 Mat Pscalar,P; 590 PetscInt ndof; 591 PetscInt i,j,location,startI[2],endI[2],lenI[2],nx,ny,nz; 592 PetscInt sr,er,Mr; 593 Vec V; 594 595 PetscFunctionBegin; 596 ierr = PetscInfo(pc,"PCTelescope: setting up the permutation matrix (DMDA-2D)\n");CHKERRQ(ierr); 597 ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 598 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 599 ierr = DMDAGetInfo(dm,NULL,&nx,&ny,&nz,NULL,NULL,NULL,&ndof,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 600 ierr = DMGetGlobalVector(dm,&V);CHKERRQ(ierr); 601 ierr = VecGetSize(V,&Mr);CHKERRQ(ierr); 602 ierr = VecGetOwnershipRange(V,&sr,&er);CHKERRQ(ierr); 603 ierr = DMRestoreGlobalVector(dm,&V);CHKERRQ(ierr); 604 sr = sr / ndof; 605 er = er / ndof; 606 Mr = Mr / ndof; 607 608 ierr = MatCreate(comm,&Pscalar);CHKERRQ(ierr); 609 ierr = MatSetSizes(Pscalar,(er-sr),(er-sr),Mr,Mr);CHKERRQ(ierr); 610 ierr = MatSetType(Pscalar,MATAIJ);CHKERRQ(ierr); 611 ierr = MatSeqAIJSetPreallocation(Pscalar,1,NULL);CHKERRQ(ierr); 612 ierr = MatMPIAIJSetPreallocation(Pscalar,1,NULL,1,NULL);CHKERRQ(ierr); 613 614 ierr = DMDAGetCorners(dm,NULL,NULL,NULL,&lenI[0],&lenI[1],NULL);CHKERRQ(ierr); 615 ierr = DMDAGetCorners(dm,&startI[0],&startI[1],NULL,&endI[0],&endI[1],NULL);CHKERRQ(ierr); 616 endI[0] += startI[0]; 617 endI[1] += startI[1]; 618 619 for (j=startI[1]; j<endI[1]; j++) { 620 for (i=startI[0]; i<endI[0]; i++) { 621 PetscMPIInt rank_ijk_re,rank_reI[3]; 622 PetscInt s0_re; 623 PetscInt ii,jj,local_ijk_re,mapped_ijk; 624 PetscInt lenI_re[3]; 625 626 location = (i - startI[0]) + (j - startI[1])*lenI[0]; 627 ierr = _DMDADetermineRankFromGlobalIJK(2,i,j,0, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, 628 ctx->start_i_re,ctx->start_j_re,ctx->start_k_re, 629 ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, 630 &rank_reI[0],&rank_reI[1],NULL,&rank_ijk_re);CHKERRQ(ierr); 631 632 ierr = _DMDADetermineGlobalS0(2,rank_ijk_re, ctx->Mp_re,ctx->Np_re,ctx->Pp_re, ctx->range_i_re,ctx->range_j_re,ctx->range_k_re, &s0_re);CHKERRQ(ierr); 633 634 ii = i - ctx->start_i_re[ rank_reI[0] ]; 635 if (ii < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm2d] index error ii"); 636 jj = j - ctx->start_j_re[ rank_reI[1] ]; 637 if (jj < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"[dmdarepart-perm2d] index error jj"); 638 639 lenI_re[0] = ctx->range_i_re[ rank_reI[0] ]; 640 lenI_re[1] = ctx->range_j_re[ rank_reI[1] ]; 641 local_ijk_re = ii + jj * lenI_re[0]; 642 mapped_ijk = s0_re + local_ijk_re; 643 ierr = MatSetValue(Pscalar,sr+location,mapped_ijk,1.0,INSERT_VALUES);CHKERRQ(ierr); 644 } 645 } 646 ierr = MatAssemblyBegin(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 647 ierr = MatAssemblyEnd(Pscalar,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 648 ierr = MatCreateMAIJ(Pscalar,ndof,&P);CHKERRQ(ierr); 649 ierr = MatDestroy(&Pscalar);CHKERRQ(ierr); 650 ctx->permutation = P; 651 PetscFunctionReturn(0); 652 } 653 654 PetscErrorCode PCTelescopeSetUp_dmda_scatters(PC pc,PC_Telescope sred,PC_Telescope_DMDACtx *ctx) 655 { 656 PetscErrorCode ierr; 657 Vec xred,yred,xtmp,x,xp; 658 VecScatter scatter; 659 IS isin; 660 Mat B; 661 PetscInt m,bs,st,ed; 662 MPI_Comm comm; 663 664 PetscFunctionBegin; 665 ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 666 ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); 667 ierr = MatCreateVecs(B,&x,NULL);CHKERRQ(ierr); 668 ierr = MatGetBlockSize(B,&bs);CHKERRQ(ierr); 669 ierr = VecDuplicate(x,&xp);CHKERRQ(ierr); 670 m = 0; 671 xred = NULL; 672 yred = NULL; 673 if (PCTelescope_isActiveRank(sred)) { 674 ierr = DMCreateGlobalVector(ctx->dmrepart,&xred);CHKERRQ(ierr); 675 ierr = VecDuplicate(xred,&yred);CHKERRQ(ierr); 676 ierr = VecGetOwnershipRange(xred,&st,&ed);CHKERRQ(ierr); 677 ierr = ISCreateStride(comm,ed-st,st,1,&isin);CHKERRQ(ierr); 678 ierr = VecGetLocalSize(xred,&m);CHKERRQ(ierr); 679 } else { 680 ierr = VecGetOwnershipRange(x,&st,&ed);CHKERRQ(ierr); 681 ierr = ISCreateStride(comm,0,st,1,&isin);CHKERRQ(ierr); 682 } 683 ierr = ISSetBlockSize(isin,bs);CHKERRQ(ierr); 684 ierr = VecCreate(comm,&xtmp);CHKERRQ(ierr); 685 ierr = VecSetSizes(xtmp,m,PETSC_DECIDE);CHKERRQ(ierr); 686 ierr = VecSetBlockSize(xtmp,bs);CHKERRQ(ierr); 687 ierr = VecSetType(xtmp,((PetscObject)x)->type_name);CHKERRQ(ierr); 688 ierr = VecScatterCreate(x,isin,xtmp,NULL,&scatter);CHKERRQ(ierr); 689 sred->xred = xred; 690 sred->yred = yred; 691 sred->isin = isin; 692 sred->scatter = scatter; 693 sred->xtmp = xtmp; 694 695 ctx->xp = xp; 696 ierr = VecDestroy(&x);CHKERRQ(ierr); 697 PetscFunctionReturn(0); 698 } 699 700 PetscErrorCode PCTelescopeSetUp_dmda(PC pc,PC_Telescope sred) 701 { 702 PC_Telescope_DMDACtx *ctx; 703 PetscInt dim; 704 DM dm; 705 MPI_Comm comm; 706 PetscErrorCode ierr; 707 708 PetscFunctionBegin; 709 ierr = PetscInfo(pc,"PCTelescope: setup (DMDA)\n");CHKERRQ(ierr); 710 PetscMalloc1(1,&ctx); 711 PetscMemzero(ctx,sizeof(PC_Telescope_DMDACtx)); 712 sred->dm_ctx = (void*)ctx; 713 714 ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 715 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 716 ierr = DMDAGetInfo(dm,&dim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 717 718 PCTelescopeSetUp_dmda_repart(pc,sred,ctx); 719 PCTelescopeSetUp_dmda_repart_coors(pc,sred,ctx); 720 switch (dim) { 721 case 1: SETERRQ(comm,PETSC_ERR_SUP,"Telescope: DMDA (1D) repartitioning not provided"); 722 break; 723 case 2: ierr = PCTelescopeSetUp_dmda_permutation_2d(pc,sred,ctx);CHKERRQ(ierr); 724 break; 725 case 3: ierr = PCTelescopeSetUp_dmda_permutation_3d(pc,sred,ctx);CHKERRQ(ierr); 726 break; 727 } 728 ierr = PCTelescopeSetUp_dmda_scatters(pc,sred,ctx);CHKERRQ(ierr); 729 PetscFunctionReturn(0); 730 } 731 732 PetscErrorCode PCTelescopeMatCreate_dmda_dmactivefalse(PC pc,PC_Telescope sred,MatReuse reuse,Mat *A) 733 { 734 PetscErrorCode ierr; 735 PC_Telescope_DMDACtx *ctx; 736 MPI_Comm comm,subcomm; 737 Mat Bperm,Bred,B,P; 738 PetscInt nr,nc; 739 IS isrow,iscol; 740 Mat Blocal,*_Blocal; 741 742 PetscFunctionBegin; 743 ierr = PetscInfo(pc,"PCTelescope: updating the redundant preconditioned operator (DMDA)\n");CHKERRQ(ierr); 744 ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 745 subcomm = PetscSubcommChild(sred->psubcomm); 746 ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; 747 748 ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); 749 ierr = MatGetSize(B,&nr,&nc);CHKERRQ(ierr); 750 751 P = ctx->permutation; 752 ierr = MatPtAP(B,P,MAT_INITIAL_MATRIX,1.1,&Bperm);CHKERRQ(ierr); 753 754 /* Get submatrices */ 755 isrow = sred->isin; 756 ierr = ISCreateStride(comm,nc,0,1,&iscol);CHKERRQ(ierr); 757 758 ierr = MatCreateSubMatrices(Bperm,1,&isrow,&iscol,MAT_INITIAL_MATRIX,&_Blocal);CHKERRQ(ierr); 759 Blocal = *_Blocal; 760 Bred = NULL; 761 if (PCTelescope_isActiveRank(sred)) { 762 PetscInt mm; 763 764 if (reuse != MAT_INITIAL_MATRIX) {Bred = *A;} 765 ierr = MatGetSize(Blocal,&mm,NULL);CHKERRQ(ierr); 766 /* ierr = MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,PETSC_DECIDE,reuse,&Bred);CHKERRQ(ierr); */ 767 ierr = MatCreateMPIMatConcatenateSeqMat(subcomm,Blocal,mm,reuse,&Bred);CHKERRQ(ierr); 768 } 769 *A = Bred; 770 771 ierr = ISDestroy(&iscol);CHKERRQ(ierr); 772 ierr = MatDestroy(&Bperm);CHKERRQ(ierr); 773 ierr = MatDestroyMatrices(1,&_Blocal);CHKERRQ(ierr); 774 PetscFunctionReturn(0); 775 } 776 777 PetscErrorCode PCTelescopeMatCreate_dmda(PC pc,PC_Telescope sred,MatReuse reuse,Mat *A) 778 { 779 PetscErrorCode ierr; 780 DM dm; 781 PetscErrorCode (*dmksp_func)(KSP,Mat,Mat,void*); 782 void *dmksp_ctx; 783 784 PetscFunctionBegin; 785 ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 786 ierr = DMKSPGetComputeOperators(dm,&dmksp_func,&dmksp_ctx);CHKERRQ(ierr); 787 /* We assume that dmksp_func = NULL, is equivalent to dmActive = PETSC_FALSE */ 788 if (dmksp_func && !sred->ignore_kspcomputeoperators) { 789 DM dmrepart; 790 Mat Ak; 791 792 *A = NULL; 793 if (PCTelescope_isActiveRank(sred)) { 794 ierr = KSPGetDM(sred->ksp,&dmrepart);CHKERRQ(ierr); 795 if (reuse == MAT_INITIAL_MATRIX) { 796 ierr = DMCreateMatrix(dmrepart,&Ak);CHKERRQ(ierr); 797 *A = Ak; 798 } else if (reuse == MAT_REUSE_MATRIX) { 799 Ak = *A; 800 } 801 /* 802 There is no need to explicitly assemble the operator now, 803 the sub-KSP will call the method provided to KSPSetComputeOperators() during KSPSetUp() 804 */ 805 } 806 } else { 807 ierr = PCTelescopeMatCreate_dmda_dmactivefalse(pc,sred,reuse,A);CHKERRQ(ierr); 808 } 809 PetscFunctionReturn(0); 810 } 811 812 PetscErrorCode PCTelescopeSubNullSpaceCreate_dmda_Telescope(PC pc,PC_Telescope sred,MatNullSpace nullspace,MatNullSpace *sub_nullspace) 813 { 814 PetscErrorCode ierr; 815 PetscBool has_const; 816 PetscInt i,k,n = 0; 817 const Vec *vecs; 818 Vec *sub_vecs = NULL; 819 MPI_Comm subcomm; 820 PC_Telescope_DMDACtx *ctx; 821 822 PetscFunctionBegin; 823 ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; 824 subcomm = PetscSubcommChild(sred->psubcomm); 825 ierr = MatNullSpaceGetVecs(nullspace,&has_const,&n,&vecs);CHKERRQ(ierr); 826 827 if (PCTelescope_isActiveRank(sred)) { 828 /* create new vectors */ 829 if (n) { 830 ierr = VecDuplicateVecs(sred->xred,n,&sub_vecs);CHKERRQ(ierr); 831 } 832 } 833 834 /* copy entries */ 835 for (k=0; k<n; k++) { 836 const PetscScalar *x_array; 837 PetscScalar *LA_sub_vec; 838 PetscInt st,ed; 839 840 /* permute vector into ordering associated with re-partitioned dmda */ 841 ierr = MatMultTranspose(ctx->permutation,vecs[k],ctx->xp);CHKERRQ(ierr); 842 843 /* pull in vector x->xtmp */ 844 ierr = VecScatterBegin(sred->scatter,ctx->xp,sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 845 ierr = VecScatterEnd(sred->scatter,ctx->xp,sred->xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 846 847 /* copy vector entries into xred */ 848 ierr = VecGetArrayRead(sred->xtmp,&x_array);CHKERRQ(ierr); 849 if (sub_vecs) { 850 if (sub_vecs[k]) { 851 ierr = VecGetOwnershipRange(sub_vecs[k],&st,&ed);CHKERRQ(ierr); 852 ierr = VecGetArray(sub_vecs[k],&LA_sub_vec);CHKERRQ(ierr); 853 for (i=0; i<ed-st; i++) { 854 LA_sub_vec[i] = x_array[i]; 855 } 856 ierr = VecRestoreArray(sub_vecs[k],&LA_sub_vec);CHKERRQ(ierr); 857 } 858 } 859 ierr = VecRestoreArrayRead(sred->xtmp,&x_array);CHKERRQ(ierr); 860 } 861 862 if (PCTelescope_isActiveRank(sred)) { 863 /* create new (near) nullspace for redundant object */ 864 ierr = MatNullSpaceCreate(subcomm,has_const,n,sub_vecs,sub_nullspace);CHKERRQ(ierr); 865 ierr = VecDestroyVecs(n,&sub_vecs);CHKERRQ(ierr); 866 if (nullspace->remove) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callbacks not supported when propagating (near) nullspaces with PCTelescope"); 867 if (nullspace->rmctx) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Propagation of custom remove callback context not supported when propagating (near) nullspaces with PCTelescope"); 868 } 869 PetscFunctionReturn(0); 870 } 871 872 PetscErrorCode PCTelescopeMatNullSpaceCreate_dmda(PC pc,PC_Telescope sred,Mat sub_mat) 873 { 874 PetscErrorCode ierr; 875 Mat B; 876 877 PetscFunctionBegin; 878 ierr = PCGetOperators(pc,NULL,&B);CHKERRQ(ierr); 879 { 880 MatNullSpace nullspace,sub_nullspace; 881 ierr = MatGetNullSpace(B,&nullspace);CHKERRQ(ierr); 882 if (nullspace) { 883 ierr = PetscInfo(pc,"PCTelescope: generating nullspace (DMDA)\n");CHKERRQ(ierr); 884 ierr = PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc,sred,nullspace,&sub_nullspace);CHKERRQ(ierr); 885 if (PCTelescope_isActiveRank(sred)) { 886 ierr = MatSetNullSpace(sub_mat,sub_nullspace);CHKERRQ(ierr); 887 ierr = MatNullSpaceDestroy(&sub_nullspace);CHKERRQ(ierr); 888 } 889 } 890 } 891 { 892 MatNullSpace nearnullspace,sub_nearnullspace; 893 ierr = MatGetNearNullSpace(B,&nearnullspace);CHKERRQ(ierr); 894 if (nearnullspace) { 895 ierr = PetscInfo(pc,"PCTelescope: generating near nullspace (DMDA)\n");CHKERRQ(ierr); 896 ierr = PCTelescopeSubNullSpaceCreate_dmda_Telescope(pc,sred,nearnullspace,&sub_nearnullspace);CHKERRQ(ierr); 897 if (PCTelescope_isActiveRank(sred)) { 898 ierr = MatSetNearNullSpace(sub_mat,sub_nearnullspace);CHKERRQ(ierr); 899 ierr = MatNullSpaceDestroy(&sub_nearnullspace);CHKERRQ(ierr); 900 } 901 } 902 } 903 PetscFunctionReturn(0); 904 } 905 906 PetscErrorCode PCApply_Telescope_dmda(PC pc,Vec x,Vec y) 907 { 908 PC_Telescope sred = (PC_Telescope)pc->data; 909 PetscErrorCode ierr; 910 Mat perm; 911 Vec xtmp,xp,xred,yred; 912 PetscInt i,st,ed; 913 VecScatter scatter; 914 PetscScalar *array; 915 const PetscScalar *x_array; 916 PC_Telescope_DMDACtx *ctx; 917 918 ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; 919 xtmp = sred->xtmp; 920 scatter = sred->scatter; 921 xred = sred->xred; 922 yred = sred->yred; 923 perm = ctx->permutation; 924 xp = ctx->xp; 925 926 PetscFunctionBegin; 927 ierr = PetscCitationsRegister(citation,&cited);CHKERRQ(ierr); 928 929 /* permute vector into ordering associated with re-partitioned dmda */ 930 ierr = MatMultTranspose(perm,x,xp);CHKERRQ(ierr); 931 932 /* pull in vector x->xtmp */ 933 ierr = VecScatterBegin(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 934 ierr = VecScatterEnd(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 935 936 /* copy vector entires into xred */ 937 ierr = VecGetArrayRead(xtmp,&x_array);CHKERRQ(ierr); 938 if (xred) { 939 PetscScalar *LA_xred; 940 ierr = VecGetOwnershipRange(xred,&st,&ed);CHKERRQ(ierr); 941 942 ierr = VecGetArray(xred,&LA_xred);CHKERRQ(ierr); 943 for (i=0; i<ed-st; i++) { 944 LA_xred[i] = x_array[i]; 945 } 946 ierr = VecRestoreArray(xred,&LA_xred);CHKERRQ(ierr); 947 } 948 ierr = VecRestoreArrayRead(xtmp,&x_array);CHKERRQ(ierr); 949 950 /* solve */ 951 if (PCTelescope_isActiveRank(sred)) { 952 ierr = KSPSolve(sred->ksp,xred,yred);CHKERRQ(ierr); 953 ierr = KSPCheckSolve(sred->ksp,pc,yred);CHKERRQ(ierr); 954 } 955 956 /* return vector */ 957 ierr = VecGetArray(xtmp,&array);CHKERRQ(ierr); 958 if (yred) { 959 const PetscScalar *LA_yred; 960 ierr = VecGetOwnershipRange(yred,&st,&ed);CHKERRQ(ierr); 961 ierr = VecGetArrayRead(yred,&LA_yred);CHKERRQ(ierr); 962 for (i=0; i<ed-st; i++) { 963 array[i] = LA_yred[i]; 964 } 965 ierr = VecRestoreArrayRead(yred,&LA_yred);CHKERRQ(ierr); 966 } 967 ierr = VecRestoreArray(xtmp,&array);CHKERRQ(ierr); 968 ierr = VecScatterBegin(scatter,xtmp,xp,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 969 ierr = VecScatterEnd(scatter,xtmp,xp,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 970 ierr = MatMult(perm,xp,y);CHKERRQ(ierr); 971 PetscFunctionReturn(0); 972 } 973 974 PetscErrorCode PCApplyRichardson_Telescope_dmda(PC pc,Vec x,Vec y,Vec w,PetscReal rtol,PetscReal abstol, PetscReal dtol,PetscInt its,PetscBool zeroguess,PetscInt *outits,PCRichardsonConvergedReason *reason) 975 { 976 PC_Telescope sred = (PC_Telescope)pc->data; 977 PetscErrorCode ierr; 978 Mat perm; 979 Vec xtmp,xp,yred; 980 PetscInt i,st,ed; 981 VecScatter scatter; 982 const PetscScalar *x_array; 983 PetscBool default_init_guess_value = PETSC_FALSE; 984 PC_Telescope_DMDACtx *ctx; 985 986 PetscFunctionBegin; 987 ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; 988 xtmp = sred->xtmp; 989 scatter = sred->scatter; 990 yred = sred->yred; 991 perm = ctx->permutation; 992 xp = ctx->xp; 993 994 if (its > 1) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"PCApplyRichardson_Telescope_dmda only supports max_it = 1"); 995 *reason = (PCRichardsonConvergedReason)0; 996 997 if (!zeroguess) { 998 ierr = PetscInfo(pc,"PCTelescopeDMDA: Scattering y for non-zero-initial guess\n");CHKERRQ(ierr); 999 /* permute vector into ordering associated with re-partitioned dmda */ 1000 ierr = MatMultTranspose(perm,y,xp);CHKERRQ(ierr); 1001 1002 /* pull in vector x->xtmp */ 1003 ierr = VecScatterBegin(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1004 ierr = VecScatterEnd(scatter,xp,xtmp,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1005 1006 /* copy vector entires into xred */ 1007 ierr = VecGetArrayRead(xtmp,&x_array);CHKERRQ(ierr); 1008 if (yred) { 1009 PetscScalar *LA_yred; 1010 ierr = VecGetOwnershipRange(yred,&st,&ed);CHKERRQ(ierr); 1011 ierr = VecGetArray(yred,&LA_yred);CHKERRQ(ierr); 1012 for (i=0; i<ed-st; i++) { 1013 LA_yred[i] = x_array[i]; 1014 } 1015 ierr = VecRestoreArray(yred,&LA_yred);CHKERRQ(ierr); 1016 } 1017 ierr = VecRestoreArrayRead(xtmp,&x_array);CHKERRQ(ierr); 1018 } 1019 1020 if (PCTelescope_isActiveRank(sred)) { 1021 ierr = KSPGetInitialGuessNonzero(sred->ksp,&default_init_guess_value);CHKERRQ(ierr); 1022 if (!zeroguess) ierr = KSPSetInitialGuessNonzero(sred->ksp,PETSC_TRUE);CHKERRQ(ierr); 1023 } 1024 1025 ierr = PCApply_Telescope_dmda(pc,x,y);CHKERRQ(ierr); 1026 1027 if (PCTelescope_isActiveRank(sred)) { 1028 ierr = KSPSetInitialGuessNonzero(sred->ksp,default_init_guess_value);CHKERRQ(ierr); 1029 } 1030 1031 if (!*reason) *reason = PCRICHARDSON_CONVERGED_ITS; 1032 *outits = 1; 1033 PetscFunctionReturn(0); 1034 } 1035 1036 PetscErrorCode PCReset_Telescope_dmda(PC pc) 1037 { 1038 PetscErrorCode ierr; 1039 PC_Telescope sred = (PC_Telescope)pc->data; 1040 PC_Telescope_DMDACtx *ctx; 1041 1042 PetscFunctionBegin; 1043 ctx = (PC_Telescope_DMDACtx*)sred->dm_ctx; 1044 ierr = VecDestroy(&ctx->xp);CHKERRQ(ierr); 1045 ierr = MatDestroy(&ctx->permutation);CHKERRQ(ierr); 1046 ierr = DMDestroy(&ctx->dmrepart);CHKERRQ(ierr); 1047 ierr = PetscFree(ctx->range_i_re);CHKERRQ(ierr); 1048 ierr = PetscFree(ctx->range_j_re);CHKERRQ(ierr); 1049 ierr = PetscFree(ctx->range_k_re);CHKERRQ(ierr); 1050 ierr = PetscFree(ctx->start_i_re);CHKERRQ(ierr); 1051 ierr = PetscFree(ctx->start_j_re);CHKERRQ(ierr); 1052 ierr = PetscFree(ctx->start_k_re);CHKERRQ(ierr); 1053 PetscFunctionReturn(0); 1054 } 1055 1056 PetscErrorCode DMView_DA_Short_3d(DM dm,PetscViewer v) 1057 { 1058 PetscInt M,N,P,m,n,p,ndof,nsw; 1059 MPI_Comm comm; 1060 PetscMPIInt size; 1061 const char* prefix; 1062 PetscErrorCode ierr; 1063 1064 PetscFunctionBegin; 1065 ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr); 1066 ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1067 ierr = DMGetOptionsPrefix(dm,&prefix);CHKERRQ(ierr); 1068 ierr = DMDAGetInfo(dm,NULL,&M,&N,&P,&m,&n,&p,&ndof,&nsw,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 1069 if (prefix) {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: (%s) %d MPI processes\n",prefix,size);CHKERRQ(ierr);} 1070 else {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: %d MPI processes\n",size);CHKERRQ(ierr);} 1071 ierr = PetscViewerASCIIPrintf(v," M %D N %D P %D m %D n %D p %D dof %D overlap %D\n",M,N,P,m,n,p,ndof,nsw);CHKERRQ(ierr); 1072 PetscFunctionReturn(0); 1073 } 1074 1075 PetscErrorCode DMView_DA_Short_2d(DM dm,PetscViewer v) 1076 { 1077 PetscInt M,N,m,n,ndof,nsw; 1078 MPI_Comm comm; 1079 PetscMPIInt size; 1080 const char* prefix; 1081 PetscErrorCode ierr; 1082 1083 PetscFunctionBegin; 1084 ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr); 1085 ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1086 ierr = DMGetOptionsPrefix(dm,&prefix);CHKERRQ(ierr); 1087 ierr = DMDAGetInfo(dm,NULL,&M,&N,NULL,&m,&n,NULL,&ndof,&nsw,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 1088 if (prefix) {PetscViewerASCIIPrintf(v,"DMDA Object: (%s) %d MPI processes\n",prefix,size);CHKERRQ(ierr);} 1089 else {ierr = PetscViewerASCIIPrintf(v,"DMDA Object: %d MPI processes\n",size);CHKERRQ(ierr);} 1090 ierr = PetscViewerASCIIPrintf(v," M %D N %D m %D n %D dof %D overlap %D\n",M,N,m,n,ndof,nsw);CHKERRQ(ierr); 1091 PetscFunctionReturn(0); 1092 } 1093 1094 PetscErrorCode DMView_DA_Short(DM dm,PetscViewer v) 1095 { 1096 PetscErrorCode ierr; 1097 PetscInt dim; 1098 1099 PetscFunctionBegin; 1100 ierr = DMDAGetInfo(dm,&dim,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 1101 switch (dim) { 1102 case 2: ierr = DMView_DA_Short_2d(dm,v);CHKERRQ(ierr); 1103 break; 1104 case 3: ierr = DMView_DA_Short_3d(dm,v);CHKERRQ(ierr); 1105 break; 1106 } 1107 PetscFunctionReturn(0); 1108 } 1109 1110