1dba47a55SKris Buschelman #define PETSCKSP_DLL 2dba47a55SKris Buschelman 34b9ad928SBarry Smith /* 43f457be1SHong Zhang This file defines a "solve the problem redundantly on each subgroup of processor" preconditioner. 54b9ad928SBarry Smith */ 66356e834SBarry Smith #include "private/pcimpl.h" /*I "petscpc.h" I*/ 74b9ad928SBarry Smith #include "petscksp.h" 84b9ad928SBarry Smith 94b9ad928SBarry Smith typedef struct { 104b9ad928SBarry Smith PC pc; /* actual preconditioner used on each processor */ 113f457be1SHong Zhang Vec xsub,ysub; /* vectors of a subcommunicator to hold parallel vectors of pc->comm */ 123f457be1SHong Zhang Vec xdup,ydup; /* parallel vector that congregates xsub or ysub facilitating vector scattering */ 134b9ad928SBarry Smith Mat *pmats; /* matrix and optional preconditioner matrix */ 14*f664ae05SHong Zhang Mat pmats_sub; /* matrix and optional preconditioner matrix belong to a subcommunicator */ 153f457be1SHong Zhang VecScatter scatterin,scatterout; /* scatter used to move all values to each processor group (subcommunicator) */ 164b9ad928SBarry Smith PetscTruth useparallelmat; 173f457be1SHong Zhang MPI_Comm subcomm; /* processors belong to a subcommunicator implement a PC in parallel */ 183f457be1SHong Zhang MPI_Comm dupcomm; /* processors belong to pc->comm with their rank remapped in the way 193f457be1SHong Zhang that vector xdup/ydup has contiguous rank while appending xsub/ysub along their colors */ 203f457be1SHong Zhang PetscInt nsubcomm; /* num of subcommunicators, which equals the num of redundant matrix systems */ 213f457be1SHong Zhang PetscInt color; /* color of processors in a subcommunicator */ 224b9ad928SBarry Smith } PC_Redundant; 234b9ad928SBarry Smith 244b9ad928SBarry Smith #undef __FUNCT__ 254b9ad928SBarry Smith #define __FUNCT__ "PCView_Redundant" 266849ba73SBarry Smith static PetscErrorCode PCView_Redundant(PC pc,PetscViewer viewer) 274b9ad928SBarry Smith { 284b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 29dfbe8321SBarry Smith PetscErrorCode ierr; 3013f74950SBarry Smith PetscMPIInt rank; 3132077d6dSBarry Smith PetscTruth iascii,isstring; 324b9ad928SBarry Smith PetscViewer sviewer; 334b9ad928SBarry Smith 344b9ad928SBarry Smith PetscFunctionBegin; 354b9ad928SBarry Smith ierr = MPI_Comm_rank(pc->comm,&rank);CHKERRQ(ierr); 3632077d6dSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&iascii);CHKERRQ(ierr); 374b9ad928SBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_STRING,&isstring);CHKERRQ(ierr); 3832077d6dSBarry Smith if (iascii) { 394b9ad928SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," Redundant solver preconditioner: Actual PC follows\n");CHKERRQ(ierr); 404b9ad928SBarry Smith ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 414b9ad928SBarry Smith if (!rank) { 424b9ad928SBarry Smith ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 434b9ad928SBarry Smith ierr = PCView(red->pc,sviewer);CHKERRQ(ierr); 444b9ad928SBarry Smith ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 454b9ad928SBarry Smith } 464b9ad928SBarry Smith ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 474b9ad928SBarry Smith } else if (isstring) { 484b9ad928SBarry Smith ierr = PetscViewerStringSPrintf(viewer," Redundant solver preconditioner");CHKERRQ(ierr); 494b9ad928SBarry Smith ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 504b9ad928SBarry Smith if (!rank) { 514b9ad928SBarry Smith ierr = PCView(red->pc,sviewer);CHKERRQ(ierr); 524b9ad928SBarry Smith } 534b9ad928SBarry Smith ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 544b9ad928SBarry Smith } else { 5579a5c55eSBarry Smith SETERRQ1(PETSC_ERR_SUP,"Viewer type %s not supported for PC redundant",((PetscObject)viewer)->type_name); 564b9ad928SBarry Smith } 574b9ad928SBarry Smith PetscFunctionReturn(0); 584b9ad928SBarry Smith } 594b9ad928SBarry Smith 603f457be1SHong Zhang #include "src/mat/matimpl.h" /*I "petscmat.h" I*/ 613f457be1SHong Zhang #include "private/vecimpl.h" 623f457be1SHong Zhang #include "src/mat/impls/aij/mpi/mpiaij.h" /*I "petscmat.h" I*/ 633f457be1SHong Zhang #include "src/mat/impls/aij/seq/aij.h" /*I "petscmat.h" I*/ 643f457be1SHong Zhang 653f457be1SHong Zhang #undef __FUNCT__ 663f457be1SHong Zhang #define __FUNCT__ "MatGetRedundantMatrix" 67*f664ae05SHong Zhang PetscErrorCode MatGetRedundantMatrix_AIJ(Mat mat,PetscInt nsubcomm,MPI_Comm subcomm,PetscInt mlocal_sub,MatReuse reuse,Mat *matredundant) 683f457be1SHong Zhang { 693f457be1SHong Zhang PetscMPIInt rank,size,subrank,subsize; 703f457be1SHong Zhang MPI_Comm comm=mat->comm; 713f457be1SHong Zhang PetscErrorCode ierr; 72*f664ae05SHong Zhang PetscInt nsends,nrecvs,i,prid=100,itmp; 733f457be1SHong Zhang PetscMPIInt *send_rank,*recv_rank; 74*f664ae05SHong Zhang PetscInt *rowrange=mat->rmap.range,nzlocal; 753f457be1SHong Zhang Mat_MPIAIJ *aij = (Mat_MPIAIJ*)mat->data; 763f457be1SHong Zhang Mat A=aij->A,B=aij->B; 773f457be1SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b=(Mat_SeqAIJ*)B->data; 783f457be1SHong Zhang Mat C; 793f457be1SHong Zhang 803f457be1SHong Zhang PetscInt nleftover,np_subcomm,j; 813f457be1SHong Zhang PetscInt nz_A,nz_B,*sbuf_j; 823f457be1SHong Zhang PetscScalar *sbuf_a; 833f457be1SHong Zhang PetscInt cstart=mat->cmap.rstart,cend=mat->cmap.rend,row,nzA,nzB,ncols,*cworkA,*cworkB; 843f457be1SHong Zhang PetscInt rstart=mat->rmap.rstart,rend=mat->rmap.rend,*bmap=aij->garray,M,N; 853f457be1SHong Zhang PetscInt *cols,ctmp,lwrite,*rptr,l; 863f457be1SHong Zhang PetscScalar *vals,*aworkA,*aworkB; 873f457be1SHong Zhang PetscMPIInt tag1,tag2,tag3,imdex; 883f457be1SHong Zhang MPI_Request *s_waits1,*s_waits2,*s_waits3,*r_waits1,*r_waits2,*r_waits3; 893f457be1SHong Zhang MPI_Status recv_status,*send_status; 903f457be1SHong Zhang PetscInt *sbuf_nz,*rbuf_nz,count; 913f457be1SHong Zhang PetscInt **rbuf_j; 923f457be1SHong Zhang PetscScalar **rbuf_a; 933f457be1SHong Zhang 943f457be1SHong Zhang PetscFunctionBegin; 953f457be1SHong Zhang ierr = PetscOptionsGetInt(PETSC_NULL,"-prid",&prid,PETSC_NULL);CHKERRQ(ierr); 963f457be1SHong Zhang ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 973f457be1SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 983f457be1SHong Zhang ierr = MPI_Comm_rank(subcomm,&subrank);CHKERRQ(ierr); 993f457be1SHong Zhang ierr = MPI_Comm_size(subcomm,&subsize);CHKERRQ(ierr); 1003f457be1SHong Zhang /* 1013f457be1SHong Zhang ierr = PetscSynchronizedPrintf(comm, "[%d] subrank %d, subsize %d\n",rank,subrank,subsize); 1023f457be1SHong Zhang ierr = PetscSynchronizedFlush(comm);CHKERRQ(ierr); 1033f457be1SHong Zhang */ 1043f457be1SHong Zhang /* get the destination processors */ 1053f457be1SHong Zhang ierr = PetscMalloc((2*size+1)*sizeof(PetscMPIInt),&send_rank); 1063f457be1SHong Zhang recv_rank = send_rank + size; 1073f457be1SHong Zhang np_subcomm = size/nsubcomm; 1083f457be1SHong Zhang nleftover = size - nsubcomm*np_subcomm; 1093f457be1SHong Zhang nsends = 0; nrecvs = 0; 1103f457be1SHong Zhang for (i=0; i<size; i++){ /* i=rank*/ 1113f457be1SHong Zhang if (subrank == i/nsubcomm && rank != i){ /* my_subrank == other's subrank */ 1123f457be1SHong Zhang send_rank[nsends] = i; nsends++; 1133f457be1SHong Zhang recv_rank[nrecvs++] = i; 1143f457be1SHong Zhang } 1153f457be1SHong Zhang } 1163f457be1SHong Zhang if (rank >= size - nleftover){/* this proc is a leftover processor */ 1173f457be1SHong Zhang i = size-nleftover-1; 1183f457be1SHong Zhang j = 0; 1193f457be1SHong Zhang while (j < nsubcomm - nleftover){ 1203f457be1SHong Zhang send_rank[nsends++] = i; 1213f457be1SHong Zhang i--; j++; 1223f457be1SHong Zhang } 1233f457be1SHong Zhang } 1243f457be1SHong Zhang 1253f457be1SHong Zhang if (nleftover && subsize == size/nsubcomm && subrank==subsize-1){ /* this proc recvs from leftover processors */ 1263f457be1SHong Zhang for (i=0; i<nleftover; i++){ 1273f457be1SHong Zhang recv_rank[nrecvs++] = size-nleftover+i; 1283f457be1SHong Zhang } 1293f457be1SHong Zhang } 1303f457be1SHong Zhang if (prid == rank){ 1313f457be1SHong Zhang printf("[%d] sends to ",rank); 1323f457be1SHong Zhang for (i=0; i<nsends; i++) printf(" [%d],",send_rank[i]); 1333f457be1SHong Zhang printf(" \n"); 1343f457be1SHong Zhang } 1353f457be1SHong Zhang /* 1363f457be1SHong Zhang ierr = PetscSynchronizedPrintf(comm, "[%d] nsends %d, nrecvs %d\n",rank,nsends,nrecvs); 1373f457be1SHong Zhang ierr = PetscSynchronizedFlush(comm);CHKERRQ(ierr); 1383f457be1SHong Zhang ierr = MPI_Barrier(comm);CHKERRQ(ierr); 1393f457be1SHong Zhang */ 1403f457be1SHong Zhang 1413f457be1SHong Zhang /* get this processor's nzlocal=nz_A+nz_B */ 1423f457be1SHong Zhang nz_A = a->nz; nz_B = b->nz; 1433f457be1SHong Zhang nzlocal = nz_A + nz_B; 1443f457be1SHong Zhang 1453f457be1SHong Zhang /* allocate sbuf_j, sbuf_a, then copy mat's local entries into the buffers */ 1463f457be1SHong Zhang itmp = nzlocal + rowrange[rank+1] - rowrange[rank] + 2; 1473f457be1SHong Zhang ierr = PetscMalloc(itmp*sizeof(PetscInt),&sbuf_j);CHKERRQ(ierr); 1483f457be1SHong Zhang ierr = PetscMalloc((nzlocal+1)*sizeof(PetscScalar),&sbuf_a);CHKERRQ(ierr); 1493f457be1SHong Zhang 1503f457be1SHong Zhang rptr = sbuf_j; 1513f457be1SHong Zhang cols = sbuf_j + rend-rstart + 1; 1523f457be1SHong Zhang vals = sbuf_a; 1533f457be1SHong Zhang rptr[0] = 0; 1543f457be1SHong Zhang for (i=0; i<rend-rstart; i++){ 1553f457be1SHong Zhang row = i + rstart; 1563f457be1SHong Zhang nzA = a->i[i+1] - a->i[i]; nzB = b->i[i+1] - b->i[i]; 1573f457be1SHong Zhang ncols = nzA + nzB; 1583f457be1SHong Zhang cworkA = a->j + a->i[i]; cworkB = b->j + b->i[i]; 1593f457be1SHong Zhang aworkA = a->a + a->i[i]; aworkB = b->a + b->i[i]; 1603f457be1SHong Zhang /* load the column indices for this row into cols */ 1613f457be1SHong Zhang lwrite = 0; 1623f457be1SHong Zhang for (l=0; l<nzB; l++) { 1633f457be1SHong Zhang if ((ctmp = bmap[cworkB[l]]) < cstart){ 1643f457be1SHong Zhang vals[lwrite] = aworkB[l]; 1653f457be1SHong Zhang cols[lwrite++] = ctmp; 1663f457be1SHong Zhang } 1673f457be1SHong Zhang } 1683f457be1SHong Zhang for (l=0; l<nzA; l++){ 1693f457be1SHong Zhang vals[lwrite] = aworkA[l]; 1703f457be1SHong Zhang cols[lwrite++] = cstart + cworkA[l]; 1713f457be1SHong Zhang } 1723f457be1SHong Zhang for (l=0; l<nzB; l++) { 1733f457be1SHong Zhang if ((ctmp = bmap[cworkB[l]]) >= cend){ 1743f457be1SHong Zhang vals[lwrite] = aworkB[l]; 1753f457be1SHong Zhang cols[lwrite++] = ctmp; 1763f457be1SHong Zhang } 1773f457be1SHong Zhang } 1783f457be1SHong Zhang /* insert local matrix values into C */ 179ca616198SHong Zhang /* ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); */ 1803f457be1SHong Zhang 1813f457be1SHong Zhang vals += ncols; 1823f457be1SHong Zhang cols += ncols; 1833f457be1SHong Zhang rptr[i+1] = rptr[i] + ncols; 1843f457be1SHong Zhang } 1853f457be1SHong Zhang /* 1863f457be1SHong Zhang ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1873f457be1SHong Zhang ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1883f457be1SHong Zhang */ 1893f457be1SHong Zhang if (rptr[rend-rstart] != a->nz + b->nz) SETERRQ4(1, "rptr[%d] %d != %d + %d",rend-rstart,rptr[rend-rstart+1],a->nz,b->nz); 1903f457be1SHong Zhang 1913f457be1SHong Zhang /* send nzlocal to others, and recv other's nzlocal */ 1923f457be1SHong Zhang /*--------------------------------------------------*/ 1933f457be1SHong Zhang ierr = PetscMalloc3(nsends+nrecvs+1,PetscInt,&sbuf_nz,nrecvs,PetscInt*,&rbuf_j,nrecvs,PetscScalar*,&rbuf_a);CHKERRQ(ierr); 1943f457be1SHong Zhang rbuf_nz = sbuf_nz + nsends; 1953f457be1SHong Zhang 1963f457be1SHong Zhang ierr = PetscMalloc2(3*(nsends + nrecvs)+1,MPI_Request,&s_waits1,nsends+1,MPI_Status,&send_status);CHKERRQ(ierr); 1973f457be1SHong Zhang s_waits2 = s_waits1 + nsends; 1983f457be1SHong Zhang s_waits3 = s_waits2 + nsends; 1993f457be1SHong Zhang r_waits1 = s_waits3 + nsends; 2003f457be1SHong Zhang r_waits2 = r_waits1 + nrecvs; 2013f457be1SHong Zhang r_waits3 = r_waits2 + nrecvs; 2023f457be1SHong Zhang 2033f457be1SHong Zhang /* get some new tags to keep the communication clean */ 2043f457be1SHong Zhang ierr = PetscObjectGetNewTag((PetscObject)A,&tag1);CHKERRQ(ierr); 2053f457be1SHong Zhang ierr = PetscObjectGetNewTag((PetscObject)A,&tag2);CHKERRQ(ierr); 2063f457be1SHong Zhang ierr = PetscObjectGetNewTag((PetscObject)A,&tag3);CHKERRQ(ierr); 2073f457be1SHong Zhang 2083f457be1SHong Zhang /* post receives of other's nzlocal */ 2093f457be1SHong Zhang for (i=0; i<nrecvs; i++){ 2103f457be1SHong Zhang ierr = MPI_Irecv(rbuf_nz+i,1,MPIU_INT,MPI_ANY_SOURCE,tag1,comm,r_waits1+i);CHKERRQ(ierr); 2113f457be1SHong Zhang } 2123f457be1SHong Zhang 2133f457be1SHong Zhang /* send nzlocal to others */ 2143f457be1SHong Zhang for (i=0; i<nsends; i++){ 2153f457be1SHong Zhang sbuf_nz[i] = nzlocal; 2163f457be1SHong Zhang ierr = MPI_Isend(sbuf_nz+i,1,MPIU_INT,send_rank[i],tag1,comm,s_waits1+i);CHKERRQ(ierr); 2173f457be1SHong Zhang if (prid == rank) printf(" [%d] sends nz %d to [%d]\n",rank,nzlocal,send_rank[i]); 2183f457be1SHong Zhang } 2193f457be1SHong Zhang 2203f457be1SHong Zhang /* wait on receives of nzlocal; allocate space for rbuf_j, rbuf_a */ 2213f457be1SHong Zhang count = nrecvs; 2223f457be1SHong Zhang while (count) { 2233f457be1SHong Zhang ierr = MPI_Waitany(nrecvs,r_waits1,&imdex,&recv_status);CHKERRQ(ierr); 2243f457be1SHong Zhang recv_rank[imdex] = recv_status.MPI_SOURCE; 2253f457be1SHong Zhang /* allocate rbuf_a and rbuf_j; then post receives of rbuf_a and rbuf_j */ 2263f457be1SHong Zhang ierr = PetscMalloc((rbuf_nz[imdex]+1)*sizeof(PetscScalar),&rbuf_a[imdex]);CHKERRQ(ierr); 2273f457be1SHong Zhang ierr = MPI_Irecv(rbuf_a[imdex],rbuf_nz[imdex],MPIU_SCALAR,recv_status.MPI_SOURCE,tag3,comm,r_waits3+imdex);CHKERRQ(ierr); 2283f457be1SHong Zhang 2293f457be1SHong Zhang itmp = rowrange[recv_status.MPI_SOURCE+1] - rowrange[recv_status.MPI_SOURCE]; /* number of expected mat->i */ 2303f457be1SHong Zhang rbuf_nz[imdex] += itmp+2; 2313f457be1SHong Zhang ierr = PetscMalloc(rbuf_nz[imdex]*sizeof(PetscInt),&rbuf_j[imdex]);CHKERRQ(ierr); 2323f457be1SHong Zhang ierr = MPI_Irecv(rbuf_j[imdex],rbuf_nz[imdex],MPIU_INT,recv_status.MPI_SOURCE,tag2,comm,r_waits2+imdex);CHKERRQ(ierr); 2333f457be1SHong Zhang count--; 2343f457be1SHong Zhang } 2353f457be1SHong Zhang 2363f457be1SHong Zhang /* wait on sends of nzlocal */ 2373f457be1SHong Zhang if (nsends) {ierr = MPI_Waitall(nsends,s_waits1,send_status);CHKERRQ(ierr);} 2383f457be1SHong Zhang 2393f457be1SHong Zhang /* send mat->i,j and mat->a to others, and recv from other's */ 2403f457be1SHong Zhang /*-----------------------------------------------------------*/ 2413f457be1SHong Zhang for (i=0; i<nsends; i++){ 2423f457be1SHong Zhang ierr = MPI_Isend(sbuf_a,nzlocal,MPIU_SCALAR,send_rank[i],tag3,comm,s_waits3+i);CHKERRQ(ierr); 2433f457be1SHong Zhang itmp = nzlocal + rowrange[rank+1] - rowrange[rank] + 1; 2443f457be1SHong Zhang ierr = MPI_Isend(sbuf_j,itmp,MPIU_INT,send_rank[i],tag2,comm,s_waits2+i);CHKERRQ(ierr); 2453f457be1SHong Zhang } 2463f457be1SHong Zhang 2473f457be1SHong Zhang /* wait on receives of mat->i,j and mat->a */ 2483f457be1SHong Zhang /*-----------------------------------------*/ 2493f457be1SHong Zhang count = nrecvs; 2503f457be1SHong Zhang while (count) { 2513f457be1SHong Zhang ierr = MPI_Waitany(nrecvs,r_waits3,&imdex,&recv_status);CHKERRQ(ierr); 2523f457be1SHong Zhang if (recv_rank[imdex] != recv_status.MPI_SOURCE) SETERRQ2(1, "recv_rank %d != MPI_SOURCE %d",recv_rank[imdex],recv_status.MPI_SOURCE); 2533f457be1SHong Zhang ierr = MPI_Waitany(nrecvs,r_waits2,&imdex,&recv_status);CHKERRQ(ierr); 2543f457be1SHong Zhang count--; 2553f457be1SHong Zhang } 2563f457be1SHong Zhang 2573f457be1SHong Zhang /* wait on sends of mat->i,j and mat->a */ 2583f457be1SHong Zhang /*--------------------------------------*/ 2593f457be1SHong Zhang if (nsends) { 2603f457be1SHong Zhang ierr = MPI_Waitall(nsends,s_waits3,send_status);CHKERRQ(ierr); 2613f457be1SHong Zhang ierr = MPI_Waitall(nsends,s_waits2,send_status);CHKERRQ(ierr); 2623f457be1SHong Zhang } 2633f457be1SHong Zhang ierr = PetscFree(sbuf_nz);CHKERRQ(ierr); 2643f457be1SHong Zhang ierr = PetscFree2(s_waits1,send_status);CHKERRQ(ierr); 2653f457be1SHong Zhang 2663f457be1SHong Zhang /* create redundant matrix */ 2673f457be1SHong Zhang /*-------------------------*/ 2683f457be1SHong Zhang ierr = MatCreate(subcomm,&C);CHKERRQ(ierr); 2693f457be1SHong Zhang ierr = MatSetSizes(C,mlocal_sub,mlocal_sub,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 2703f457be1SHong Zhang ierr = MatSetFromOptions(C);CHKERRQ(ierr); 2713f457be1SHong Zhang 2723f457be1SHong Zhang /* insert local matrix entries */ 2733f457be1SHong Zhang rptr = sbuf_j; 2743f457be1SHong Zhang cols = sbuf_j + rend-rstart + 1; 2753f457be1SHong Zhang vals = sbuf_a; 2763f457be1SHong Zhang for (i=0; i<rend-rstart; i++){ 2773f457be1SHong Zhang row = i + rstart; 2783f457be1SHong Zhang ncols = rptr[i+1] - rptr[i]; 2793f457be1SHong Zhang ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 2803f457be1SHong Zhang vals += ncols; 2813f457be1SHong Zhang cols += ncols; 2823f457be1SHong Zhang } 2833f457be1SHong Zhang /* insert received matrix entries */ 2843f457be1SHong Zhang for (imdex=0; imdex<nrecvs; imdex++){ 2853f457be1SHong Zhang 2863f457be1SHong Zhang rstart = rowrange[recv_rank[imdex]]; 2873f457be1SHong Zhang rend = rowrange[recv_rank[imdex]+1]; 2883f457be1SHong Zhang rptr = rbuf_j[imdex]; 2893f457be1SHong Zhang cols = rbuf_j[imdex] + rend-rstart + 1; 2903f457be1SHong Zhang vals = rbuf_a[imdex]; 2913f457be1SHong Zhang for (i=0; i<rend-rstart; i++){ 2923f457be1SHong Zhang row = i + rstart; 2933f457be1SHong Zhang ncols = rptr[i+1] - rptr[i]; 2943f457be1SHong Zhang ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 2953f457be1SHong Zhang vals += ncols; 2963f457be1SHong Zhang cols += ncols; 2973f457be1SHong Zhang } 2983f457be1SHong Zhang } 2993f457be1SHong Zhang ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3003f457be1SHong Zhang ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3013f457be1SHong Zhang ierr = MatGetSize(C,&M,&N);CHKERRQ(ierr); 3023f457be1SHong Zhang if (M != mat->rmap.N || N != mat->cmap.N) SETERRQ2(PETSC_ERR_ARG_INCOMP,"redundant mat size %d != input mat size %d",M,mat->rmap.N); 3033f457be1SHong Zhang *matredundant = C; 3043f457be1SHong Zhang 3053f457be1SHong Zhang /* free space */ 3063f457be1SHong Zhang ierr = PetscFree(send_rank);CHKERRQ(ierr); 3073f457be1SHong Zhang ierr = PetscFree(sbuf_j);CHKERRQ(ierr); 3083f457be1SHong Zhang ierr = PetscFree(sbuf_a);CHKERRQ(ierr); 3093f457be1SHong Zhang for (i=0; i<nrecvs; i++){ 3103f457be1SHong Zhang ierr = PetscFree(rbuf_j[i]);CHKERRQ(ierr); 3113f457be1SHong Zhang ierr = PetscFree(rbuf_a[i]);CHKERRQ(ierr); 3123f457be1SHong Zhang } 3133f457be1SHong Zhang ierr = PetscFree3(sbuf_nz,rbuf_j,rbuf_a);CHKERRQ(ierr); 3143f457be1SHong Zhang PetscFunctionReturn(0); 3153f457be1SHong Zhang } 3163f457be1SHong Zhang 3174b9ad928SBarry Smith #undef __FUNCT__ 3184b9ad928SBarry Smith #define __FUNCT__ "PCSetUp_Redundant" 3196849ba73SBarry Smith static PetscErrorCode PCSetUp_Redundant(PC pc) 3204b9ad928SBarry Smith { 3214b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 322dfbe8321SBarry Smith PetscErrorCode ierr; 3233f457be1SHong Zhang PetscInt mstart,mend,mlocal,m; 32413f74950SBarry Smith PetscMPIInt size; 3254b9ad928SBarry Smith IS isl; 3264b9ad928SBarry Smith MatReuse reuse = MAT_INITIAL_MATRIX; 3274b9ad928SBarry Smith MatStructure str = DIFFERENT_NONZERO_PATTERN; 3284b9ad928SBarry Smith MPI_Comm comm; 32923ce1328SBarry Smith Vec vec; 3304b9ad928SBarry Smith 3313f457be1SHong Zhang PetscInt mlocal_sub; 3323f457be1SHong Zhang PetscMPIInt subsize,subrank; 3333f457be1SHong Zhang PetscInt rstart_sub,rend_sub,mloc_sub; 3343f457be1SHong Zhang Mat Aredundant; 3353f457be1SHong Zhang 3364b9ad928SBarry Smith PetscFunctionBegin; 3373f457be1SHong Zhang ierr = PetscObjectGetComm((PetscObject)pc->pmat,&comm);CHKERRQ(ierr); 33823ce1328SBarry Smith ierr = MatGetVecs(pc->pmat,&vec,0);CHKERRQ(ierr); 3394b9ad928SBarry Smith ierr = PCSetFromOptions(red->pc);CHKERRQ(ierr); 34023ce1328SBarry Smith ierr = VecGetSize(vec,&m);CHKERRQ(ierr); 3414b9ad928SBarry Smith if (!pc->setupcalled) { 3423f457be1SHong Zhang /* create working vectors xsub/ysub and xdup/ydup */ 34323ce1328SBarry Smith ierr = VecGetLocalSize(vec,&mlocal);CHKERRQ(ierr); 3443f457be1SHong Zhang ierr = VecGetOwnershipRange(vec,&mstart,&mend);CHKERRQ(ierr); 3454b9ad928SBarry Smith 3463f457be1SHong Zhang /* get local size of xsub/ysub */ 3473f457be1SHong Zhang ierr = MPI_Comm_size(red->subcomm,&subsize);CHKERRQ(ierr); 3483f457be1SHong Zhang ierr = MPI_Comm_rank(red->subcomm,&subrank);CHKERRQ(ierr); 3493f457be1SHong Zhang rstart_sub = pc->pmat->rmap.range[red->nsubcomm*subrank]; /* rstart in xsub/ysub */ 3503f457be1SHong Zhang if (subrank+1 < subsize){ 3513f457be1SHong Zhang rend_sub = pc->pmat->rmap.range[red->nsubcomm*(subrank+1)]; 3523f457be1SHong Zhang } else { 3533f457be1SHong Zhang rend_sub = m; 3543f457be1SHong Zhang } 3553f457be1SHong Zhang mloc_sub = rend_sub - rstart_sub; 3563f457be1SHong Zhang ierr = VecCreateMPI(red->subcomm,mloc_sub,PETSC_DECIDE,&red->ysub);CHKERRQ(ierr); 3573f457be1SHong Zhang /* create xsub with empty local arrays, because xdup's arrays will be placed into it */ 3583f457be1SHong Zhang ierr = VecCreateMPIWithArray(red->subcomm,mloc_sub,PETSC_DECIDE,PETSC_NULL,&red->xsub);CHKERRQ(ierr); 3593f457be1SHong Zhang 3603f457be1SHong Zhang /* create xdup and ydup. ydup has empty local arrays because ysub's arrays will be place into it. 3613f457be1SHong Zhang Note: we use communicator dupcomm, not pc->comm! */ 3623f457be1SHong Zhang ierr = VecCreateMPI(red->dupcomm,mloc_sub,PETSC_DECIDE,&red->xdup);CHKERRQ(ierr); 3633f457be1SHong Zhang ierr = VecCreateMPIWithArray(red->dupcomm,mloc_sub,PETSC_DECIDE,PETSC_NULL,&red->ydup);CHKERRQ(ierr); 3643f457be1SHong Zhang 3653f457be1SHong Zhang /* create vec scatters */ 3663f457be1SHong Zhang if (!red->scatterin){ 3673f457be1SHong Zhang IS is1,is2; 3683f457be1SHong Zhang PetscInt *idx1,*idx2,i,j,k; 3693f457be1SHong Zhang ierr = PetscMalloc(2*red->nsubcomm*mlocal*sizeof(PetscInt),&idx1);CHKERRQ(ierr); 3703f457be1SHong Zhang idx2 = idx1 + red->nsubcomm*mlocal; 3713f457be1SHong Zhang j = 0; 3723f457be1SHong Zhang for (k=0; k<red->nsubcomm; k++){ 3733f457be1SHong Zhang for (i=mstart; i<mend; i++){ 3743f457be1SHong Zhang idx1[j] = i; 3753f457be1SHong Zhang idx2[j++] = i + m*k; 3763f457be1SHong Zhang } 3773f457be1SHong Zhang } 3783f457be1SHong Zhang ierr = ISCreateGeneral(comm,red->nsubcomm*mlocal,idx1,&is1);CHKERRQ(ierr); 3793f457be1SHong Zhang ierr = ISCreateGeneral(comm,red->nsubcomm*mlocal,idx2,&is2);CHKERRQ(ierr); 3803f457be1SHong Zhang ierr = VecScatterCreate(vec,is1,red->xdup,is2,&red->scatterin);CHKERRQ(ierr); 3813f457be1SHong Zhang ierr = ISDestroy(is1);CHKERRQ(ierr); 3823f457be1SHong Zhang ierr = ISDestroy(is2);CHKERRQ(ierr); 3833f457be1SHong Zhang 3843f457be1SHong Zhang ierr = ISCreateStride(comm,mlocal,mstart+ red->color*m,1,&is1);CHKERRQ(ierr); 3853f457be1SHong Zhang ierr = ISCreateStride(comm,mlocal,mstart,1,&is2);CHKERRQ(ierr); 3863f457be1SHong Zhang ierr = VecScatterCreate(red->xdup,is1,vec,is2,&red->scatterout);CHKERRQ(ierr); 3873f457be1SHong Zhang ierr = ISDestroy(is1);CHKERRQ(ierr); 3883f457be1SHong Zhang ierr = ISDestroy(is2);CHKERRQ(ierr); 3893f457be1SHong Zhang ierr = PetscFree(idx1);CHKERRQ(ierr); 3904b9ad928SBarry Smith } 3914b9ad928SBarry Smith } 39223ce1328SBarry Smith ierr = VecDestroy(vec);CHKERRQ(ierr); 3934b9ad928SBarry Smith 3944b9ad928SBarry Smith /* if pmatrix set by user is sequential then we do not need to gather the parallel matrix */ 3953f457be1SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 3964b9ad928SBarry Smith if (size == 1) { 3974b9ad928SBarry Smith red->useparallelmat = PETSC_FALSE; 3984b9ad928SBarry Smith } 3994b9ad928SBarry Smith 4004b9ad928SBarry Smith if (red->useparallelmat) { 4014b9ad928SBarry Smith if (pc->setupcalled == 1 && pc->flag == DIFFERENT_NONZERO_PATTERN) { 4024b9ad928SBarry Smith /* destroy old matrices */ 4034b9ad928SBarry Smith if (red->pmats) { 4044b9ad928SBarry Smith ierr = MatDestroyMatrices(1,&red->pmats);CHKERRQ(ierr); 4054b9ad928SBarry Smith } 4064b9ad928SBarry Smith } else if (pc->setupcalled == 1) { 4074b9ad928SBarry Smith reuse = MAT_REUSE_MATRIX; 4084b9ad928SBarry Smith str = SAME_NONZERO_PATTERN; 4094b9ad928SBarry Smith } 4104b9ad928SBarry Smith 4113f457be1SHong Zhang /* grab the parallel matrix and put it into processors of a subcomminicator */ 412*f664ae05SHong Zhang /*--------------------------------------------------------------------------*/ 413*f664ae05SHong Zhang if (red->nsubcomm == size){ 414*f664ae05SHong Zhang /* create sequential matrices in each processor */ 4154b9ad928SBarry Smith ierr = ISCreateStride(PETSC_COMM_SELF,m,0,1,&isl);CHKERRQ(ierr); 4164b9ad928SBarry Smith ierr = MatGetSubMatrices(pc->pmat,1,&isl,&isl,reuse,&red->pmats);CHKERRQ(ierr); 4174b9ad928SBarry Smith ierr = ISDestroy(isl);CHKERRQ(ierr); 418*f664ae05SHong Zhang ierr = PCSetOperators(red->pc,red->pmats[0],red->pmats[0],str);CHKERRQ(ierr); 419*f664ae05SHong Zhang } else { 420*f664ae05SHong Zhang /* create mpi matrices in each subcommunicator */ 421*f664ae05SHong Zhang ierr = VecGetLocalSize(red->ysub,&mlocal_sub);CHKERRQ(ierr); 422*f664ae05SHong Zhang ierr = MatGetRedundantMatrix_AIJ(pc->pmat,red->nsubcomm,red->subcomm,mlocal_sub,reuse,&Aredundant);CHKERRQ(ierr); 4233f457be1SHong Zhang red->pmats_sub = Aredundant; 4243f457be1SHong Zhang /* tell PC of the subcommunicator its operators */ 425*f664ae05SHong Zhang ierr = PCSetOperators(red->pc,Aredundant,Aredundant,str);CHKERRQ(ierr); 426*f664ae05SHong Zhang } 4274b9ad928SBarry Smith } else { 4284b9ad928SBarry Smith ierr = PCSetOperators(red->pc,pc->mat,pc->pmat,pc->flag);CHKERRQ(ierr); 4294b9ad928SBarry Smith } 4304b9ad928SBarry Smith ierr = PCSetFromOptions(red->pc);CHKERRQ(ierr); 4314b9ad928SBarry Smith ierr = PCSetUp(red->pc);CHKERRQ(ierr); 4324b9ad928SBarry Smith PetscFunctionReturn(0); 4334b9ad928SBarry Smith } 4344b9ad928SBarry Smith 4354b9ad928SBarry Smith #undef __FUNCT__ 4364b9ad928SBarry Smith #define __FUNCT__ "PCApply_Redundant" 4376849ba73SBarry Smith static PetscErrorCode PCApply_Redundant(PC pc,Vec x,Vec y) 4384b9ad928SBarry Smith { 4394b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 440dfbe8321SBarry Smith PetscErrorCode ierr; 4413f457be1SHong Zhang PetscScalar *array; 4424b9ad928SBarry Smith 4434b9ad928SBarry Smith PetscFunctionBegin; 4443f457be1SHong Zhang /* scatter x to xdup */ 4453f457be1SHong Zhang ierr = VecScatterBegin(x,red->xdup,INSERT_VALUES,SCATTER_FORWARD,red->scatterin);CHKERRQ(ierr); 4463f457be1SHong Zhang ierr = VecScatterEnd(x,red->xdup,INSERT_VALUES,SCATTER_FORWARD,red->scatterin);CHKERRQ(ierr); 4473f457be1SHong Zhang 4483f457be1SHong Zhang /* place xdup's local array into xsub */ 4493f457be1SHong Zhang ierr = VecGetArray(red->xdup,&array);CHKERRQ(ierr); 4503f457be1SHong Zhang ierr = VecPlaceArray(red->xsub,(const PetscScalar*)array);CHKERRQ(ierr); 4514b9ad928SBarry Smith 4524b9ad928SBarry Smith /* apply preconditioner on each processor */ 4533f457be1SHong Zhang ierr = PCApply(red->pc,red->xsub,red->ysub);CHKERRQ(ierr); 4543f457be1SHong Zhang ierr = VecResetArray(red->xsub);CHKERRQ(ierr); 4553f457be1SHong Zhang ierr = VecRestoreArray(red->xdup,&array);CHKERRQ(ierr); 4564b9ad928SBarry Smith 4573f457be1SHong Zhang /* place ysub's local array into ydup */ 4583f457be1SHong Zhang ierr = VecGetArray(red->ysub,&array);CHKERRQ(ierr); 4593f457be1SHong Zhang ierr = VecPlaceArray(red->ydup,(const PetscScalar*)array);CHKERRQ(ierr); 4603f457be1SHong Zhang 4613f457be1SHong Zhang /* scatter ydup to y */ 4623f457be1SHong Zhang ierr = VecScatterBegin(red->ydup,y,INSERT_VALUES,SCATTER_FORWARD,red->scatterout);CHKERRQ(ierr); 4633f457be1SHong Zhang ierr = VecScatterEnd(red->ydup,y,INSERT_VALUES,SCATTER_FORWARD,red->scatterout);CHKERRQ(ierr); 4643f457be1SHong Zhang ierr = VecResetArray(red->ydup);CHKERRQ(ierr); 4653f457be1SHong Zhang ierr = VecRestoreArray(red->ysub,&array);CHKERRQ(ierr); 4664b9ad928SBarry Smith PetscFunctionReturn(0); 4674b9ad928SBarry Smith } 4684b9ad928SBarry Smith 4694b9ad928SBarry Smith #undef __FUNCT__ 4704b9ad928SBarry Smith #define __FUNCT__ "PCDestroy_Redundant" 4716849ba73SBarry Smith static PetscErrorCode PCDestroy_Redundant(PC pc) 4724b9ad928SBarry Smith { 4734b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 474dfbe8321SBarry Smith PetscErrorCode ierr; 4754b9ad928SBarry Smith 4764b9ad928SBarry Smith PetscFunctionBegin; 4774b9ad928SBarry Smith if (red->scatterin) {ierr = VecScatterDestroy(red->scatterin);CHKERRQ(ierr);} 4784b9ad928SBarry Smith if (red->scatterout) {ierr = VecScatterDestroy(red->scatterout);CHKERRQ(ierr);} 4793f457be1SHong Zhang if (red->ysub) {ierr = VecDestroy(red->ysub);CHKERRQ(ierr);} 4803f457be1SHong Zhang if (red->xsub) {ierr = VecDestroy(red->xsub);CHKERRQ(ierr);} 4813f457be1SHong Zhang if (red->xdup) {ierr = VecDestroy(red->xdup);CHKERRQ(ierr);} 4823f457be1SHong Zhang if (red->ydup) {ierr = VecDestroy(red->ydup);CHKERRQ(ierr);} 4833f457be1SHong Zhang if (red->pmats_sub) { 4843f457be1SHong Zhang ierr = MatDestroy(red->pmats_sub);CHKERRQ(ierr); 4853f457be1SHong Zhang } 4863f457be1SHong Zhang 4874b9ad928SBarry Smith if (red->pmats) { 4884b9ad928SBarry Smith ierr = MatDestroyMatrices(1,&red->pmats);CHKERRQ(ierr); 4894b9ad928SBarry Smith } 4904b9ad928SBarry Smith ierr = PCDestroy(red->pc);CHKERRQ(ierr); 4914b9ad928SBarry Smith ierr = PetscFree(red);CHKERRQ(ierr); 4924b9ad928SBarry Smith PetscFunctionReturn(0); 4934b9ad928SBarry Smith } 4944b9ad928SBarry Smith 4954b9ad928SBarry Smith #undef __FUNCT__ 4964b9ad928SBarry Smith #define __FUNCT__ "PCSetFromOptions_Redundant" 4976849ba73SBarry Smith static PetscErrorCode PCSetFromOptions_Redundant(PC pc) 4984b9ad928SBarry Smith { 4994b9ad928SBarry Smith PetscFunctionBegin; 5004b9ad928SBarry Smith PetscFunctionReturn(0); 5014b9ad928SBarry Smith } 5024b9ad928SBarry Smith 5034b9ad928SBarry Smith EXTERN_C_BEGIN 5044b9ad928SBarry Smith #undef __FUNCT__ 5054b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter_Redundant" 506dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantSetScatter_Redundant(PC pc,VecScatter in,VecScatter out) 5074b9ad928SBarry Smith { 5084b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 509dfbe8321SBarry Smith PetscErrorCode ierr; 5104b9ad928SBarry Smith 5114b9ad928SBarry Smith PetscFunctionBegin; 5124b9ad928SBarry Smith red->scatterin = in; 5134b9ad928SBarry Smith red->scatterout = out; 5144b9ad928SBarry Smith ierr = PetscObjectReference((PetscObject)in);CHKERRQ(ierr); 5154b9ad928SBarry Smith ierr = PetscObjectReference((PetscObject)out);CHKERRQ(ierr); 5164b9ad928SBarry Smith PetscFunctionReturn(0); 5174b9ad928SBarry Smith } 5184b9ad928SBarry Smith EXTERN_C_END 5194b9ad928SBarry Smith 5204b9ad928SBarry Smith #undef __FUNCT__ 5214b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter" 5224b9ad928SBarry Smith /*@ 5234b9ad928SBarry Smith PCRedundantSetScatter - Sets the scatter used to copy values into the 5244b9ad928SBarry Smith redundant local solve and the scatter to move them back into the global 5254b9ad928SBarry Smith vector. 5264b9ad928SBarry Smith 5274b9ad928SBarry Smith Collective on PC 5284b9ad928SBarry Smith 5294b9ad928SBarry Smith Input Parameters: 5304b9ad928SBarry Smith + pc - the preconditioner context 5314b9ad928SBarry Smith . in - the scatter to move the values in 5324b9ad928SBarry Smith - out - the scatter to move them out 5334b9ad928SBarry Smith 5344b9ad928SBarry Smith Level: advanced 5354b9ad928SBarry Smith 5364b9ad928SBarry Smith .keywords: PC, redundant solve 5374b9ad928SBarry Smith @*/ 538dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantSetScatter(PC pc,VecScatter in,VecScatter out) 5394b9ad928SBarry Smith { 540dfbe8321SBarry Smith PetscErrorCode ierr,(*f)(PC,VecScatter,VecScatter); 5414b9ad928SBarry Smith 5424b9ad928SBarry Smith PetscFunctionBegin; 5434482741eSBarry Smith PetscValidHeaderSpecific(pc,PC_COOKIE,1); 5444482741eSBarry Smith PetscValidHeaderSpecific(in,VEC_SCATTER_COOKIE,2); 5454482741eSBarry Smith PetscValidHeaderSpecific(out,VEC_SCATTER_COOKIE,3); 5464b9ad928SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantSetScatter_C",(void (**)(void))&f);CHKERRQ(ierr); 5474b9ad928SBarry Smith if (f) { 5484b9ad928SBarry Smith ierr = (*f)(pc,in,out);CHKERRQ(ierr); 5494b9ad928SBarry Smith } 5504b9ad928SBarry Smith PetscFunctionReturn(0); 5514b9ad928SBarry Smith } 5524b9ad928SBarry Smith 5534b9ad928SBarry Smith EXTERN_C_BEGIN 5544b9ad928SBarry Smith #undef __FUNCT__ 5554b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetPC_Redundant" 556dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetPC_Redundant(PC pc,PC *innerpc) 5574b9ad928SBarry Smith { 5584b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 5594b9ad928SBarry Smith 5604b9ad928SBarry Smith PetscFunctionBegin; 5614b9ad928SBarry Smith *innerpc = red->pc; 5624b9ad928SBarry Smith PetscFunctionReturn(0); 5634b9ad928SBarry Smith } 5644b9ad928SBarry Smith EXTERN_C_END 5654b9ad928SBarry Smith 5664b9ad928SBarry Smith #undef __FUNCT__ 5674b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetPC" 5684b9ad928SBarry Smith /*@ 5694b9ad928SBarry Smith PCRedundantGetPC - Gets the sequential PC created by the redundant PC. 5704b9ad928SBarry Smith 5714b9ad928SBarry Smith Not Collective 5724b9ad928SBarry Smith 5734b9ad928SBarry Smith Input Parameter: 5744b9ad928SBarry Smith . pc - the preconditioner context 5754b9ad928SBarry Smith 5764b9ad928SBarry Smith Output Parameter: 5774b9ad928SBarry Smith . innerpc - the sequential PC 5784b9ad928SBarry Smith 5794b9ad928SBarry Smith Level: advanced 5804b9ad928SBarry Smith 5814b9ad928SBarry Smith .keywords: PC, redundant solve 5824b9ad928SBarry Smith @*/ 583dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetPC(PC pc,PC *innerpc) 5844b9ad928SBarry Smith { 585dfbe8321SBarry Smith PetscErrorCode ierr,(*f)(PC,PC*); 5864b9ad928SBarry Smith 5874b9ad928SBarry Smith PetscFunctionBegin; 5884482741eSBarry Smith PetscValidHeaderSpecific(pc,PC_COOKIE,1); 5894482741eSBarry Smith PetscValidPointer(innerpc,2); 5904b9ad928SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantGetPC_C",(void (**)(void))&f);CHKERRQ(ierr); 5914b9ad928SBarry Smith if (f) { 5924b9ad928SBarry Smith ierr = (*f)(pc,innerpc);CHKERRQ(ierr); 5934b9ad928SBarry Smith } 5944b9ad928SBarry Smith PetscFunctionReturn(0); 5954b9ad928SBarry Smith } 5964b9ad928SBarry Smith 5974b9ad928SBarry Smith EXTERN_C_BEGIN 5984b9ad928SBarry Smith #undef __FUNCT__ 5994b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators_Redundant" 600dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetOperators_Redundant(PC pc,Mat *mat,Mat *pmat) 6014b9ad928SBarry Smith { 6024b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 6034b9ad928SBarry Smith 6044b9ad928SBarry Smith PetscFunctionBegin; 6054b9ad928SBarry Smith if (mat) *mat = red->pmats[0]; 6064b9ad928SBarry Smith if (pmat) *pmat = red->pmats[0]; 6074b9ad928SBarry Smith PetscFunctionReturn(0); 6084b9ad928SBarry Smith } 6094b9ad928SBarry Smith EXTERN_C_END 6104b9ad928SBarry Smith 6114b9ad928SBarry Smith #undef __FUNCT__ 6124b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators" 6134b9ad928SBarry Smith /*@ 6144b9ad928SBarry Smith PCRedundantGetOperators - gets the sequential matrix and preconditioner matrix 6154b9ad928SBarry Smith 6164b9ad928SBarry Smith Not Collective 6174b9ad928SBarry Smith 6184b9ad928SBarry Smith Input Parameter: 6194b9ad928SBarry Smith . pc - the preconditioner context 6204b9ad928SBarry Smith 6214b9ad928SBarry Smith Output Parameters: 6224b9ad928SBarry Smith + mat - the matrix 6234b9ad928SBarry Smith - pmat - the (possibly different) preconditioner matrix 6244b9ad928SBarry Smith 6254b9ad928SBarry Smith Level: advanced 6264b9ad928SBarry Smith 6274b9ad928SBarry Smith .keywords: PC, redundant solve 6284b9ad928SBarry Smith @*/ 629dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetOperators(PC pc,Mat *mat,Mat *pmat) 6304b9ad928SBarry Smith { 631dfbe8321SBarry Smith PetscErrorCode ierr,(*f)(PC,Mat*,Mat*); 6324b9ad928SBarry Smith 6334b9ad928SBarry Smith PetscFunctionBegin; 6344482741eSBarry Smith PetscValidHeaderSpecific(pc,PC_COOKIE,1); 6354482741eSBarry Smith if (mat) PetscValidPointer(mat,2); 6364482741eSBarry Smith if (pmat) PetscValidPointer(pmat,3); 6374b9ad928SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantGetOperators_C",(void (**)(void))&f);CHKERRQ(ierr); 6384b9ad928SBarry Smith if (f) { 6394b9ad928SBarry Smith ierr = (*f)(pc,mat,pmat);CHKERRQ(ierr); 6404b9ad928SBarry Smith } 6414b9ad928SBarry Smith PetscFunctionReturn(0); 6424b9ad928SBarry Smith } 6434b9ad928SBarry Smith 6444b9ad928SBarry Smith /* -------------------------------------------------------------------------------------*/ 64537a17b4dSBarry Smith /*MC 64637a17b4dSBarry Smith PCREDUNDANT - Runs a preconditioner for the entire problem on each processor 64737a17b4dSBarry Smith 64837a17b4dSBarry Smith 64937a17b4dSBarry Smith Options for the redundant preconditioners can be set with -redundant_pc_xxx 65037a17b4dSBarry Smith 65137a17b4dSBarry Smith Level: intermediate 65237a17b4dSBarry Smith 65337a17b4dSBarry Smith 65437a17b4dSBarry Smith .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PCRedundantSetScatter(), 65537a17b4dSBarry Smith PCRedundantGetPC(), PCRedundantGetOperators() 65637a17b4dSBarry Smith 65737a17b4dSBarry Smith M*/ 65837a17b4dSBarry Smith 6594b9ad928SBarry Smith EXTERN_C_BEGIN 6604b9ad928SBarry Smith #undef __FUNCT__ 6614b9ad928SBarry Smith #define __FUNCT__ "PCCreate_Redundant" 662dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCCreate_Redundant(PC pc) 6634b9ad928SBarry Smith { 664dfbe8321SBarry Smith PetscErrorCode ierr; 6654b9ad928SBarry Smith PC_Redundant *red; 666e060cb09SBarry Smith const char *prefix; 6674b9ad928SBarry Smith 6683f457be1SHong Zhang PetscInt nsubcomm,np_subcomm,nleftover,i,j,color; 6693f457be1SHong Zhang PetscMPIInt rank,size,subrank,*subsize; 6703f457be1SHong Zhang MPI_Comm subcomm; 6713f457be1SHong Zhang PetscMPIInt duprank; 6723f457be1SHong Zhang PetscMPIInt rank_dup,size_dup; 6733f457be1SHong Zhang MPI_Comm dupcomm; 6743f457be1SHong Zhang 6754b9ad928SBarry Smith PetscFunctionBegin; 6764b9ad928SBarry Smith ierr = PetscNew(PC_Redundant,&red);CHKERRQ(ierr); 67752e6d16bSBarry Smith ierr = PetscLogObjectMemory(pc,sizeof(PC_Redundant));CHKERRQ(ierr); 6784b9ad928SBarry Smith red->useparallelmat = PETSC_TRUE; 6794b9ad928SBarry Smith 6803f457be1SHong Zhang ierr = MPI_Comm_rank(pc->comm,&rank);CHKERRQ(ierr); 6813f457be1SHong Zhang ierr = MPI_Comm_size(pc->comm,&size);CHKERRQ(ierr); 6823f457be1SHong Zhang nsubcomm = size; 6833f457be1SHong Zhang ierr = PetscOptionsGetInt(PETSC_NULL,"-nsubcomm",&nsubcomm,PETSC_NULL);CHKERRQ(ierr); 6843f457be1SHong Zhang if (nsubcomm > size) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE, "Num of subcommunicators %D cannot be larger than MPI_Comm_size %D",nsubcomm,size); 6853f457be1SHong Zhang 6863f457be1SHong Zhang /* get size of each subcommunicators */ 6873f457be1SHong Zhang ierr = PetscMalloc((1+nsubcomm)*sizeof(PetscMPIInt),&subsize);CHKERRQ(ierr); 6883f457be1SHong Zhang np_subcomm = size/nsubcomm; 6893f457be1SHong Zhang nleftover = size - nsubcomm*np_subcomm; 6903f457be1SHong Zhang for (i=0; i<nsubcomm; i++){ 6913f457be1SHong Zhang subsize[i] = np_subcomm; 6923f457be1SHong Zhang if (i<nleftover) subsize[i]++; 6933f457be1SHong Zhang } 6943f457be1SHong Zhang 6953f457be1SHong Zhang /* find color for this proc */ 6963f457be1SHong Zhang color = rank%nsubcomm; 6973f457be1SHong Zhang subrank = rank/nsubcomm; 6983f457be1SHong Zhang 6993f457be1SHong Zhang ierr = MPI_Comm_split(pc->comm,color,subrank,&subcomm);CHKERRQ(ierr); 7003f457be1SHong Zhang red->subcomm = subcomm; 7013f457be1SHong Zhang red->color = color; 7023f457be1SHong Zhang red->nsubcomm = nsubcomm; 7033f457be1SHong Zhang 7043f457be1SHong Zhang j = 0; duprank = 0; 7053f457be1SHong Zhang for (i=0; i<nsubcomm; i++){ 7063f457be1SHong Zhang if (j == color){ 7073f457be1SHong Zhang duprank += subrank; 7083f457be1SHong Zhang break; 7093f457be1SHong Zhang } 7103f457be1SHong Zhang duprank += subsize[i]; j++; 7113f457be1SHong Zhang } 7123f457be1SHong Zhang /* 7133f457be1SHong Zhang ierr = PetscSynchronizedPrintf(pc->comm, "[%d] color %d, subrank %d, duprank %d\n",rank,color,subrank,duprank); 7143f457be1SHong Zhang ierr = PetscSynchronizedFlush(pc->comm);CHKERRQ(ierr); 7153f457be1SHong Zhang */ 7163f457be1SHong Zhang 7173f457be1SHong Zhang ierr = MPI_Comm_split(pc->comm,0,duprank,&dupcomm);CHKERRQ(ierr); 7183f457be1SHong Zhang ierr = MPI_Comm_rank(dupcomm,&rank_dup);CHKERRQ(ierr); 7193f457be1SHong Zhang ierr = MPI_Comm_size(dupcomm,&size_dup);CHKERRQ(ierr); 7203f457be1SHong Zhang /* 7213f457be1SHong Zhang ierr = PetscSynchronizedPrintf(pc->comm, "[%d] duprank %d\n",rank,duprank); 7223f457be1SHong Zhang ierr = PetscSynchronizedFlush(pc->comm);CHKERRQ(ierr); 7233f457be1SHong Zhang */ 7243f457be1SHong Zhang red->dupcomm = dupcomm; 7253f457be1SHong Zhang ierr = PetscFree(subsize);CHKERRQ(ierr); 7263f457be1SHong Zhang 7274b9ad928SBarry Smith /* create the sequential PC that each processor has copy of */ 7283f457be1SHong Zhang ierr = PCCreate(subcomm,&red->pc);CHKERRQ(ierr); 7294b9ad928SBarry Smith ierr = PCSetType(red->pc,PCLU);CHKERRQ(ierr); 7304b9ad928SBarry Smith ierr = PCGetOptionsPrefix(pc,&prefix);CHKERRQ(ierr); 7314b9ad928SBarry Smith ierr = PCSetOptionsPrefix(red->pc,prefix);CHKERRQ(ierr); 7324b9ad928SBarry Smith ierr = PCAppendOptionsPrefix(red->pc,"redundant_");CHKERRQ(ierr); 7334b9ad928SBarry Smith 7344b9ad928SBarry Smith pc->ops->apply = PCApply_Redundant; 7354b9ad928SBarry Smith pc->ops->applytranspose = 0; 7364b9ad928SBarry Smith pc->ops->setup = PCSetUp_Redundant; 7374b9ad928SBarry Smith pc->ops->destroy = PCDestroy_Redundant; 7384b9ad928SBarry Smith pc->ops->setfromoptions = PCSetFromOptions_Redundant; 7394b9ad928SBarry Smith pc->ops->setuponblocks = 0; 7404b9ad928SBarry Smith pc->ops->view = PCView_Redundant; 7414b9ad928SBarry Smith pc->ops->applyrichardson = 0; 7424b9ad928SBarry Smith 7434b9ad928SBarry Smith pc->data = (void*)red; 7444b9ad928SBarry Smith 7454b9ad928SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantSetScatter_C","PCRedundantSetScatter_Redundant", 7464b9ad928SBarry Smith PCRedundantSetScatter_Redundant);CHKERRQ(ierr); 7474b9ad928SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantGetPC_C","PCRedundantGetPC_Redundant", 7484b9ad928SBarry Smith PCRedundantGetPC_Redundant);CHKERRQ(ierr); 7494b9ad928SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantGetOperators_C","PCRedundantGetOperators_Redundant", 7504b9ad928SBarry Smith PCRedundantGetOperators_Redundant);CHKERRQ(ierr); 7514b9ad928SBarry Smith 7524b9ad928SBarry Smith PetscFunctionReturn(0); 7534b9ad928SBarry Smith } 7544b9ad928SBarry Smith EXTERN_C_END 755