xref: /petsc/src/ksp/pc/impls/redundant/redundant.c (revision 0ae51fcdcedb33c1b8546b85eed5e90d983fd463)
1dba47a55SKris Buschelman #define PETSCKSP_DLL
2dba47a55SKris Buschelman 
34b9ad928SBarry Smith /*
43f457be1SHong Zhang   This file defines a "solve the problem redundantly on each subgroup of processor" preconditioner.
54b9ad928SBarry Smith */
66356e834SBarry Smith #include "private/pcimpl.h"     /*I "petscpc.h" I*/
74b9ad928SBarry Smith #include "petscksp.h"
84b9ad928SBarry Smith 
94b9ad928SBarry Smith typedef struct {
104b9ad928SBarry Smith   PC         pc;                   /* actual preconditioner used on each processor */
113f457be1SHong Zhang   Vec        xsub,ysub;            /* vectors of a subcommunicator to hold parallel vectors of pc->comm */
123f457be1SHong Zhang   Vec        xdup,ydup;            /* parallel vector that congregates xsub or ysub facilitating vector scattering */
134b9ad928SBarry Smith   Mat        *pmats;               /* matrix and optional preconditioner matrix */
14f664ae05SHong Zhang   Mat        pmats_sub;            /* matrix and optional preconditioner matrix belong to a subcommunicator */
153f457be1SHong Zhang   VecScatter scatterin,scatterout; /* scatter used to move all values to each processor group (subcommunicator) */
164b9ad928SBarry Smith   PetscTruth useparallelmat;
173f457be1SHong Zhang   MPI_Comm   subcomm;              /* processors belong to a subcommunicator implement a PC in parallel */
183f457be1SHong Zhang   MPI_Comm   dupcomm;              /* processors belong to pc->comm with their rank remapped in the way
193f457be1SHong Zhang                                       that vector xdup/ydup has contiguous rank while appending xsub/ysub along their colors */
203f457be1SHong Zhang   PetscInt   nsubcomm;             /* num of subcommunicators, which equals the num of redundant matrix systems */
213f457be1SHong Zhang   PetscInt   color;                /* color of processors in a subcommunicator */
224b9ad928SBarry Smith } PC_Redundant;
234b9ad928SBarry Smith 
244b9ad928SBarry Smith #undef __FUNCT__
254b9ad928SBarry Smith #define __FUNCT__ "PCView_Redundant"
266849ba73SBarry Smith static PetscErrorCode PCView_Redundant(PC pc,PetscViewer viewer)
274b9ad928SBarry Smith {
284b9ad928SBarry Smith   PC_Redundant   *red = (PC_Redundant*)pc->data;
29dfbe8321SBarry Smith   PetscErrorCode ierr;
3013f74950SBarry Smith   PetscMPIInt    rank;
3132077d6dSBarry Smith   PetscTruth     iascii,isstring;
324b9ad928SBarry Smith   PetscViewer    sviewer;
334b9ad928SBarry Smith 
344b9ad928SBarry Smith   PetscFunctionBegin;
354b9ad928SBarry Smith   ierr = MPI_Comm_rank(pc->comm,&rank);CHKERRQ(ierr);
3632077d6dSBarry Smith   ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&iascii);CHKERRQ(ierr);
374b9ad928SBarry Smith   ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_STRING,&isstring);CHKERRQ(ierr);
3832077d6dSBarry Smith   if (iascii) {
394b9ad928SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"  Redundant solver preconditioner: Actual PC follows\n");CHKERRQ(ierr);
404b9ad928SBarry Smith     ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr);
414b9ad928SBarry Smith     if (!rank) {
424b9ad928SBarry Smith       ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
434b9ad928SBarry Smith       ierr = PCView(red->pc,sviewer);CHKERRQ(ierr);
444b9ad928SBarry Smith       ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
454b9ad928SBarry Smith     }
464b9ad928SBarry Smith     ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr);
474b9ad928SBarry Smith   } else if (isstring) {
484b9ad928SBarry Smith     ierr = PetscViewerStringSPrintf(viewer," Redundant solver preconditioner");CHKERRQ(ierr);
494b9ad928SBarry Smith     ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr);
504b9ad928SBarry Smith     if (!rank) {
514b9ad928SBarry Smith       ierr = PCView(red->pc,sviewer);CHKERRQ(ierr);
524b9ad928SBarry Smith     }
534b9ad928SBarry Smith     ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr);
544b9ad928SBarry Smith   } else {
5579a5c55eSBarry Smith     SETERRQ1(PETSC_ERR_SUP,"Viewer type %s not supported for PC redundant",((PetscObject)viewer)->type_name);
564b9ad928SBarry Smith   }
574b9ad928SBarry Smith   PetscFunctionReturn(0);
584b9ad928SBarry Smith }
594b9ad928SBarry Smith 
603f457be1SHong Zhang #include "src/mat/matimpl.h"        /*I "petscmat.h" I*/
613f457be1SHong Zhang #include "private/vecimpl.h"
623f457be1SHong Zhang #include "src/mat/impls/aij/mpi/mpiaij.h"   /*I "petscmat.h" I*/
633f457be1SHong Zhang #include "src/mat/impls/aij/seq/aij.h"      /*I "petscmat.h" I*/
643f457be1SHong Zhang 
653f457be1SHong Zhang #undef __FUNCT__
663f457be1SHong Zhang #define __FUNCT__ "MatGetRedundantMatrix"
67f664ae05SHong Zhang PetscErrorCode MatGetRedundantMatrix_AIJ(Mat mat,PetscInt nsubcomm,MPI_Comm subcomm,PetscInt mlocal_sub,MatReuse reuse,Mat *matredundant)
683f457be1SHong Zhang {
693f457be1SHong Zhang   PetscMPIInt    rank,size,subrank,subsize;
703f457be1SHong Zhang   MPI_Comm       comm=mat->comm;
713f457be1SHong Zhang   PetscErrorCode ierr;
72f664ae05SHong Zhang   PetscInt       nsends,nrecvs,i,prid=100,itmp;
733f457be1SHong Zhang   PetscMPIInt    *send_rank,*recv_rank;
74f664ae05SHong Zhang   PetscInt       *rowrange=mat->rmap.range,nzlocal;
753f457be1SHong Zhang   Mat_MPIAIJ     *aij = (Mat_MPIAIJ*)mat->data;
763f457be1SHong Zhang   Mat            A=aij->A,B=aij->B;
773f457be1SHong Zhang   Mat_SeqAIJ     *a=(Mat_SeqAIJ*)A->data,*b=(Mat_SeqAIJ*)B->data;
78*0ae51fcdSHong Zhang   Mat            C=*matredundant;
793f457be1SHong Zhang 
803f457be1SHong Zhang   PetscInt       nleftover,np_subcomm,j;
813f457be1SHong Zhang   PetscInt       nz_A,nz_B,*sbuf_j;
823f457be1SHong Zhang   PetscScalar    *sbuf_a;
833f457be1SHong Zhang   PetscInt       cstart=mat->cmap.rstart,cend=mat->cmap.rend,row,nzA,nzB,ncols,*cworkA,*cworkB;
843f457be1SHong Zhang   PetscInt       rstart=mat->rmap.rstart,rend=mat->rmap.rend,*bmap=aij->garray,M,N;
853f457be1SHong Zhang   PetscInt       *cols,ctmp,lwrite,*rptr,l;
863f457be1SHong Zhang   PetscScalar    *vals,*aworkA,*aworkB;
873f457be1SHong Zhang   PetscMPIInt    tag1,tag2,tag3,imdex;
883f457be1SHong Zhang   MPI_Request    *s_waits1,*s_waits2,*s_waits3,*r_waits1,*r_waits2,*r_waits3;
893f457be1SHong Zhang   MPI_Status     recv_status,*send_status;
903f457be1SHong Zhang   PetscInt       *sbuf_nz,*rbuf_nz,count;
913f457be1SHong Zhang   PetscInt       **rbuf_j;
923f457be1SHong Zhang   PetscScalar    **rbuf_a;
933f457be1SHong Zhang 
943f457be1SHong Zhang   PetscFunctionBegin;
95*0ae51fcdSHong Zhang   if (reuse == MAT_REUSE_MATRIX) {
96*0ae51fcdSHong Zhang     PetscTruth flag;
97*0ae51fcdSHong Zhang     ierr = MatGetSize(C,&M,&N);CHKERRQ(ierr);
98*0ae51fcdSHong Zhang     if (M != N || M != mat->rmap.N) {
99*0ae51fcdSHong Zhang       SETERRQ(PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong global size");
100*0ae51fcdSHong Zhang     }
101*0ae51fcdSHong Zhang     ierr = MatGetLocalSize(C,&M,&N);CHKERRQ(ierr);
102*0ae51fcdSHong Zhang     if (M != N || M != mlocal_sub) {
103*0ae51fcdSHong Zhang       SETERRQ(PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong local size");
104*0ae51fcdSHong Zhang     }
105*0ae51fcdSHong Zhang   }
106*0ae51fcdSHong Zhang 
1073f457be1SHong Zhang   ierr = PetscOptionsGetInt(PETSC_NULL,"-prid",&prid,PETSC_NULL);CHKERRQ(ierr);
1083f457be1SHong Zhang   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
1093f457be1SHong Zhang   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
1103f457be1SHong Zhang   ierr = MPI_Comm_rank(subcomm,&subrank);CHKERRQ(ierr);
1113f457be1SHong Zhang   ierr = MPI_Comm_size(subcomm,&subsize);CHKERRQ(ierr);
1123f457be1SHong Zhang   /*
1133f457be1SHong Zhang   ierr = PetscSynchronizedPrintf(comm, "[%d] subrank %d, subsize %d\n",rank,subrank,subsize);
1143f457be1SHong Zhang   ierr = PetscSynchronizedFlush(comm);CHKERRQ(ierr);
1153f457be1SHong Zhang   */
1163f457be1SHong Zhang   /* get the destination processors */
1173f457be1SHong Zhang   ierr = PetscMalloc((2*size+1)*sizeof(PetscMPIInt),&send_rank);
1183f457be1SHong Zhang   recv_rank = send_rank + size;
1193f457be1SHong Zhang   np_subcomm = size/nsubcomm;
1203f457be1SHong Zhang   nleftover  = size - nsubcomm*np_subcomm;
1213f457be1SHong Zhang   nsends = 0; nrecvs = 0;
1223f457be1SHong Zhang   for (i=0; i<size; i++){ /* i=rank*/
1233f457be1SHong Zhang     if (subrank == i/nsubcomm && rank != i){ /* my_subrank == other's subrank */
1243f457be1SHong Zhang       send_rank[nsends] = i; nsends++;
1253f457be1SHong Zhang       recv_rank[nrecvs++] = i;
1263f457be1SHong Zhang     }
1273f457be1SHong Zhang   }
1283f457be1SHong Zhang   if (rank >= size - nleftover){/* this proc is a leftover processor */
1293f457be1SHong Zhang     i = size-nleftover-1;
1303f457be1SHong Zhang     j = 0;
1313f457be1SHong Zhang     while (j < nsubcomm - nleftover){
1323f457be1SHong Zhang       send_rank[nsends++] = i;
1333f457be1SHong Zhang       i--; j++;
1343f457be1SHong Zhang     }
1353f457be1SHong Zhang   }
1363f457be1SHong Zhang 
1373f457be1SHong Zhang   if (nleftover && subsize == size/nsubcomm && subrank==subsize-1){ /* this proc recvs from leftover processors */
1383f457be1SHong Zhang     for (i=0; i<nleftover; i++){
1393f457be1SHong Zhang       recv_rank[nrecvs++] = size-nleftover+i;
1403f457be1SHong Zhang     }
1413f457be1SHong Zhang   }
1423f457be1SHong Zhang   if (prid == rank){
1433f457be1SHong Zhang     printf("[%d] sends to ",rank);
1443f457be1SHong Zhang     for (i=0; i<nsends; i++) printf(" [%d],",send_rank[i]);
1453f457be1SHong Zhang     printf("  \n");
1463f457be1SHong Zhang   }
1473f457be1SHong Zhang   /*
1483f457be1SHong Zhang   ierr = PetscSynchronizedPrintf(comm, "[%d] nsends %d, nrecvs %d\n",rank,nsends,nrecvs);
1493f457be1SHong Zhang   ierr = PetscSynchronizedFlush(comm);CHKERRQ(ierr);
1503f457be1SHong Zhang   ierr = MPI_Barrier(comm);CHKERRQ(ierr);
1513f457be1SHong Zhang   */
1523f457be1SHong Zhang 
1533f457be1SHong Zhang   /* get this processor's nzlocal=nz_A+nz_B */
1543f457be1SHong Zhang   nz_A = a->nz; nz_B = b->nz;
1553f457be1SHong Zhang   nzlocal = nz_A + nz_B;
1563f457be1SHong Zhang 
1573f457be1SHong Zhang   /* allocate sbuf_j, sbuf_a, then copy mat's local entries into the buffers */
1583f457be1SHong Zhang   itmp = nzlocal + rowrange[rank+1] - rowrange[rank] + 2;
1593f457be1SHong Zhang   ierr = PetscMalloc(itmp*sizeof(PetscInt),&sbuf_j);CHKERRQ(ierr);
1603f457be1SHong Zhang   ierr = PetscMalloc((nzlocal+1)*sizeof(PetscScalar),&sbuf_a);CHKERRQ(ierr);
1613f457be1SHong Zhang 
1623f457be1SHong Zhang     rptr = sbuf_j;
1633f457be1SHong Zhang     cols = sbuf_j + rend-rstart + 1;
1643f457be1SHong Zhang     vals = sbuf_a;
1653f457be1SHong Zhang     rptr[0] = 0;
1663f457be1SHong Zhang     for (i=0; i<rend-rstart; i++){
1673f457be1SHong Zhang       row = i + rstart;
1683f457be1SHong Zhang       nzA    = a->i[i+1] - a->i[i]; nzB = b->i[i+1] - b->i[i];
1693f457be1SHong Zhang       ncols  = nzA + nzB;
1703f457be1SHong Zhang       cworkA = a->j + a->i[i]; cworkB = b->j + b->i[i];
1713f457be1SHong Zhang       aworkA = a->a + a->i[i]; aworkB = b->a + b->i[i];
1723f457be1SHong Zhang       /* load the column indices for this row into cols */
1733f457be1SHong Zhang       lwrite = 0;
1743f457be1SHong Zhang       for (l=0; l<nzB; l++) {
1753f457be1SHong Zhang         if ((ctmp = bmap[cworkB[l]]) < cstart){
1763f457be1SHong Zhang           vals[lwrite]   = aworkB[l];
1773f457be1SHong Zhang           cols[lwrite++] = ctmp;
1783f457be1SHong Zhang         }
1793f457be1SHong Zhang       }
1803f457be1SHong Zhang       for (l=0; l<nzA; l++){
1813f457be1SHong Zhang         vals[lwrite]   = aworkA[l];
1823f457be1SHong Zhang         cols[lwrite++] = cstart + cworkA[l];
1833f457be1SHong Zhang       }
1843f457be1SHong Zhang       for (l=0; l<nzB; l++) {
1853f457be1SHong Zhang         if ((ctmp = bmap[cworkB[l]]) >= cend){
1863f457be1SHong Zhang           vals[lwrite]   = aworkB[l];
1873f457be1SHong Zhang           cols[lwrite++] = ctmp;
1883f457be1SHong Zhang         }
1893f457be1SHong Zhang       }
1903f457be1SHong Zhang       /* insert local matrix values into C */
191ca616198SHong Zhang       /* ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); */
1923f457be1SHong Zhang 
1933f457be1SHong Zhang       vals += ncols;
1943f457be1SHong Zhang       cols += ncols;
1953f457be1SHong Zhang       rptr[i+1] = rptr[i] + ncols;
1963f457be1SHong Zhang     }
1973f457be1SHong Zhang     /*
1983f457be1SHong Zhang     ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1993f457be1SHong Zhang     ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2003f457be1SHong Zhang     */
2013f457be1SHong Zhang     if (rptr[rend-rstart] != a->nz + b->nz) SETERRQ4(1, "rptr[%d] %d != %d + %d",rend-rstart,rptr[rend-rstart+1],a->nz,b->nz);
2023f457be1SHong Zhang 
2033f457be1SHong Zhang   /* send nzlocal to others, and recv other's nzlocal */
2043f457be1SHong Zhang   /*--------------------------------------------------*/
2053f457be1SHong Zhang   ierr = PetscMalloc3(nsends+nrecvs+1,PetscInt,&sbuf_nz,nrecvs,PetscInt*,&rbuf_j,nrecvs,PetscScalar*,&rbuf_a);CHKERRQ(ierr);
2063f457be1SHong Zhang   rbuf_nz = sbuf_nz + nsends;
2073f457be1SHong Zhang 
2083f457be1SHong Zhang   ierr = PetscMalloc2(3*(nsends + nrecvs)+1,MPI_Request,&s_waits1,nsends+1,MPI_Status,&send_status);CHKERRQ(ierr);
2093f457be1SHong Zhang   s_waits2 = s_waits1 + nsends;
2103f457be1SHong Zhang   s_waits3 = s_waits2 + nsends;
2113f457be1SHong Zhang   r_waits1 = s_waits3 + nsends;
2123f457be1SHong Zhang   r_waits2 = r_waits1 + nrecvs;
2133f457be1SHong Zhang   r_waits3 = r_waits2 + nrecvs;
2143f457be1SHong Zhang 
2153f457be1SHong Zhang   /* get some new tags to keep the communication clean */
2163f457be1SHong Zhang   ierr = PetscObjectGetNewTag((PetscObject)A,&tag1);CHKERRQ(ierr);
2173f457be1SHong Zhang   ierr = PetscObjectGetNewTag((PetscObject)A,&tag2);CHKERRQ(ierr);
2183f457be1SHong Zhang   ierr = PetscObjectGetNewTag((PetscObject)A,&tag3);CHKERRQ(ierr);
2193f457be1SHong Zhang 
2203f457be1SHong Zhang   /* post receives of other's nzlocal */
2213f457be1SHong Zhang   for (i=0; i<nrecvs; i++){
2223f457be1SHong Zhang     ierr = MPI_Irecv(rbuf_nz+i,1,MPIU_INT,MPI_ANY_SOURCE,tag1,comm,r_waits1+i);CHKERRQ(ierr);
2233f457be1SHong Zhang   }
2243f457be1SHong Zhang 
2253f457be1SHong Zhang   /* send nzlocal to others */
2263f457be1SHong Zhang   for (i=0; i<nsends; i++){
2273f457be1SHong Zhang     sbuf_nz[i] = nzlocal;
2283f457be1SHong Zhang     ierr = MPI_Isend(sbuf_nz+i,1,MPIU_INT,send_rank[i],tag1,comm,s_waits1+i);CHKERRQ(ierr);
2293f457be1SHong Zhang     if (prid == rank) printf(" [%d] sends nz %d to [%d]\n",rank,nzlocal,send_rank[i]);
2303f457be1SHong Zhang   }
2313f457be1SHong Zhang 
2323f457be1SHong Zhang   /* wait on receives of nzlocal; allocate space for rbuf_j, rbuf_a */
2333f457be1SHong Zhang   count = nrecvs;
2343f457be1SHong Zhang   while (count) {
2353f457be1SHong Zhang     ierr = MPI_Waitany(nrecvs,r_waits1,&imdex,&recv_status);CHKERRQ(ierr);
2363f457be1SHong Zhang     recv_rank[imdex] = recv_status.MPI_SOURCE;
2373f457be1SHong Zhang     /* allocate rbuf_a and rbuf_j; then post receives of rbuf_a and rbuf_j */
2383f457be1SHong Zhang     ierr = PetscMalloc((rbuf_nz[imdex]+1)*sizeof(PetscScalar),&rbuf_a[imdex]);CHKERRQ(ierr);
2393f457be1SHong Zhang     ierr = MPI_Irecv(rbuf_a[imdex],rbuf_nz[imdex],MPIU_SCALAR,recv_status.MPI_SOURCE,tag3,comm,r_waits3+imdex);CHKERRQ(ierr);
2403f457be1SHong Zhang 
2413f457be1SHong Zhang     itmp = rowrange[recv_status.MPI_SOURCE+1] - rowrange[recv_status.MPI_SOURCE]; /* number of expected mat->i */
2423f457be1SHong Zhang     rbuf_nz[imdex] += itmp+2;
2433f457be1SHong Zhang     ierr = PetscMalloc(rbuf_nz[imdex]*sizeof(PetscInt),&rbuf_j[imdex]);CHKERRQ(ierr);
2443f457be1SHong Zhang     ierr = MPI_Irecv(rbuf_j[imdex],rbuf_nz[imdex],MPIU_INT,recv_status.MPI_SOURCE,tag2,comm,r_waits2+imdex);CHKERRQ(ierr);
2453f457be1SHong Zhang     count--;
2463f457be1SHong Zhang   }
2473f457be1SHong Zhang 
2483f457be1SHong Zhang   /* wait on sends of nzlocal */
2493f457be1SHong Zhang   if (nsends) {ierr = MPI_Waitall(nsends,s_waits1,send_status);CHKERRQ(ierr);}
2503f457be1SHong Zhang 
2513f457be1SHong Zhang   /* send mat->i,j and mat->a to others, and recv from other's */
2523f457be1SHong Zhang   /*-----------------------------------------------------------*/
2533f457be1SHong Zhang   for (i=0; i<nsends; i++){
2543f457be1SHong Zhang     ierr = MPI_Isend(sbuf_a,nzlocal,MPIU_SCALAR,send_rank[i],tag3,comm,s_waits3+i);CHKERRQ(ierr);
2553f457be1SHong Zhang     itmp = nzlocal + rowrange[rank+1] - rowrange[rank] + 1;
2563f457be1SHong Zhang     ierr = MPI_Isend(sbuf_j,itmp,MPIU_INT,send_rank[i],tag2,comm,s_waits2+i);CHKERRQ(ierr);
2573f457be1SHong Zhang   }
2583f457be1SHong Zhang 
2593f457be1SHong Zhang   /* wait on receives of mat->i,j and mat->a */
2603f457be1SHong Zhang   /*-----------------------------------------*/
2613f457be1SHong Zhang   count = nrecvs;
2623f457be1SHong Zhang   while (count) {
2633f457be1SHong Zhang     ierr = MPI_Waitany(nrecvs,r_waits3,&imdex,&recv_status);CHKERRQ(ierr);
2643f457be1SHong Zhang     if (recv_rank[imdex] != recv_status.MPI_SOURCE) SETERRQ2(1, "recv_rank %d != MPI_SOURCE %d",recv_rank[imdex],recv_status.MPI_SOURCE);
2653f457be1SHong Zhang     ierr = MPI_Waitany(nrecvs,r_waits2,&imdex,&recv_status);CHKERRQ(ierr);
2663f457be1SHong Zhang     count--;
2673f457be1SHong Zhang   }
2683f457be1SHong Zhang 
2693f457be1SHong Zhang   /* wait on sends of mat->i,j and mat->a */
2703f457be1SHong Zhang   /*--------------------------------------*/
2713f457be1SHong Zhang   if (nsends) {
2723f457be1SHong Zhang     ierr = MPI_Waitall(nsends,s_waits3,send_status);CHKERRQ(ierr);
2733f457be1SHong Zhang     ierr = MPI_Waitall(nsends,s_waits2,send_status);CHKERRQ(ierr);
2743f457be1SHong Zhang   }
2753f457be1SHong Zhang   ierr = PetscFree(sbuf_nz);CHKERRQ(ierr);
2763f457be1SHong Zhang   ierr = PetscFree2(s_waits1,send_status);CHKERRQ(ierr);
2773f457be1SHong Zhang 
2783f457be1SHong Zhang   /* create redundant matrix */
2793f457be1SHong Zhang   /*-------------------------*/
280*0ae51fcdSHong Zhang   if (reuse == MAT_INITIAL_MATRIX){
2813f457be1SHong Zhang     ierr = MatCreate(subcomm,&C);CHKERRQ(ierr);
2823f457be1SHong Zhang     ierr = MatSetSizes(C,mlocal_sub,mlocal_sub,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
2833f457be1SHong Zhang     ierr = MatSetFromOptions(C);CHKERRQ(ierr);
284*0ae51fcdSHong Zhang   } else {
285*0ae51fcdSHong Zhang     C = *matredundant;
286*0ae51fcdSHong Zhang   }
2873f457be1SHong Zhang   /* insert local matrix entries */
2883f457be1SHong Zhang   rptr = sbuf_j;
2893f457be1SHong Zhang   cols = sbuf_j + rend-rstart + 1;
2903f457be1SHong Zhang   vals = sbuf_a;
2913f457be1SHong Zhang   for (i=0; i<rend-rstart; i++){
2923f457be1SHong Zhang     row   = i + rstart;
2933f457be1SHong Zhang     ncols = rptr[i+1] - rptr[i];
2943f457be1SHong Zhang     ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr);
2953f457be1SHong Zhang     vals += ncols;
2963f457be1SHong Zhang     cols += ncols;
2973f457be1SHong Zhang   }
2983f457be1SHong Zhang   /* insert received matrix entries */
2993f457be1SHong Zhang   for (imdex=0; imdex<nrecvs; imdex++){
3003f457be1SHong Zhang 
3013f457be1SHong Zhang     rstart = rowrange[recv_rank[imdex]];
3023f457be1SHong Zhang     rend   = rowrange[recv_rank[imdex]+1];
3033f457be1SHong Zhang     rptr = rbuf_j[imdex];
3043f457be1SHong Zhang     cols = rbuf_j[imdex] + rend-rstart + 1;
3053f457be1SHong Zhang     vals = rbuf_a[imdex];
3063f457be1SHong Zhang     for (i=0; i<rend-rstart; i++){
3073f457be1SHong Zhang       row   = i + rstart;
3083f457be1SHong Zhang       ncols = rptr[i+1] - rptr[i];
3093f457be1SHong Zhang       ierr = MatSetValues(C,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr);
3103f457be1SHong Zhang       vals += ncols;
3113f457be1SHong Zhang       cols += ncols;
3123f457be1SHong Zhang     }
3133f457be1SHong Zhang   }
3143f457be1SHong Zhang   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3153f457be1SHong Zhang   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3163f457be1SHong Zhang   ierr = MatGetSize(C,&M,&N);CHKERRQ(ierr);
3173f457be1SHong Zhang   if (M != mat->rmap.N || N != mat->cmap.N) SETERRQ2(PETSC_ERR_ARG_INCOMP,"redundant mat size %d != input mat size %d",M,mat->rmap.N);
318*0ae51fcdSHong Zhang   if (reuse == MAT_INITIAL_MATRIX){
3193f457be1SHong Zhang     *matredundant = C;
320*0ae51fcdSHong Zhang   }
3213f457be1SHong Zhang 
3223f457be1SHong Zhang   /* free space */
3233f457be1SHong Zhang   ierr = PetscFree(send_rank);CHKERRQ(ierr);
3243f457be1SHong Zhang   ierr = PetscFree(sbuf_j);CHKERRQ(ierr);
3253f457be1SHong Zhang   ierr = PetscFree(sbuf_a);CHKERRQ(ierr);
3263f457be1SHong Zhang   for (i=0; i<nrecvs; i++){
3273f457be1SHong Zhang     ierr = PetscFree(rbuf_j[i]);CHKERRQ(ierr);
3283f457be1SHong Zhang     ierr = PetscFree(rbuf_a[i]);CHKERRQ(ierr);
3293f457be1SHong Zhang   }
3303f457be1SHong Zhang   ierr = PetscFree3(sbuf_nz,rbuf_j,rbuf_a);CHKERRQ(ierr);
3313f457be1SHong Zhang   PetscFunctionReturn(0);
3323f457be1SHong Zhang }
3333f457be1SHong Zhang 
3344b9ad928SBarry Smith #undef __FUNCT__
3354b9ad928SBarry Smith #define __FUNCT__ "PCSetUp_Redundant"
3366849ba73SBarry Smith static PetscErrorCode PCSetUp_Redundant(PC pc)
3374b9ad928SBarry Smith {
3384b9ad928SBarry Smith   PC_Redundant   *red  = (PC_Redundant*)pc->data;
339dfbe8321SBarry Smith   PetscErrorCode ierr;
3403f457be1SHong Zhang   PetscInt       mstart,mend,mlocal,m;
34113f74950SBarry Smith   PetscMPIInt    size;
3424b9ad928SBarry Smith   IS             isl;
3434b9ad928SBarry Smith   MatReuse       reuse = MAT_INITIAL_MATRIX;
3444b9ad928SBarry Smith   MatStructure   str   = DIFFERENT_NONZERO_PATTERN;
3454b9ad928SBarry Smith   MPI_Comm       comm;
34623ce1328SBarry Smith   Vec            vec;
3474b9ad928SBarry Smith 
3483f457be1SHong Zhang   PetscInt    mlocal_sub;
3493f457be1SHong Zhang   PetscMPIInt subsize,subrank;
3503f457be1SHong Zhang   PetscInt    rstart_sub,rend_sub,mloc_sub;
3513f457be1SHong Zhang 
3524b9ad928SBarry Smith   PetscFunctionBegin;
3533f457be1SHong Zhang   ierr = PetscObjectGetComm((PetscObject)pc->pmat,&comm);CHKERRQ(ierr);
35423ce1328SBarry Smith   ierr = MatGetVecs(pc->pmat,&vec,0);CHKERRQ(ierr);
3554b9ad928SBarry Smith   ierr = PCSetFromOptions(red->pc);CHKERRQ(ierr);
35623ce1328SBarry Smith   ierr = VecGetSize(vec,&m);CHKERRQ(ierr);
3574b9ad928SBarry Smith   if (!pc->setupcalled) {
3583f457be1SHong Zhang     /* create working vectors xsub/ysub and xdup/ydup */
35923ce1328SBarry Smith     ierr = VecGetLocalSize(vec,&mlocal);CHKERRQ(ierr);
3603f457be1SHong Zhang     ierr = VecGetOwnershipRange(vec,&mstart,&mend);CHKERRQ(ierr);
3614b9ad928SBarry Smith 
3623f457be1SHong Zhang     /* get local size of xsub/ysub */
3633f457be1SHong Zhang     ierr = MPI_Comm_size(red->subcomm,&subsize);CHKERRQ(ierr);
3643f457be1SHong Zhang     ierr = MPI_Comm_rank(red->subcomm,&subrank);CHKERRQ(ierr);
3653f457be1SHong Zhang     rstart_sub = pc->pmat->rmap.range[red->nsubcomm*subrank]; /* rstart in xsub/ysub */
3663f457be1SHong Zhang     if (subrank+1 < subsize){
3673f457be1SHong Zhang       rend_sub = pc->pmat->rmap.range[red->nsubcomm*(subrank+1)];
3683f457be1SHong Zhang     } else {
3693f457be1SHong Zhang       rend_sub = m;
3703f457be1SHong Zhang     }
3713f457be1SHong Zhang     mloc_sub = rend_sub - rstart_sub;
3723f457be1SHong Zhang     ierr = VecCreateMPI(red->subcomm,mloc_sub,PETSC_DECIDE,&red->ysub);CHKERRQ(ierr);
3733f457be1SHong Zhang     /* create xsub with empty local arrays, because xdup's arrays will be placed into it */
3743f457be1SHong Zhang     ierr = VecCreateMPIWithArray(red->subcomm,mloc_sub,PETSC_DECIDE,PETSC_NULL,&red->xsub);CHKERRQ(ierr);
3753f457be1SHong Zhang 
3763f457be1SHong Zhang     /* create xdup and ydup. ydup has empty local arrays because ysub's arrays will be place into it.
3773f457be1SHong Zhang        Note: we use communicator dupcomm, not pc->comm! */
3783f457be1SHong Zhang     ierr = VecCreateMPI(red->dupcomm,mloc_sub,PETSC_DECIDE,&red->xdup);CHKERRQ(ierr);
3793f457be1SHong Zhang     ierr = VecCreateMPIWithArray(red->dupcomm,mloc_sub,PETSC_DECIDE,PETSC_NULL,&red->ydup);CHKERRQ(ierr);
3803f457be1SHong Zhang 
3813f457be1SHong Zhang     /* create vec scatters */
3823f457be1SHong Zhang     if (!red->scatterin){
3833f457be1SHong Zhang       IS       is1,is2;
3843f457be1SHong Zhang       PetscInt *idx1,*idx2,i,j,k;
3853f457be1SHong Zhang       ierr = PetscMalloc(2*red->nsubcomm*mlocal*sizeof(PetscInt),&idx1);CHKERRQ(ierr);
3863f457be1SHong Zhang       idx2 = idx1 + red->nsubcomm*mlocal;
3873f457be1SHong Zhang       j = 0;
3883f457be1SHong Zhang       for (k=0; k<red->nsubcomm; k++){
3893f457be1SHong Zhang         for (i=mstart; i<mend; i++){
3903f457be1SHong Zhang           idx1[j]   = i;
3913f457be1SHong Zhang           idx2[j++] = i + m*k;
3923f457be1SHong Zhang         }
3933f457be1SHong Zhang       }
3943f457be1SHong Zhang       ierr = ISCreateGeneral(comm,red->nsubcomm*mlocal,idx1,&is1);CHKERRQ(ierr);
3953f457be1SHong Zhang       ierr = ISCreateGeneral(comm,red->nsubcomm*mlocal,idx2,&is2);CHKERRQ(ierr);
3963f457be1SHong Zhang       ierr = VecScatterCreate(vec,is1,red->xdup,is2,&red->scatterin);CHKERRQ(ierr);
3973f457be1SHong Zhang       ierr = ISDestroy(is1);CHKERRQ(ierr);
3983f457be1SHong Zhang       ierr = ISDestroy(is2);CHKERRQ(ierr);
3993f457be1SHong Zhang 
4003f457be1SHong Zhang       ierr = ISCreateStride(comm,mlocal,mstart+ red->color*m,1,&is1);CHKERRQ(ierr);
4013f457be1SHong Zhang       ierr = ISCreateStride(comm,mlocal,mstart,1,&is2);CHKERRQ(ierr);
4023f457be1SHong Zhang       ierr = VecScatterCreate(red->xdup,is1,vec,is2,&red->scatterout);CHKERRQ(ierr);
4033f457be1SHong Zhang       ierr = ISDestroy(is1);CHKERRQ(ierr);
4043f457be1SHong Zhang       ierr = ISDestroy(is2);CHKERRQ(ierr);
4053f457be1SHong Zhang       ierr = PetscFree(idx1);CHKERRQ(ierr);
4064b9ad928SBarry Smith     }
4074b9ad928SBarry Smith   }
40823ce1328SBarry Smith   ierr = VecDestroy(vec);CHKERRQ(ierr);
4094b9ad928SBarry Smith 
4104b9ad928SBarry Smith   /* if pmatrix set by user is sequential then we do not need to gather the parallel matrix */
4113f457be1SHong Zhang   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
4124b9ad928SBarry Smith   if (size == 1) {
4134b9ad928SBarry Smith     red->useparallelmat = PETSC_FALSE;
4144b9ad928SBarry Smith   }
4154b9ad928SBarry Smith 
4164b9ad928SBarry Smith   if (red->useparallelmat) {
4174b9ad928SBarry Smith     if (pc->setupcalled == 1 && pc->flag == DIFFERENT_NONZERO_PATTERN) {
4184b9ad928SBarry Smith       /* destroy old matrices */
4194b9ad928SBarry Smith       if (red->pmats) {
4204b9ad928SBarry Smith         ierr = MatDestroyMatrices(1,&red->pmats);CHKERRQ(ierr);
4214b9ad928SBarry Smith       }
4224b9ad928SBarry Smith     } else if (pc->setupcalled == 1) {
4234b9ad928SBarry Smith       reuse = MAT_REUSE_MATRIX;
4244b9ad928SBarry Smith       str   = SAME_NONZERO_PATTERN;
4254b9ad928SBarry Smith     }
4264b9ad928SBarry Smith 
4273f457be1SHong Zhang     /* grab the parallel matrix and put it into processors of a subcomminicator */
428f664ae05SHong Zhang     /*--------------------------------------------------------------------------*/
429f664ae05SHong Zhang     ierr = VecGetLocalSize(red->ysub,&mlocal_sub);CHKERRQ(ierr);
430*0ae51fcdSHong Zhang     ierr = MatGetRedundantMatrix_AIJ(pc->pmat,red->nsubcomm,red->subcomm,mlocal_sub,reuse,&red->pmats_sub);CHKERRQ(ierr);
4313f457be1SHong Zhang     /* tell PC of the subcommunicator its operators */
432*0ae51fcdSHong Zhang     ierr = PCSetOperators(red->pc,red->pmats_sub,red->pmats_sub,str);CHKERRQ(ierr);
4334b9ad928SBarry Smith   } else {
4344b9ad928SBarry Smith     ierr = PCSetOperators(red->pc,pc->mat,pc->pmat,pc->flag);CHKERRQ(ierr);
4354b9ad928SBarry Smith   }
4364b9ad928SBarry Smith   ierr = PCSetFromOptions(red->pc);CHKERRQ(ierr);
4374b9ad928SBarry Smith   ierr = PCSetUp(red->pc);CHKERRQ(ierr);
4384b9ad928SBarry Smith   PetscFunctionReturn(0);
4394b9ad928SBarry Smith }
4404b9ad928SBarry Smith 
4414b9ad928SBarry Smith #undef __FUNCT__
4424b9ad928SBarry Smith #define __FUNCT__ "PCApply_Redundant"
4436849ba73SBarry Smith static PetscErrorCode PCApply_Redundant(PC pc,Vec x,Vec y)
4444b9ad928SBarry Smith {
4454b9ad928SBarry Smith   PC_Redundant   *red = (PC_Redundant*)pc->data;
446dfbe8321SBarry Smith   PetscErrorCode ierr;
4473f457be1SHong Zhang   PetscScalar    *array;
4484b9ad928SBarry Smith 
4494b9ad928SBarry Smith   PetscFunctionBegin;
4503f457be1SHong Zhang   /* scatter x to xdup */
4513f457be1SHong Zhang   ierr = VecScatterBegin(x,red->xdup,INSERT_VALUES,SCATTER_FORWARD,red->scatterin);CHKERRQ(ierr);
4523f457be1SHong Zhang   ierr = VecScatterEnd(x,red->xdup,INSERT_VALUES,SCATTER_FORWARD,red->scatterin);CHKERRQ(ierr);
4533f457be1SHong Zhang 
4543f457be1SHong Zhang   /* place xdup's local array into xsub */
4553f457be1SHong Zhang   ierr = VecGetArray(red->xdup,&array);CHKERRQ(ierr);
4563f457be1SHong Zhang   ierr = VecPlaceArray(red->xsub,(const PetscScalar*)array);CHKERRQ(ierr);
4574b9ad928SBarry Smith 
4584b9ad928SBarry Smith   /* apply preconditioner on each processor */
4593f457be1SHong Zhang   ierr = PCApply(red->pc,red->xsub,red->ysub);CHKERRQ(ierr);
4603f457be1SHong Zhang   ierr = VecResetArray(red->xsub);CHKERRQ(ierr);
4613f457be1SHong Zhang   ierr = VecRestoreArray(red->xdup,&array);CHKERRQ(ierr);
4624b9ad928SBarry Smith 
4633f457be1SHong Zhang   /* place ysub's local array into ydup */
4643f457be1SHong Zhang   ierr = VecGetArray(red->ysub,&array);CHKERRQ(ierr);
4653f457be1SHong Zhang   ierr = VecPlaceArray(red->ydup,(const PetscScalar*)array);CHKERRQ(ierr);
4663f457be1SHong Zhang 
4673f457be1SHong Zhang   /* scatter ydup to y */
4683f457be1SHong Zhang   ierr = VecScatterBegin(red->ydup,y,INSERT_VALUES,SCATTER_FORWARD,red->scatterout);CHKERRQ(ierr);
4693f457be1SHong Zhang   ierr = VecScatterEnd(red->ydup,y,INSERT_VALUES,SCATTER_FORWARD,red->scatterout);CHKERRQ(ierr);
4703f457be1SHong Zhang   ierr = VecResetArray(red->ydup);CHKERRQ(ierr);
4713f457be1SHong Zhang   ierr = VecRestoreArray(red->ysub,&array);CHKERRQ(ierr);
4724b9ad928SBarry Smith   PetscFunctionReturn(0);
4734b9ad928SBarry Smith }
4744b9ad928SBarry Smith 
4754b9ad928SBarry Smith #undef __FUNCT__
4764b9ad928SBarry Smith #define __FUNCT__ "PCDestroy_Redundant"
4776849ba73SBarry Smith static PetscErrorCode PCDestroy_Redundant(PC pc)
4784b9ad928SBarry Smith {
4794b9ad928SBarry Smith   PC_Redundant   *red = (PC_Redundant*)pc->data;
480dfbe8321SBarry Smith   PetscErrorCode ierr;
4814b9ad928SBarry Smith 
4824b9ad928SBarry Smith   PetscFunctionBegin;
4834b9ad928SBarry Smith   if (red->scatterin)  {ierr = VecScatterDestroy(red->scatterin);CHKERRQ(ierr);}
4844b9ad928SBarry Smith   if (red->scatterout) {ierr = VecScatterDestroy(red->scatterout);CHKERRQ(ierr);}
4853f457be1SHong Zhang   if (red->ysub)       {ierr = VecDestroy(red->ysub);CHKERRQ(ierr);}
4863f457be1SHong Zhang   if (red->xsub)       {ierr = VecDestroy(red->xsub);CHKERRQ(ierr);}
4873f457be1SHong Zhang   if (red->xdup)       {ierr = VecDestroy(red->xdup);CHKERRQ(ierr);}
4883f457be1SHong Zhang   if (red->ydup)       {ierr = VecDestroy(red->ydup);CHKERRQ(ierr);}
4893f457be1SHong Zhang   if (red->pmats_sub) {
4903f457be1SHong Zhang     ierr = MatDestroy(red->pmats_sub);CHKERRQ(ierr);
4913f457be1SHong Zhang   }
4923f457be1SHong Zhang 
4934b9ad928SBarry Smith   if (red->pmats) {
4944b9ad928SBarry Smith     ierr = MatDestroyMatrices(1,&red->pmats);CHKERRQ(ierr);
4954b9ad928SBarry Smith   }
4964b9ad928SBarry Smith   ierr = PCDestroy(red->pc);CHKERRQ(ierr);
4974b9ad928SBarry Smith   ierr = PetscFree(red);CHKERRQ(ierr);
4984b9ad928SBarry Smith   PetscFunctionReturn(0);
4994b9ad928SBarry Smith }
5004b9ad928SBarry Smith 
5014b9ad928SBarry Smith #undef __FUNCT__
5024b9ad928SBarry Smith #define __FUNCT__ "PCSetFromOptions_Redundant"
5036849ba73SBarry Smith static PetscErrorCode PCSetFromOptions_Redundant(PC pc)
5044b9ad928SBarry Smith {
5054b9ad928SBarry Smith   PetscFunctionBegin;
5064b9ad928SBarry Smith   PetscFunctionReturn(0);
5074b9ad928SBarry Smith }
5084b9ad928SBarry Smith 
5094b9ad928SBarry Smith EXTERN_C_BEGIN
5104b9ad928SBarry Smith #undef __FUNCT__
5114b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter_Redundant"
512dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantSetScatter_Redundant(PC pc,VecScatter in,VecScatter out)
5134b9ad928SBarry Smith {
5144b9ad928SBarry Smith   PC_Redundant   *red = (PC_Redundant*)pc->data;
515dfbe8321SBarry Smith   PetscErrorCode ierr;
5164b9ad928SBarry Smith 
5174b9ad928SBarry Smith   PetscFunctionBegin;
5184b9ad928SBarry Smith   red->scatterin  = in;
5194b9ad928SBarry Smith   red->scatterout = out;
5204b9ad928SBarry Smith   ierr = PetscObjectReference((PetscObject)in);CHKERRQ(ierr);
5214b9ad928SBarry Smith   ierr = PetscObjectReference((PetscObject)out);CHKERRQ(ierr);
5224b9ad928SBarry Smith   PetscFunctionReturn(0);
5234b9ad928SBarry Smith }
5244b9ad928SBarry Smith EXTERN_C_END
5254b9ad928SBarry Smith 
5264b9ad928SBarry Smith #undef __FUNCT__
5274b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter"
5284b9ad928SBarry Smith /*@
5294b9ad928SBarry Smith    PCRedundantSetScatter - Sets the scatter used to copy values into the
5304b9ad928SBarry Smith      redundant local solve and the scatter to move them back into the global
5314b9ad928SBarry Smith      vector.
5324b9ad928SBarry Smith 
5334b9ad928SBarry Smith    Collective on PC
5344b9ad928SBarry Smith 
5354b9ad928SBarry Smith    Input Parameters:
5364b9ad928SBarry Smith +  pc - the preconditioner context
5374b9ad928SBarry Smith .  in - the scatter to move the values in
5384b9ad928SBarry Smith -  out - the scatter to move them out
5394b9ad928SBarry Smith 
5404b9ad928SBarry Smith    Level: advanced
5414b9ad928SBarry Smith 
5424b9ad928SBarry Smith .keywords: PC, redundant solve
5434b9ad928SBarry Smith @*/
544dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantSetScatter(PC pc,VecScatter in,VecScatter out)
5454b9ad928SBarry Smith {
546dfbe8321SBarry Smith   PetscErrorCode ierr,(*f)(PC,VecScatter,VecScatter);
5474b9ad928SBarry Smith 
5484b9ad928SBarry Smith   PetscFunctionBegin;
5494482741eSBarry Smith   PetscValidHeaderSpecific(pc,PC_COOKIE,1);
5504482741eSBarry Smith   PetscValidHeaderSpecific(in,VEC_SCATTER_COOKIE,2);
5514482741eSBarry Smith   PetscValidHeaderSpecific(out,VEC_SCATTER_COOKIE,3);
5524b9ad928SBarry Smith   ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantSetScatter_C",(void (**)(void))&f);CHKERRQ(ierr);
5534b9ad928SBarry Smith   if (f) {
5544b9ad928SBarry Smith     ierr = (*f)(pc,in,out);CHKERRQ(ierr);
5554b9ad928SBarry Smith   }
5564b9ad928SBarry Smith   PetscFunctionReturn(0);
5574b9ad928SBarry Smith }
5584b9ad928SBarry Smith 
5594b9ad928SBarry Smith EXTERN_C_BEGIN
5604b9ad928SBarry Smith #undef __FUNCT__
5614b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetPC_Redundant"
562dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetPC_Redundant(PC pc,PC *innerpc)
5634b9ad928SBarry Smith {
5644b9ad928SBarry Smith   PC_Redundant *red = (PC_Redundant*)pc->data;
5654b9ad928SBarry Smith 
5664b9ad928SBarry Smith   PetscFunctionBegin;
5674b9ad928SBarry Smith   *innerpc = red->pc;
5684b9ad928SBarry Smith   PetscFunctionReturn(0);
5694b9ad928SBarry Smith }
5704b9ad928SBarry Smith EXTERN_C_END
5714b9ad928SBarry Smith 
5724b9ad928SBarry Smith #undef __FUNCT__
5734b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetPC"
5744b9ad928SBarry Smith /*@
5754b9ad928SBarry Smith    PCRedundantGetPC - Gets the sequential PC created by the redundant PC.
5764b9ad928SBarry Smith 
5774b9ad928SBarry Smith    Not Collective
5784b9ad928SBarry Smith 
5794b9ad928SBarry Smith    Input Parameter:
5804b9ad928SBarry Smith .  pc - the preconditioner context
5814b9ad928SBarry Smith 
5824b9ad928SBarry Smith    Output Parameter:
5834b9ad928SBarry Smith .  innerpc - the sequential PC
5844b9ad928SBarry Smith 
5854b9ad928SBarry Smith    Level: advanced
5864b9ad928SBarry Smith 
5874b9ad928SBarry Smith .keywords: PC, redundant solve
5884b9ad928SBarry Smith @*/
589dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetPC(PC pc,PC *innerpc)
5904b9ad928SBarry Smith {
591dfbe8321SBarry Smith   PetscErrorCode ierr,(*f)(PC,PC*);
5924b9ad928SBarry Smith 
5934b9ad928SBarry Smith   PetscFunctionBegin;
5944482741eSBarry Smith   PetscValidHeaderSpecific(pc,PC_COOKIE,1);
5954482741eSBarry Smith   PetscValidPointer(innerpc,2);
5964b9ad928SBarry Smith   ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantGetPC_C",(void (**)(void))&f);CHKERRQ(ierr);
5974b9ad928SBarry Smith   if (f) {
5984b9ad928SBarry Smith     ierr = (*f)(pc,innerpc);CHKERRQ(ierr);
5994b9ad928SBarry Smith   }
6004b9ad928SBarry Smith   PetscFunctionReturn(0);
6014b9ad928SBarry Smith }
6024b9ad928SBarry Smith 
6034b9ad928SBarry Smith EXTERN_C_BEGIN
6044b9ad928SBarry Smith #undef __FUNCT__
6054b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators_Redundant"
606dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetOperators_Redundant(PC pc,Mat *mat,Mat *pmat)
6074b9ad928SBarry Smith {
6084b9ad928SBarry Smith   PC_Redundant *red = (PC_Redundant*)pc->data;
6094b9ad928SBarry Smith 
6104b9ad928SBarry Smith   PetscFunctionBegin;
6114b9ad928SBarry Smith   if (mat)  *mat  = red->pmats[0];
6124b9ad928SBarry Smith   if (pmat) *pmat = red->pmats[0];
6134b9ad928SBarry Smith   PetscFunctionReturn(0);
6144b9ad928SBarry Smith }
6154b9ad928SBarry Smith EXTERN_C_END
6164b9ad928SBarry Smith 
6174b9ad928SBarry Smith #undef __FUNCT__
6184b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators"
6194b9ad928SBarry Smith /*@
6204b9ad928SBarry Smith    PCRedundantGetOperators - gets the sequential matrix and preconditioner matrix
6214b9ad928SBarry Smith 
6224b9ad928SBarry Smith    Not Collective
6234b9ad928SBarry Smith 
6244b9ad928SBarry Smith    Input Parameter:
6254b9ad928SBarry Smith .  pc - the preconditioner context
6264b9ad928SBarry Smith 
6274b9ad928SBarry Smith    Output Parameters:
6284b9ad928SBarry Smith +  mat - the matrix
6294b9ad928SBarry Smith -  pmat - the (possibly different) preconditioner matrix
6304b9ad928SBarry Smith 
6314b9ad928SBarry Smith    Level: advanced
6324b9ad928SBarry Smith 
6334b9ad928SBarry Smith .keywords: PC, redundant solve
6344b9ad928SBarry Smith @*/
635dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCRedundantGetOperators(PC pc,Mat *mat,Mat *pmat)
6364b9ad928SBarry Smith {
637dfbe8321SBarry Smith   PetscErrorCode ierr,(*f)(PC,Mat*,Mat*);
6384b9ad928SBarry Smith 
6394b9ad928SBarry Smith   PetscFunctionBegin;
6404482741eSBarry Smith   PetscValidHeaderSpecific(pc,PC_COOKIE,1);
6414482741eSBarry Smith   if (mat)  PetscValidPointer(mat,2);
6424482741eSBarry Smith   if (pmat) PetscValidPointer(pmat,3);
6434b9ad928SBarry Smith   ierr = PetscObjectQueryFunction((PetscObject)pc,"PCRedundantGetOperators_C",(void (**)(void))&f);CHKERRQ(ierr);
6444b9ad928SBarry Smith   if (f) {
6454b9ad928SBarry Smith     ierr = (*f)(pc,mat,pmat);CHKERRQ(ierr);
6464b9ad928SBarry Smith   }
6474b9ad928SBarry Smith   PetscFunctionReturn(0);
6484b9ad928SBarry Smith }
6494b9ad928SBarry Smith 
6504b9ad928SBarry Smith /* -------------------------------------------------------------------------------------*/
65137a17b4dSBarry Smith /*MC
65237a17b4dSBarry Smith      PCREDUNDANT - Runs a preconditioner for the entire problem on each processor
65337a17b4dSBarry Smith 
65437a17b4dSBarry Smith 
65537a17b4dSBarry Smith      Options for the redundant preconditioners can be set with -redundant_pc_xxx
65637a17b4dSBarry Smith 
65737a17b4dSBarry Smith    Level: intermediate
65837a17b4dSBarry Smith 
65937a17b4dSBarry Smith 
66037a17b4dSBarry Smith .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PCRedundantSetScatter(),
66137a17b4dSBarry Smith            PCRedundantGetPC(), PCRedundantGetOperators()
66237a17b4dSBarry Smith 
66337a17b4dSBarry Smith M*/
66437a17b4dSBarry Smith 
6654b9ad928SBarry Smith EXTERN_C_BEGIN
6664b9ad928SBarry Smith #undef __FUNCT__
6674b9ad928SBarry Smith #define __FUNCT__ "PCCreate_Redundant"
668dba47a55SKris Buschelman PetscErrorCode PETSCKSP_DLLEXPORT PCCreate_Redundant(PC pc)
6694b9ad928SBarry Smith {
670dfbe8321SBarry Smith   PetscErrorCode ierr;
6714b9ad928SBarry Smith   PC_Redundant   *red;
672e060cb09SBarry Smith   const char     *prefix;
6734b9ad928SBarry Smith 
6743f457be1SHong Zhang   PetscInt       nsubcomm,np_subcomm,nleftover,i,j,color;
6753f457be1SHong Zhang   PetscMPIInt    rank,size,subrank,*subsize;
6763f457be1SHong Zhang   MPI_Comm       subcomm;
6773f457be1SHong Zhang   PetscMPIInt    duprank;
6783f457be1SHong Zhang   PetscMPIInt    rank_dup,size_dup;
6793f457be1SHong Zhang   MPI_Comm       dupcomm;
6803f457be1SHong Zhang 
6814b9ad928SBarry Smith   PetscFunctionBegin;
6824b9ad928SBarry Smith   ierr = PetscNew(PC_Redundant,&red);CHKERRQ(ierr);
68352e6d16bSBarry Smith   ierr = PetscLogObjectMemory(pc,sizeof(PC_Redundant));CHKERRQ(ierr);
6844b9ad928SBarry Smith   red->useparallelmat   = PETSC_TRUE;
6854b9ad928SBarry Smith 
6863f457be1SHong Zhang   ierr = MPI_Comm_rank(pc->comm,&rank);CHKERRQ(ierr);
6873f457be1SHong Zhang   ierr = MPI_Comm_size(pc->comm,&size);CHKERRQ(ierr);
6883f457be1SHong Zhang   nsubcomm = size;
6893f457be1SHong Zhang   ierr = PetscOptionsGetInt(PETSC_NULL,"-nsubcomm",&nsubcomm,PETSC_NULL);CHKERRQ(ierr);
6903f457be1SHong Zhang   if (nsubcomm > size) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE, "Num of subcommunicators %D cannot be larger than MPI_Comm_size %D",nsubcomm,size);
6913f457be1SHong Zhang 
6923f457be1SHong Zhang   /* get size of each subcommunicators */
6933f457be1SHong Zhang   ierr = PetscMalloc((1+nsubcomm)*sizeof(PetscMPIInt),&subsize);CHKERRQ(ierr);
6943f457be1SHong Zhang   np_subcomm = size/nsubcomm;
6953f457be1SHong Zhang   nleftover  = size - nsubcomm*np_subcomm;
6963f457be1SHong Zhang   for (i=0; i<nsubcomm; i++){
6973f457be1SHong Zhang     subsize[i] = np_subcomm;
6983f457be1SHong Zhang     if (i<nleftover) subsize[i]++;
6993f457be1SHong Zhang   }
7003f457be1SHong Zhang 
7013f457be1SHong Zhang   /* find color for this proc */
7023f457be1SHong Zhang   color   = rank%nsubcomm;
7033f457be1SHong Zhang   subrank = rank/nsubcomm;
7043f457be1SHong Zhang 
7053f457be1SHong Zhang   ierr = MPI_Comm_split(pc->comm,color,subrank,&subcomm);CHKERRQ(ierr);
7063f457be1SHong Zhang   red->subcomm  = subcomm;
7073f457be1SHong Zhang   red->color    = color;
7083f457be1SHong Zhang   red->nsubcomm = nsubcomm;
7093f457be1SHong Zhang 
7103f457be1SHong Zhang   j = 0; duprank = 0;
7113f457be1SHong Zhang   for (i=0; i<nsubcomm; i++){
7123f457be1SHong Zhang     if (j == color){
7133f457be1SHong Zhang       duprank += subrank;
7143f457be1SHong Zhang       break;
7153f457be1SHong Zhang     }
7163f457be1SHong Zhang     duprank += subsize[i]; j++;
7173f457be1SHong Zhang   }
7183f457be1SHong Zhang   /*
7193f457be1SHong Zhang   ierr = PetscSynchronizedPrintf(pc->comm, "[%d] color %d, subrank %d, duprank %d\n",rank,color,subrank,duprank);
7203f457be1SHong Zhang   ierr = PetscSynchronizedFlush(pc->comm);CHKERRQ(ierr);
7213f457be1SHong Zhang   */
7223f457be1SHong Zhang 
7233f457be1SHong Zhang   ierr = MPI_Comm_split(pc->comm,0,duprank,&dupcomm);CHKERRQ(ierr);
7243f457be1SHong Zhang   ierr = MPI_Comm_rank(dupcomm,&rank_dup);CHKERRQ(ierr);
7253f457be1SHong Zhang   ierr = MPI_Comm_size(dupcomm,&size_dup);CHKERRQ(ierr);
7263f457be1SHong Zhang   /*
7273f457be1SHong Zhang   ierr = PetscSynchronizedPrintf(pc->comm, "[%d] duprank %d\n",rank,duprank);
7283f457be1SHong Zhang   ierr = PetscSynchronizedFlush(pc->comm);CHKERRQ(ierr);
7293f457be1SHong Zhang   */
7303f457be1SHong Zhang   red->dupcomm = dupcomm;
7313f457be1SHong Zhang   ierr = PetscFree(subsize);CHKERRQ(ierr);
7323f457be1SHong Zhang 
7334b9ad928SBarry Smith   /* create the sequential PC that each processor has copy of */
7343f457be1SHong Zhang   ierr = PCCreate(subcomm,&red->pc);CHKERRQ(ierr);
7354b9ad928SBarry Smith   ierr = PCSetType(red->pc,PCLU);CHKERRQ(ierr);
7364b9ad928SBarry Smith   ierr = PCGetOptionsPrefix(pc,&prefix);CHKERRQ(ierr);
7374b9ad928SBarry Smith   ierr = PCSetOptionsPrefix(red->pc,prefix);CHKERRQ(ierr);
7384b9ad928SBarry Smith   ierr = PCAppendOptionsPrefix(red->pc,"redundant_");CHKERRQ(ierr);
7394b9ad928SBarry Smith 
7404b9ad928SBarry Smith   pc->ops->apply             = PCApply_Redundant;
7414b9ad928SBarry Smith   pc->ops->applytranspose    = 0;
7424b9ad928SBarry Smith   pc->ops->setup             = PCSetUp_Redundant;
7434b9ad928SBarry Smith   pc->ops->destroy           = PCDestroy_Redundant;
7444b9ad928SBarry Smith   pc->ops->setfromoptions    = PCSetFromOptions_Redundant;
7454b9ad928SBarry Smith   pc->ops->setuponblocks     = 0;
7464b9ad928SBarry Smith   pc->ops->view              = PCView_Redundant;
7474b9ad928SBarry Smith   pc->ops->applyrichardson   = 0;
7484b9ad928SBarry Smith 
7494b9ad928SBarry Smith   pc->data     = (void*)red;
7504b9ad928SBarry Smith 
7514b9ad928SBarry Smith   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantSetScatter_C","PCRedundantSetScatter_Redundant",
7524b9ad928SBarry Smith                     PCRedundantSetScatter_Redundant);CHKERRQ(ierr);
7534b9ad928SBarry Smith   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantGetPC_C","PCRedundantGetPC_Redundant",
7544b9ad928SBarry Smith                     PCRedundantGetPC_Redundant);CHKERRQ(ierr);
7554b9ad928SBarry Smith   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCRedundantGetOperators_C","PCRedundantGetOperators_Redundant",
7564b9ad928SBarry Smith                     PCRedundantGetOperators_Redundant);CHKERRQ(ierr);
7574b9ad928SBarry Smith 
7584b9ad928SBarry Smith   PetscFunctionReturn(0);
7594b9ad928SBarry Smith }
7604b9ad928SBarry Smith EXTERN_C_END
761