xref: /petsc/src/mat/impls/aij/mpi/mmaij.c (revision c5bfad50543b83456d5604272280e5873a4d8884)
1be1d678aSKris Buschelman 
28c79f6d3SBarry Smith /*
38c79f6d3SBarry Smith    Support for the parallel AIJ matrix vector multiply
48c79f6d3SBarry Smith */
5c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h>
68c79f6d3SBarry Smith 
74a2ae208SSatish Balay #undef __FUNCT__
84a2ae208SSatish Balay #define __FUNCT__ "MatSetUpMultiply_MPIAIJ"
9dfbe8321SBarry Smith PetscErrorCode MatSetUpMultiply_MPIAIJ(Mat mat)
108c79f6d3SBarry Smith {
1144a69424SLois Curfman McInnes   Mat_MPIAIJ         *aij = (Mat_MPIAIJ*)mat->data;
12ec8511deSBarry Smith   Mat_SeqAIJ         *B = (Mat_SeqAIJ*)(aij->B->data);
136849ba73SBarry Smith   PetscErrorCode     ierr;
14b1d57f15SBarry Smith   PetscInt           i,j,*aj = B->j,ec = 0,*garray;
151eb62cbbSBarry Smith   IS                 from,to;
161eb62cbbSBarry Smith   Vec                gvec;
17ace3abfcSBarry Smith   PetscBool          useblockis;
18aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
190f5bd95cSBarry Smith   PetscTable         gid1_lid1;
200f5bd95cSBarry Smith   PetscTablePosition tpos;
21b1d57f15SBarry Smith   PetscInt           gid,lid;
226f531f54SSatish Balay #else
23d0f46423SBarry Smith   PetscInt           N = mat->cmap->N,*indices;
242066d6f7SSatish Balay #endif
252066d6f7SSatish Balay 
263a40ed3dSBarry Smith   PetscFunctionBegin;
272066d6f7SSatish Balay 
28aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
29*c5bfad50SMark F. Adams   /* use a table */
30e23dfa41SBarry Smith   ierr = PetscTableCreate(aij->B->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr);
31d0f46423SBarry Smith   for (i=0; i<aij->B->rmap->n; i++) {
322066d6f7SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
33b1d57f15SBarry Smith       PetscInt data,gid1 = aj[B->i[i] + j] + 1;
340f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr);
35fa46199cSSatish Balay       if (!data) {
362066d6f7SSatish Balay         /* one based table */
373861aac3SJed Brown         ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr);
382066d6f7SSatish Balay       }
392066d6f7SSatish Balay     }
402066d6f7SSatish Balay   }
412066d6f7SSatish Balay   /* form array of columns we need */
42b1d57f15SBarry Smith   ierr = PetscMalloc((ec+1)*sizeof(PetscInt),&garray);CHKERRQ(ierr);
430f5bd95cSBarry Smith   ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
442066d6f7SSatish Balay   while (tpos) {
450f5bd95cSBarry Smith     ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
46b0a32e0cSBarry Smith     gid--;
47b0a32e0cSBarry Smith     lid--;
482066d6f7SSatish Balay     garray[lid] = gid;
492066d6f7SSatish Balay   }
500064e2bbSSatish Balay   ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */
510f5bd95cSBarry Smith   ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
522066d6f7SSatish Balay   for (i=0; i<ec; i++) {
533861aac3SJed Brown     ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr);
542066d6f7SSatish Balay   }
552066d6f7SSatish Balay   /* compact out the extra columns in B */
56d0f46423SBarry Smith   for (i=0; i<aij->B->rmap->n; i++) {
572066d6f7SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
58b1d57f15SBarry Smith       PetscInt gid1 = aj[B->i[i] + j] + 1;
590f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
60fa46199cSSatish Balay       lid --;
61b3fb0a6cSMatthew Knepley       aj[B->i[i] + j]  = lid;
622066d6f7SSatish Balay     }
632066d6f7SSatish Balay   }
64d0f46423SBarry Smith   aij->B->cmap->n = aij->B->cmap->N = ec;
6526283091SBarry Smith   ierr = PetscLayoutSetUp((aij->B->cmap));CHKERRQ(ierr);
666bc0bbbfSBarry Smith   ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr);
672066d6f7SSatish Balay #else
6811285404SBarry Smith   /* Make an array as long as the number of columns */
691eb62cbbSBarry Smith   /* mark those columns that are in aij->B */
70b1d57f15SBarry Smith   ierr = PetscMalloc((N+1)*sizeof(PetscInt),&indices);CHKERRQ(ierr);
71b1d57f15SBarry Smith   ierr = PetscMemzero(indices,N*sizeof(PetscInt));CHKERRQ(ierr);
72d0f46423SBarry Smith   for (i=0; i<aij->B->rmap->n; i++) {
73d6dfbf8fSBarry Smith     for (j=0; j<B->ilen[i]; j++) {
74bfec09a0SHong Zhang       if (!indices[aj[B->i[i] + j] ]) ec++;
75bfec09a0SHong Zhang       indices[aj[B->i[i] + j] ] = 1;
76416022c9SBarry Smith     }
771eb62cbbSBarry Smith   }
788c79f6d3SBarry Smith 
791eb62cbbSBarry Smith   /* form array of columns we need */
80b1d57f15SBarry Smith   ierr = PetscMalloc((ec+1)*sizeof(PetscInt),&garray);CHKERRQ(ierr);
811eb62cbbSBarry Smith   ec = 0;
821eb62cbbSBarry Smith   for (i=0; i<N; i++) {
831eb62cbbSBarry Smith     if (indices[i]) garray[ec++] = i;
841eb62cbbSBarry Smith   }
851eb62cbbSBarry Smith 
861eb62cbbSBarry Smith   /* make indices now point into garray */
871eb62cbbSBarry Smith   for (i=0; i<ec; i++) {
88bfec09a0SHong Zhang     indices[garray[i]] = i;
891eb62cbbSBarry Smith   }
901eb62cbbSBarry Smith 
911eb62cbbSBarry Smith   /* compact out the extra columns in B */
92d0f46423SBarry Smith   for (i=0; i<aij->B->rmap->n; i++) {
93d6dfbf8fSBarry Smith     for (j=0; j<B->ilen[i]; j++) {
94bfec09a0SHong Zhang       aj[B->i[i] + j] = indices[aj[B->i[i] + j]];
951eb62cbbSBarry Smith     }
96d6dfbf8fSBarry Smith   }
97d0f46423SBarry Smith   aij->B->cmap->n = aij->B->cmap->N = ec;
9826283091SBarry Smith   ierr = PetscLayoutSetUp((aij->B->cmap));CHKERRQ(ierr);
99606d414cSSatish Balay   ierr = PetscFree(indices);CHKERRQ(ierr);
1002066d6f7SSatish Balay #endif
1011eb62cbbSBarry Smith   /* create local vector that is used to scatter into */
102029af93fSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,ec,&aij->lvec);CHKERRQ(ierr);
1031eb62cbbSBarry Smith 
104d6dfbf8fSBarry Smith   /* create two temporary Index sets for build scatter gather */
10503919abeSBarry Smith   /*  check for the special case where blocks are communicated for faster VecScatterXXX */
106a2f3521dSMark F. Adams   useblockis = PETSC_FALSE;
107*c5bfad50SMark F. Adams   if (mat->cmap->bs > 1) {
108*c5bfad50SMark F. Adams     PetscInt bs = mat->cmap->bs,ibs,ga;
10903919abeSBarry Smith     if (!(ec % bs)) {
1103ba34427SBarry Smith       useblockis = PETSC_TRUE;
11103919abeSBarry Smith       for (i=0; i<ec/bs; i++) {
11203919abeSBarry Smith         if ((ga = garray[ibs = i*bs]) % bs) {
11303919abeSBarry Smith           useblockis = PETSC_FALSE;
11403919abeSBarry Smith           break;
11503919abeSBarry Smith         }
11603919abeSBarry Smith         for (j=1; j<bs; j++) {
11703919abeSBarry Smith           if (garray[ibs+j] != ga+j) {
11803919abeSBarry Smith             useblockis = PETSC_FALSE;
11903919abeSBarry Smith             break;
12003919abeSBarry Smith           }
12103919abeSBarry Smith         }
12203919abeSBarry Smith         if (!useblockis) break;
12303919abeSBarry Smith       }
12403919abeSBarry Smith     }
12503919abeSBarry Smith   }
126*c5bfad50SMark F. Adams #if defined(PETSC_USE_DEBUG)
127*c5bfad50SMark F. Adams   i = (PetscInt)useblockis;
128*c5bfad50SMark F. Adams   ierr = MPI_Allreduce(&i,&j,1,MPIU_INT,MPI_MIN,((PetscObject)mat)->comm); CHKERRQ(ierr);
129*c5bfad50SMark F. Adams   if(j!=i) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Use of blocked not consistant (I am usning blocked)");
130*c5bfad50SMark F. Adams #endif
131*c5bfad50SMark F. Adams 
13203919abeSBarry Smith   if (useblockis) {
133*c5bfad50SMark F. Adams     PetscInt *ga,bs = mat->cmap->bs,iec = ec/bs;
134*c5bfad50SMark F. Adams     if(ec%bs)SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"ec=%D bs=%D",ec,bs);
135ae15b995SBarry Smith     ierr = PetscInfo(mat,"Using block index set to define scatter\n");
136*c5bfad50SMark F. Adams     ierr = PetscMalloc(iec*sizeof(PetscInt),&ga);CHKERRQ(ierr);
137e82e9f6bSBarry Smith     for (i=0; i<iec; i++) ga[i] = garray[i*bs]/bs;
138deff0451SBarry Smith     ierr = ISCreateBlock(((PetscObject)mat)->comm,bs,iec,ga,PETSC_OWN_POINTER,&from);CHKERRQ(ierr);
13903919abeSBarry Smith   } else {
14070b3c8c7SBarry Smith     ierr = ISCreateGeneral(((PetscObject)mat)->comm,ec,garray,PETSC_COPY_VALUES,&from);CHKERRQ(ierr);
14103919abeSBarry Smith   }
142*c5bfad50SMark F. Adams 
143029af93fSBarry Smith   ierr = ISCreateStride(PETSC_COMM_SELF,ec,0,1,&to);CHKERRQ(ierr);
1441eb62cbbSBarry Smith 
1451eb62cbbSBarry Smith   /* create temporary global vector to generate scatter context */
146b5eb4454SBarry Smith   /* This does not allocate the array's memory so is efficient */
147778a2246SBarry Smith   ierr = VecCreateMPIWithArray(((PetscObject)mat)->comm,1,mat->cmap->n,mat->cmap->N,PETSC_NULL,&gvec);CHKERRQ(ierr);
1481eb62cbbSBarry Smith 
1492d336d48SLois Curfman McInnes   /* generate the scatter context */
15008480c60SBarry Smith   ierr = VecScatterCreate(gvec,from,aij->lvec,to,&aij->Mvctx);CHKERRQ(ierr);
15152e6d16bSBarry Smith   ierr = PetscLogObjectParent(mat,aij->Mvctx);CHKERRQ(ierr);
15252e6d16bSBarry Smith   ierr = PetscLogObjectParent(mat,aij->lvec);CHKERRQ(ierr);
15352e6d16bSBarry Smith   ierr = PetscLogObjectParent(mat,from);CHKERRQ(ierr);
15452e6d16bSBarry Smith   ierr = PetscLogObjectParent(mat,to);CHKERRQ(ierr);
1559e25ed09SBarry Smith   aij->garray = garray;
15652e6d16bSBarry Smith   ierr = PetscLogObjectMemory(mat,(ec+1)*sizeof(PetscInt));CHKERRQ(ierr);
1576bf464f9SBarry Smith   ierr = ISDestroy(&from);CHKERRQ(ierr);
1586bf464f9SBarry Smith   ierr = ISDestroy(&to);CHKERRQ(ierr);
1596bf464f9SBarry Smith   ierr = VecDestroy(&gvec);CHKERRQ(ierr);
1603a40ed3dSBarry Smith   PetscFunctionReturn(0);
1618c79f6d3SBarry Smith }
1629e25ed09SBarry Smith 
1639e25ed09SBarry Smith 
1644a2ae208SSatish Balay #undef __FUNCT__
165ab9863d7SBarry Smith #define __FUNCT__ "MatDisAssemble_MPIAIJ"
1662493cbb0SBarry Smith /*
1672493cbb0SBarry Smith      Takes the local part of an already assembled MPIAIJ matrix
1682493cbb0SBarry Smith    and disassembles it. This is to allow new nonzeros into the matrix
1692493cbb0SBarry Smith    that require more communication in the matrix vector multiply.
1702493cbb0SBarry Smith    Thus certain data-structures must be rebuilt.
1712493cbb0SBarry Smith 
1722493cbb0SBarry Smith    Kind of slow! But that's what application programmers get when
1732493cbb0SBarry Smith    they are sloppy.
1742493cbb0SBarry Smith */
175ab9863d7SBarry Smith PetscErrorCode MatDisAssemble_MPIAIJ(Mat A)
1762493cbb0SBarry Smith {
1772493cbb0SBarry Smith   Mat_MPIAIJ     *aij = (Mat_MPIAIJ*)A->data;
1782493cbb0SBarry Smith   Mat            B = aij->B,Bnew;
179ec8511deSBarry Smith   Mat_SeqAIJ     *Baij = (Mat_SeqAIJ*)B->data;
180dfbe8321SBarry Smith   PetscErrorCode ierr;
181d0f46423SBarry Smith   PetscInt       i,j,m = B->rmap->n,n = A->cmap->N,col,ct = 0,*garray = aij->garray,*nz,ec;
18287828ca2SBarry Smith   PetscScalar    v;
1832493cbb0SBarry Smith 
1843a40ed3dSBarry Smith   PetscFunctionBegin;
1852493cbb0SBarry Smith   /* free stuff related to matrix-vec multiply */
186b0a32e0cSBarry Smith   ierr = VecGetSize(aij->lvec,&ec);CHKERRQ(ierr); /* needed for PetscLogObjectMemory below */
1875e1f6667SBarry Smith   ierr = VecDestroy(&aij->lvec);CHKERRQ(ierr);
1885e1f6667SBarry Smith   ierr = VecScatterDestroy(&aij->Mvctx);CHKERRQ(ierr);
189464493b3SBarry Smith   if (aij->colmap) {
190aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
1916bc0bbbfSBarry Smith     ierr = PetscTableDestroy(&aij->colmap);CHKERRQ(ierr);
1922066d6f7SSatish Balay #else
193606d414cSSatish Balay     ierr = PetscFree(aij->colmap);CHKERRQ(ierr);
194d0f46423SBarry Smith     ierr = PetscLogObjectMemory(A,-aij->B->cmap->n*sizeof(PetscInt));CHKERRQ(ierr);
1952066d6f7SSatish Balay #endif
196464493b3SBarry Smith   }
1972493cbb0SBarry Smith 
1982493cbb0SBarry Smith   /* make sure that B is assembled so we can access its values */
1996d4a8577SBarry Smith   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
200fe2f2677SBarry Smith   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2012493cbb0SBarry Smith 
2022493cbb0SBarry Smith   /* invent new B and copy stuff over */
203b1d57f15SBarry Smith   ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nz);CHKERRQ(ierr);
20448b35521SBarry Smith   for (i=0; i<m; i++) {
20548b35521SBarry Smith     nz[i] = Baij->i[i+1] - Baij->i[i];
20648b35521SBarry Smith   }
207f69a0ea3SMatthew Knepley   ierr = MatCreate(PETSC_COMM_SELF,&Bnew);CHKERRQ(ierr);
208f69a0ea3SMatthew Knepley   ierr = MatSetSizes(Bnew,m,n,m,n);CHKERRQ(ierr);
209a2f3521dSMark F. Adams   ierr = MatSetBlockSizes(Bnew,A->rmap->bs,A->cmap->bs);CHKERRQ(ierr);
2107adad957SLisandro Dalcin   ierr = MatSetType(Bnew,((PetscObject)B)->type_name);CHKERRQ(ierr);
211f204ca49SKris Buschelman   ierr = MatSeqAIJSetPreallocation(Bnew,0,nz);CHKERRQ(ierr);
2122576faa2SJed Brown   ((Mat_SeqAIJ*)Bnew->data)->nonew = Baij->nonew; /* Inherit insertion error options. */
213606d414cSSatish Balay   ierr = PetscFree(nz);CHKERRQ(ierr);
2142493cbb0SBarry Smith   for (i=0; i<m; i++) {
215bfec09a0SHong Zhang     for (j=Baij->i[i]; j<Baij->i[i+1]; j++) {
216bfec09a0SHong Zhang       col  = garray[Baij->j[ct]];
2172493cbb0SBarry Smith       v    = Baij->a[ct++];
21883271157SBarry Smith       ierr = MatSetValues(Bnew,1,&i,1,&col,&v,B->insertmode);CHKERRQ(ierr);
2192493cbb0SBarry Smith     }
2202493cbb0SBarry Smith   }
221606d414cSSatish Balay   ierr = PetscFree(aij->garray);CHKERRQ(ierr);
22252e6d16bSBarry Smith   ierr = PetscLogObjectMemory(A,-ec*sizeof(PetscInt));CHKERRQ(ierr);
2236bf464f9SBarry Smith   ierr = MatDestroy(&B);CHKERRQ(ierr);
22452e6d16bSBarry Smith   ierr = PetscLogObjectParent(A,Bnew);CHKERRQ(ierr);
2252493cbb0SBarry Smith   aij->B = Bnew;
226227d817aSBarry Smith   A->was_assembled = PETSC_FALSE;
2273a40ed3dSBarry Smith   PetscFunctionReturn(0);
2282493cbb0SBarry Smith }
2292493cbb0SBarry Smith 
2302cd6534aSBarry Smith /*      ugly stuff added for Glenn someday we should fix this up */
2312cd6534aSBarry Smith 
232b1d57f15SBarry Smith static PetscInt *auglyrmapd = 0,*auglyrmapo = 0;  /* mapping from the local ordering to the "diagonal" and "off-diagonal"
2332cd6534aSBarry Smith                                       parts of the local matrix */
2342cd6534aSBarry Smith static Vec auglydd = 0,auglyoo = 0;   /* work vectors used to scale the two parts of the local matrix */
2352cd6534aSBarry Smith 
2362cd6534aSBarry Smith 
2372cd6534aSBarry Smith #undef __FUNCT__
2382cd6534aSBarry Smith #define __FUNCT__ "MatMPIAIJDiagonalScaleLocalSetUp"
239dfbe8321SBarry Smith PetscErrorCode MatMPIAIJDiagonalScaleLocalSetUp(Mat inA,Vec scale)
2402cd6534aSBarry Smith {
2412cd6534aSBarry Smith   Mat_MPIAIJ     *ina = (Mat_MPIAIJ*) inA->data; /*access private part of matrix */
242dfbe8321SBarry Smith   PetscErrorCode ierr;
243b1d57f15SBarry Smith   PetscInt       i,n,nt,cstart,cend,no,*garray = ina->garray,*lindices;
244b1d57f15SBarry Smith   PetscInt       *r_rmapd,*r_rmapo;
2452cd6534aSBarry Smith 
2462cd6534aSBarry Smith   PetscFunctionBegin;
2472cd6534aSBarry Smith   ierr = MatGetOwnershipRange(inA,&cstart,&cend);CHKERRQ(ierr);
2482cd6534aSBarry Smith   ierr = MatGetSize(ina->A,PETSC_NULL,&n);CHKERRQ(ierr);
249992144d0SBarry Smith   ierr = PetscMalloc((inA->rmap->mapping->n+1)*sizeof(PetscInt),&r_rmapd);CHKERRQ(ierr);
250992144d0SBarry Smith   ierr = PetscMemzero(r_rmapd,inA->rmap->mapping->n*sizeof(PetscInt));CHKERRQ(ierr);
2512cd6534aSBarry Smith   nt   = 0;
252992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
253992144d0SBarry Smith     if (inA->rmap->mapping->indices[i] >= cstart && inA->rmap->mapping->indices[i] < cend) {
2542cd6534aSBarry Smith       nt++;
255992144d0SBarry Smith       r_rmapd[i] = inA->rmap->mapping->indices[i] + 1;
2562cd6534aSBarry Smith     }
2572cd6534aSBarry Smith   }
258e32f2f54SBarry Smith   if (nt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Hmm nt %D n %D",nt,n);
259b1d57f15SBarry Smith   ierr = PetscMalloc((n+1)*sizeof(PetscInt),&auglyrmapd);CHKERRQ(ierr);
260992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
2612cd6534aSBarry Smith     if (r_rmapd[i]){
2622cd6534aSBarry Smith       auglyrmapd[(r_rmapd[i]-1)-cstart] = i;
2632cd6534aSBarry Smith     }
2642cd6534aSBarry Smith   }
2652cd6534aSBarry Smith   ierr = PetscFree(r_rmapd);CHKERRQ(ierr);
2662cd6534aSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,n,&auglydd);CHKERRQ(ierr);
2672cd6534aSBarry Smith 
268d0f46423SBarry Smith   ierr = PetscMalloc((inA->cmap->N+1)*sizeof(PetscInt),&lindices);CHKERRQ(ierr);
269d0f46423SBarry Smith   ierr = PetscMemzero(lindices,inA->cmap->N*sizeof(PetscInt));CHKERRQ(ierr);
270d0f46423SBarry Smith   for (i=0; i<ina->B->cmap->n; i++) {
2712cd6534aSBarry Smith     lindices[garray[i]] = i+1;
2722cd6534aSBarry Smith   }
273992144d0SBarry Smith   no   = inA->rmap->mapping->n - nt;
274992144d0SBarry Smith   ierr = PetscMalloc((inA->rmap->mapping->n+1)*sizeof(PetscInt),&r_rmapo);CHKERRQ(ierr);
275992144d0SBarry Smith   ierr = PetscMemzero(r_rmapo,inA->rmap->mapping->n*sizeof(PetscInt));CHKERRQ(ierr);
2762cd6534aSBarry Smith   nt   = 0;
277992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
278992144d0SBarry Smith     if (lindices[inA->rmap->mapping->indices[i]]) {
2792cd6534aSBarry Smith       nt++;
280992144d0SBarry Smith       r_rmapo[i] = lindices[inA->rmap->mapping->indices[i]];
2812cd6534aSBarry Smith     }
2822cd6534aSBarry Smith   }
283e32f2f54SBarry Smith   if (nt > no) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Hmm nt %D no %D",nt,n);
2842cd6534aSBarry Smith   ierr = PetscFree(lindices);CHKERRQ(ierr);
285b1d57f15SBarry Smith   ierr = PetscMalloc((nt+1)*sizeof(PetscInt),&auglyrmapo);CHKERRQ(ierr);
286992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
2872cd6534aSBarry Smith     if (r_rmapo[i]){
2882cd6534aSBarry Smith       auglyrmapo[(r_rmapo[i]-1)] = i;
2892cd6534aSBarry Smith     }
2902cd6534aSBarry Smith   }
2912cd6534aSBarry Smith   ierr = PetscFree(r_rmapo);CHKERRQ(ierr);
2922cd6534aSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,nt,&auglyoo);CHKERRQ(ierr);
2932cd6534aSBarry Smith 
2942cd6534aSBarry Smith   PetscFunctionReturn(0);
2952cd6534aSBarry Smith }
2962cd6534aSBarry Smith 
2972cd6534aSBarry Smith #undef __FUNCT__
2982cd6534aSBarry Smith #define __FUNCT__ "MatMPIAIJDiagonalScaleLocal"
/*
   MatMPIAIJDiagonalScaleLocal - Forwards (A,scale) to whatever routine is
   registered on A under the name "MatDiagonalScaleLocal_C".

   Input Parameters:
+  A     - the matrix
-  scale - the vector passed through unchanged to the registered routine

   Returns 0 on success, otherwise the PETSc error code from the dispatch.
*/
299dfbe8321SBarry Smith PetscErrorCode MatMPIAIJDiagonalScaleLocal(Mat A,Vec scale)
3002cd6534aSBarry Smith {
30192b32695SKris Buschelman   /* This routine should really be abandoned as it duplicates MatDiagonalScaleLocal */
3024ac538c5SBarry Smith   PetscErrorCode ierr;
30392b32695SKris Buschelman 
30492b32695SKris Buschelman   PetscFunctionBegin;
  /* NOTE(review): presumably a no-op when A has no such routine registered -- confirm against PetscTryMethod */
3054ac538c5SBarry Smith   ierr = PetscTryMethod(A,"MatDiagonalScaleLocal_C",(Mat,Vec),(A,scale));CHKERRQ(ierr);
30692b32695SKris Buschelman   PetscFunctionReturn(0);
30792b32695SKris Buschelman }
30892b32695SKris Buschelman 
30992b32695SKris Buschelman EXTERN_C_BEGIN
31092b32695SKris Buschelman #undef __FUNCT__
31192b32695SKris Buschelman #define __FUNCT__ "MatDiagonalScaleLocal_MPIAIJ"
3127087cfbeSBarry Smith PetscErrorCode  MatDiagonalScaleLocal_MPIAIJ(Mat A,Vec scale)
31392b32695SKris Buschelman {
3142cd6534aSBarry Smith   Mat_MPIAIJ     *a = (Mat_MPIAIJ*) A->data; /*access private part of matrix */
315dfbe8321SBarry Smith   PetscErrorCode ierr;
316b1d57f15SBarry Smith   PetscInt       n,i;
3172cd6534aSBarry Smith   PetscScalar    *d,*o,*s;
3182cd6534aSBarry Smith 
3192cd6534aSBarry Smith   PetscFunctionBegin;
3202cd6534aSBarry Smith   if (!auglyrmapd) {
3212cd6534aSBarry Smith     ierr = MatMPIAIJDiagonalScaleLocalSetUp(A,scale);CHKERRQ(ierr);
3222cd6534aSBarry Smith   }
3232cd6534aSBarry Smith 
3241ebc52fbSHong Zhang   ierr = VecGetArray(scale,&s);CHKERRQ(ierr);
3252cd6534aSBarry Smith 
3262cd6534aSBarry Smith   ierr = VecGetLocalSize(auglydd,&n);CHKERRQ(ierr);
3271ebc52fbSHong Zhang   ierr = VecGetArray(auglydd,&d);CHKERRQ(ierr);
3282cd6534aSBarry Smith   for (i=0; i<n; i++) {
3292cd6534aSBarry Smith     d[i] = s[auglyrmapd[i]]; /* copy "diagonal" (true local) portion of scale into dd vector */
3302cd6534aSBarry Smith   }
3311ebc52fbSHong Zhang   ierr = VecRestoreArray(auglydd,&d);CHKERRQ(ierr);
3322cd6534aSBarry Smith   /* column scale "diagonal" portion of local matrix */
3332cd6534aSBarry Smith   ierr = MatDiagonalScale(a->A,PETSC_NULL,auglydd);CHKERRQ(ierr);
3342cd6534aSBarry Smith 
3352cd6534aSBarry Smith   ierr = VecGetLocalSize(auglyoo,&n);CHKERRQ(ierr);
3361ebc52fbSHong Zhang   ierr = VecGetArray(auglyoo,&o);CHKERRQ(ierr);
3372cd6534aSBarry Smith   for (i=0; i<n; i++) {
3382cd6534aSBarry Smith     o[i] = s[auglyrmapo[i]]; /* copy "off-diagonal" portion of scale into oo vector */
3392cd6534aSBarry Smith   }
3401ebc52fbSHong Zhang   ierr = VecRestoreArray(scale,&s);CHKERRQ(ierr);
3411ebc52fbSHong Zhang   ierr = VecRestoreArray(auglyoo,&o);CHKERRQ(ierr);
3422cd6534aSBarry Smith   /* column scale "off-diagonal" portion of local matrix */
3432cd6534aSBarry Smith   ierr = MatDiagonalScale(a->B,PETSC_NULL,auglyoo);CHKERRQ(ierr);
3442cd6534aSBarry Smith 
3452cd6534aSBarry Smith   PetscFunctionReturn(0);
3462cd6534aSBarry Smith }
34792b32695SKris Buschelman EXTERN_C_END
3482cd6534aSBarry Smith 
34948b35521SBarry Smith 
350