xref: /petsc/src/mat/impls/baij/mpi/mmbaij.c (revision 04f1ad800057a4f24d0314e6009435793918095d)
1bba1ac68SSatish Balay /*$Id: mmbaij.c,v 1.46 2001/09/25 00:31:36 balay Exp $*/
28016bdd1SSatish Balay 
38016bdd1SSatish Balay /*
4d9653453SSatish Balay    Support for the parallel BAIJ matrix vector multiply
58016bdd1SSatish Balay */
670f55243SBarry Smith #include "src/mat/impls/baij/mpi/mpibaij.h"
78016bdd1SSatish Balay #include "src/vec/vecimpl.h"
8bba1ac68SSatish Balay 
9bba1ac68SSatish Balay EXTERN int MatSetValuesBlocked_SeqBAIJ(Mat,int,int*,int,int*,PetscScalar*,InsertMode);
108016bdd1SSatish Balay 
114a2ae208SSatish Balay #undef __FUNCT__
124a2ae208SSatish Balay #define __FUNCT__ "MatSetUpMultiply_MPIBAIJ"
13d9653453SSatish Balay int MatSetUpMultiply_MPIBAIJ(Mat mat)
148016bdd1SSatish Balay {
15d9653453SSatish Balay   Mat_MPIBAIJ        *baij = (Mat_MPIBAIJ*)mat->data;
16d9653453SSatish Balay   Mat_SeqBAIJ        *B = (Mat_SeqBAIJ*)(baij->B->data);
17d9653453SSatish Balay   int                Nbs = baij->Nbs,i,j,*indices,*aj = B->j,ierr,ec = 0,*garray;
183d3cf644SBarry Smith   int                bs = baij->bs,*stmp;
198016bdd1SSatish Balay   IS                 from,to;
208016bdd1SSatish Balay   Vec                gvec;
21aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
220f5bd95cSBarry Smith   PetscTable         gid1_lid1;
230f5bd95cSBarry Smith   PetscTablePosition tpos;
2473a2e727SSatish Balay   int                gid,lid;
2573a2e727SSatish Balay #endif
268016bdd1SSatish Balay 
273a40ed3dSBarry Smith   PetscFunctionBegin;
2873a2e727SSatish Balay 
29aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
3073a2e727SSatish Balay   /* use a table - Mark Adams */
31273d9f13SBarry Smith   ierr = PetscTableCreate(B->mbs,&gid1_lid1);CHKERRQ(ierr);
3273a2e727SSatish Balay   for (i=0; i<B->mbs; i++) {
3373a2e727SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
34fa46199cSSatish Balay       int data,gid1 = aj[B->i[i]+j] + 1;
350f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&data) ;CHKERRQ(ierr);
36fa46199cSSatish Balay       if (!data) {
3773a2e727SSatish Balay         /* one based table */
380f5bd95cSBarry Smith         ierr = PetscTableAdd(gid1_lid1,gid1,++ec);CHKERRQ(ierr);
3973a2e727SSatish Balay       }
4073a2e727SSatish Balay     }
4173a2e727SSatish Balay   }
4273a2e727SSatish Balay   /* form array of columns we need */
43b0a32e0cSBarry Smith   ierr = PetscMalloc((ec+1)*sizeof(int),&garray);CHKERRQ(ierr);
440f5bd95cSBarry Smith   ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
4573a2e727SSatish Balay   while (tpos) {
460f5bd95cSBarry Smith     ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
4773a2e727SSatish Balay     gid--; lid--;
4873a2e727SSatish Balay     garray[lid] = gid;
4973a2e727SSatish Balay   }
500064e2bbSSatish Balay   ierr = PetscSortInt(ec,garray);CHKERRQ(ierr);
510064e2bbSSatish Balay   /* qsort(garray, ec, sizeof(int), intcomparcarc); */
520f5bd95cSBarry Smith   ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
5373a2e727SSatish Balay   for (i=0; i<ec; i++) {
540f5bd95cSBarry Smith     ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1);CHKERRQ(ierr);
5573a2e727SSatish Balay   }
5673a2e727SSatish Balay   /* compact out the extra columns in B */
5773a2e727SSatish Balay   for (i=0; i<B->mbs; i++) {
5873a2e727SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
5973a2e727SSatish Balay       int gid1 = aj[B->i[i] + j] + 1;
600f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
61fa46199cSSatish Balay       lid --;
6273a2e727SSatish Balay       aj[B->i[i]+j] = lid;
6373a2e727SSatish Balay     }
6473a2e727SSatish Balay   }
6573a2e727SSatish Balay   B->nbs     = ec;
66273d9f13SBarry Smith   baij->B->n = ec*B->bs;
670f5bd95cSBarry Smith   ierr = PetscTableDelete(gid1_lid1);CHKERRQ(ierr);
6873a2e727SSatish Balay   /* Mark Adams */
6973a2e727SSatish Balay #else
70435da068SBarry Smith   /* Make an array as long as the number of columns */
71d9653453SSatish Balay   /* mark those columns that are in baij->B */
72b0a32e0cSBarry Smith   ierr = PetscMalloc((Nbs+1)*sizeof(int),&indices);CHKERRQ(ierr);
73549d3d68SSatish Balay   ierr = PetscMemzero(indices,Nbs*sizeof(int));CHKERRQ(ierr);
74d9653453SSatish Balay   for (i=0; i<B->mbs; i++) {
758016bdd1SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
76d9653453SSatish Balay       if (!indices[aj[B->i[i] + j]]) ec++;
77d9653453SSatish Balay       indices[aj[B->i[i] + j]] = 1;
788016bdd1SSatish Balay     }
798016bdd1SSatish Balay   }
808016bdd1SSatish Balay 
818016bdd1SSatish Balay   /* form array of columns we need */
82b0a32e0cSBarry Smith   ierr = PetscMalloc((ec+1)*sizeof(int),&garray);CHKERRQ(ierr);
838016bdd1SSatish Balay   ec = 0;
84d9653453SSatish Balay   for (i=0; i<Nbs; i++) {
850bdbc534SSatish Balay     if (indices[i]) {
860bdbc534SSatish Balay       garray[ec++] = i;
870bdbc534SSatish Balay     }
888016bdd1SSatish Balay   }
898016bdd1SSatish Balay 
908016bdd1SSatish Balay   /* make indices now point into garray */
918016bdd1SSatish Balay   for (i=0; i<ec; i++) {
92d9653453SSatish Balay     indices[garray[i]] = i;
938016bdd1SSatish Balay   }
948016bdd1SSatish Balay 
958016bdd1SSatish Balay   /* compact out the extra columns in B */
96d9653453SSatish Balay   for (i=0; i<B->mbs; i++) {
978016bdd1SSatish Balay     for (j=0; j<B->ilen[i]; j++) {
98d9653453SSatish Balay       aj[B->i[i] + j] = indices[aj[B->i[i] + j]];
998016bdd1SSatish Balay     }
1008016bdd1SSatish Balay   }
101d9653453SSatish Balay   B->nbs       = ec;
102273d9f13SBarry Smith   baij->B->n   = ec*B->bs;
103606d414cSSatish Balay   ierr = PetscFree(indices);CHKERRQ(ierr);
10473a2e727SSatish Balay #endif
1058016bdd1SSatish Balay 
1068016bdd1SSatish Balay   /* create local vector that is used to scatter into */
107029af93fSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,ec*bs,&baij->lvec);CHKERRQ(ierr);
1088016bdd1SSatish Balay 
109c16cb8f2SBarry Smith   /* create two temporary index sets for building scatter-gather */
1103d3cf644SBarry Smith   for (i=0; i<ec; i++) {
111c16cb8f2SBarry Smith     garray[i] = bs*garray[i];
112c16cb8f2SBarry Smith   }
113029af93fSBarry Smith   ierr = ISCreateBlock(PETSC_COMM_SELF,bs,ec,garray,&from);CHKERRQ(ierr);
1143d3cf644SBarry Smith   for (i=0; i<ec; i++) {
115c16cb8f2SBarry Smith     garray[i] = garray[i]/bs;
116c16cb8f2SBarry Smith   }
117c16cb8f2SBarry Smith 
118b0a32e0cSBarry Smith   ierr = PetscMalloc((ec+1)*sizeof(int),&stmp);CHKERRQ(ierr);
119537820f0SBarry Smith   for (i=0; i<ec; i++) { stmp[i] = bs*i; }
120029af93fSBarry Smith   ierr = ISCreateBlock(PETSC_COMM_SELF,bs,ec,stmp,&to);CHKERRQ(ierr);
121606d414cSSatish Balay   ierr = PetscFree(stmp);CHKERRQ(ierr);
1228016bdd1SSatish Balay 
1238016bdd1SSatish Balay   /* create temporary global vector to generate scatter context */
1248016bdd1SSatish Balay   /* this is inefficient, but otherwise we must do either
1258016bdd1SSatish Balay      1) save garray until the first actual scatter when the vector is known or
1268016bdd1SSatish Balay      2) have another way of generating a scatter context without a vector.*/
127273d9f13SBarry Smith   ierr = VecCreateMPI(mat->comm,mat->n,mat->N,&gvec);CHKERRQ(ierr);
1288016bdd1SSatish Balay 
1298016bdd1SSatish Balay   /* gnerate the scatter context */
130d9653453SSatish Balay   ierr = VecScatterCreate(gvec,from,baij->lvec,to,&baij->Mvctx);CHKERRQ(ierr);
13190f02eecSBarry Smith 
13290f02eecSBarry Smith   /*
13390f02eecSBarry Smith       Post the receives for the first matrix vector product. We sync-chronize after
13490f02eecSBarry Smith     this on the chance that the user immediately calls MatMult() after assemblying
13590f02eecSBarry Smith     the matrix.
13690f02eecSBarry Smith   */
13743a90d84SBarry Smith   ierr = VecScatterPostRecvs(gvec,baij->lvec,INSERT_VALUES,SCATTER_FORWARD,baij->Mvctx);CHKERRQ(ierr);
138ca161407SBarry Smith   ierr = MPI_Barrier(mat->comm);CHKERRQ(ierr);
13990f02eecSBarry Smith 
140b0a32e0cSBarry Smith   PetscLogObjectParent(mat,baij->Mvctx);
141b0a32e0cSBarry Smith   PetscLogObjectParent(mat,baij->lvec);
142b0a32e0cSBarry Smith   PetscLogObjectParent(mat,from);
143b0a32e0cSBarry Smith   PetscLogObjectParent(mat,to);
144d9653453SSatish Balay   baij->garray = garray;
145b0a32e0cSBarry Smith   PetscLogObjectMemory(mat,(ec+1)*sizeof(int));
1468016bdd1SSatish Balay   ierr = ISDestroy(from);CHKERRQ(ierr);
1478016bdd1SSatish Balay   ierr = ISDestroy(to);CHKERRQ(ierr);
148888f2ed8SSatish Balay   ierr = VecDestroy(gvec);CHKERRQ(ierr);
1493a40ed3dSBarry Smith   PetscFunctionReturn(0);
1508016bdd1SSatish Balay }
1518016bdd1SSatish Balay 
1528016bdd1SSatish Balay /*
153d9653453SSatish Balay      Takes the local part of an already assembled MPIBAIJ matrix
1548016bdd1SSatish Balay    and disassembles it. This is to allow new nonzeros into the matrix
1558016bdd1SSatish Balay    that require more communication in the matrix vector multiply.
1568016bdd1SSatish Balay    Thus certain data-structures must be rebuilt.
1578016bdd1SSatish Balay 
1588016bdd1SSatish Balay    Kind of slow! But that's what application programmers get when
1598016bdd1SSatish Balay    they are sloppy.
1608016bdd1SSatish Balay */
1614a2ae208SSatish Balay #undef __FUNCT__
1624a2ae208SSatish Balay #define __FUNCT__ "DisAssemble_MPIBAIJ"
163d9653453SSatish Balay int DisAssemble_MPIBAIJ(Mat A)
1648016bdd1SSatish Balay {
165d9653453SSatish Balay   Mat_MPIBAIJ  *baij = (Mat_MPIBAIJ*)A->data;
166d9653453SSatish Balay   Mat          B = baij->B,Bnew;
167d9653453SSatish Balay   Mat_SeqBAIJ  *Bbaij = (Mat_SeqBAIJ*)B->data;
168273d9f13SBarry Smith   int          ierr,i,j,mbs=Bbaij->mbs,n = A->N,col,*garray=baij->garray;
169bba1ac68SSatish Balay   int          bs2=baij->bs2,*nz,ec,m = A->m;
1703eda8832SBarry Smith   MatScalar    *a = Bbaij->a;
17187828ca2SBarry Smith   PetscScalar  *atmp;
1728016bdd1SSatish Balay 
1733a40ed3dSBarry Smith   PetscFunctionBegin;
1748016bdd1SSatish Balay   /* free stuff related to matrix-vec multiply */
175b0a32e0cSBarry Smith   ierr = VecGetSize(baij->lvec,&ec);CHKERRQ(ierr); /* needed for PetscLogObjectMemory below */
176d9653453SSatish Balay   ierr = VecDestroy(baij->lvec);CHKERRQ(ierr); baij->lvec = 0;
177d9653453SSatish Balay   ierr = VecScatterDestroy(baij->Mvctx);CHKERRQ(ierr); baij->Mvctx = 0;
178d9653453SSatish Balay   if (baij->colmap) {
179aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
1800f5bd95cSBarry Smith     ierr = PetscTableDelete(baij->colmap); baij->colmap = 0;CHKERRQ(ierr);
18148e59246SSatish Balay #else
182606d414cSSatish Balay     ierr = PetscFree(baij->colmap);CHKERRQ(ierr);
183606d414cSSatish Balay     baij->colmap = 0;
184b0a32e0cSBarry Smith     PetscLogObjectMemory(A,-Bbaij->nbs*sizeof(int));
18548e59246SSatish Balay #endif
1868016bdd1SSatish Balay   }
1878016bdd1SSatish Balay 
1888016bdd1SSatish Balay   /* make sure that B is assembled so we can access its values */
1896d4a8577SBarry Smith   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1903eda8832SBarry Smith   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1918016bdd1SSatish Balay 
1928016bdd1SSatish Balay   /* invent new B and copy stuff over */
19382502324SSatish Balay   ierr = PetscMalloc(mbs*sizeof(int),&nz);CHKERRQ(ierr);
194d9653453SSatish Balay   for (i=0; i<mbs; i++) {
195d9653453SSatish Balay     nz[i] = Bbaij->i[i+1]-Bbaij->i[i];
1968016bdd1SSatish Balay   }
197029af93fSBarry Smith   ierr = MatCreateSeqBAIJ(PETSC_COMM_SELF,baij->bs,m,n,0,nz,&Bnew);CHKERRQ(ierr);
198bba1ac68SSatish Balay   ierr = MatSetOption(Bnew,MAT_COLUMN_ORIENTED);CHKERRQ(ierr);
199d9653453SSatish Balay 
2005010ffefSSatish Balay #if defined(PETSC_USE_MAT_SINGLE)
201bba1ac68SSatish Balay   ierr = PetscMalloc(bs2*sizeof(PetscScalar),&atmp);CHKERRQ(ierr);
202bba1ac68SSatish Balay #endif
203bba1ac68SSatish Balay     for (i=0; i<mbs; i++) {
204bba1ac68SSatish Balay       for (j=Bbaij->i[i]; j<Bbaij->i[i+1]; j++) {
205bba1ac68SSatish Balay         col  = garray[Bbaij->j[j]];
206bba1ac68SSatish Balay #if defined(PETSC_USE_MAT_SINGLE)
207bba1ac68SSatish Balay         for (k=0; k<bs2; k++) atmp[k] = a[j*bs2+k];
2083eda8832SBarry Smith #else
2093eda8832SBarry Smith         atmp = a + j*bs2;
2103eda8832SBarry Smith #endif
211bba1ac68SSatish Balay         ierr = MatSetValuesBlocked_SeqBAIJ(Bnew,1,&i,1,&col,atmp,B->insertmode);CHKERRQ(ierr);
2128016bdd1SSatish Balay       }
2138016bdd1SSatish Balay     }
214bba1ac68SSatish Balay   ierr = MatSetOption(Bnew,MAT_ROW_ORIENTED);CHKERRQ(ierr);
215bba1ac68SSatish Balay 
2163eda8832SBarry Smith #if defined(PETSC_USE_MAT_SINGLE)
2173eda8832SBarry Smith   ierr = PetscFree(atmp);CHKERRQ(ierr);
2183eda8832SBarry Smith #endif
219bba1ac68SSatish Balay 
220bba1ac68SSatish Balay   ierr = PetscFree(nz);CHKERRQ(ierr);
221606d414cSSatish Balay   ierr = PetscFree(baij->garray);CHKERRQ(ierr);
222606d414cSSatish Balay   baij->garray = 0;
223b0a32e0cSBarry Smith   PetscLogObjectMemory(A,-ec*sizeof(int));
2248016bdd1SSatish Balay   ierr = MatDestroy(B);CHKERRQ(ierr);
225b0a32e0cSBarry Smith   PetscLogObjectParent(A,Bnew);
226d9653453SSatish Balay   baij->B = Bnew;
2278016bdd1SSatish Balay   A->was_assembled = PETSC_FALSE;
2283a40ed3dSBarry Smith   PetscFunctionReturn(0);
2298016bdd1SSatish Balay }
2308016bdd1SSatish Balay 
231*04f1ad80SBarry Smith /*      ugly stuff added for Glenn someday we should fix this up */
232*04f1ad80SBarry Smith 
233*04f1ad80SBarry Smith int *uglyrmapd = 0,*uglyrmapo = 0;  /* mapping from the local ordering to the "diagonal" and "off-diagonal"
234*04f1ad80SBarry Smith                                       parts of the local matrix */
235*04f1ad80SBarry Smith Vec uglydd = 0,uglyoo = 0;   /* work vectors used to scale the two parts of the local matrix */
236*04f1ad80SBarry Smith 
237*04f1ad80SBarry Smith 
238*04f1ad80SBarry Smith #undef __FUNC__
239*04f1ad80SBarry Smith #define __FUNC__ "MatMPIBAIJDiagonalScaleLocalSetUp"
240*04f1ad80SBarry Smith int MatMPIBAIJDiagonalScaleLocalSetUp(Mat inA,Vec scale)
241*04f1ad80SBarry Smith {
242*04f1ad80SBarry Smith   Mat_MPIBAIJ  *ina = (Mat_MPIBAIJ*) inA->data; /*access private part of matrix */
243*04f1ad80SBarry Smith   Mat_SeqBAIJ  *A = (Mat_SeqBAIJ*)ina->A->data;
244*04f1ad80SBarry Smith   Mat_SeqBAIJ  *B = (Mat_SeqBAIJ*)ina->B->data;
245*04f1ad80SBarry Smith   int          ierr,bs = A->bs,i,n,nt,j,cstart,cend,no,*garray = ina->garray,*lindices;
246*04f1ad80SBarry Smith   int          *r_rmapd,*r_rmapo;
247*04f1ad80SBarry Smith 
248*04f1ad80SBarry Smith   PetscFunctionBegin;
249*04f1ad80SBarry Smith   ierr = MatGetOwnershipRange(inA,&cstart,&cend);CHKERRQ(ierr);
250*04f1ad80SBarry Smith   ierr = MatGetSize(ina->A,PETSC_NULL,&n);CHKERRQ(ierr);
251*04f1ad80SBarry Smith   ierr = PetscMalloc((inA->bmapping->n+1)*sizeof(int),&r_rmapd);CHKERRQ(ierr);
252*04f1ad80SBarry Smith   ierr = PetscMemzero(r_rmapd,inA->bmapping->n*sizeof(int));CHKERRQ(ierr);
253*04f1ad80SBarry Smith   nt   = 0;
254*04f1ad80SBarry Smith   for (i=0; i<inA->bmapping->n; i++) {
255*04f1ad80SBarry Smith     if (inA->bmapping->indices[i]*bs >= cstart && inA->bmapping->indices[i]*bs < cend) {
256*04f1ad80SBarry Smith       nt++;
257*04f1ad80SBarry Smith       r_rmapd[i] = inA->bmapping->indices[i] + 1;
258*04f1ad80SBarry Smith     }
259*04f1ad80SBarry Smith   }
260*04f1ad80SBarry Smith   if (nt*bs != n) SETERRQ2(1,"Hmm nt*bs %d n %d",nt*bs,n);
261*04f1ad80SBarry Smith   ierr = PetscMalloc((n+1)*sizeof(int),&uglyrmapd);CHKERRQ(ierr);
262*04f1ad80SBarry Smith   for (i=0; i<inA->bmapping->n; i++) {
263*04f1ad80SBarry Smith     if (r_rmapd[i]){
264*04f1ad80SBarry Smith       for (j=0; j<bs; j++) {
265*04f1ad80SBarry Smith         uglyrmapd[(r_rmapd[i]-1)*bs+j-cstart] = i*bs + j;
266*04f1ad80SBarry Smith       }
267*04f1ad80SBarry Smith     }
268*04f1ad80SBarry Smith   }
269*04f1ad80SBarry Smith   ierr = PetscFree(r_rmapd);CHKERRQ(ierr);
270*04f1ad80SBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,n,&uglydd);CHKERRQ(ierr);
271*04f1ad80SBarry Smith 
272*04f1ad80SBarry Smith   ierr = PetscMalloc((ina->Nbs+1)*sizeof(int),&lindices);CHKERRQ(ierr);
273*04f1ad80SBarry Smith   ierr = PetscMemzero(lindices,ina->Nbs*sizeof(int));CHKERRQ(ierr);
274*04f1ad80SBarry Smith   for (i=0; i<B->nbs; i++) {
275*04f1ad80SBarry Smith     lindices[garray[i]] = i+1;
276*04f1ad80SBarry Smith   }
277*04f1ad80SBarry Smith   no   = inA->bmapping->n - nt;
278*04f1ad80SBarry Smith   ierr = PetscMalloc((inA->bmapping->n+1)*sizeof(int),&r_rmapo);CHKERRQ(ierr);
279*04f1ad80SBarry Smith   ierr = PetscMemzero(r_rmapo,inA->bmapping->n*sizeof(int));CHKERRQ(ierr);
280*04f1ad80SBarry Smith   nt   = 0;
281*04f1ad80SBarry Smith   for (i=0; i<inA->bmapping->n; i++) {
282*04f1ad80SBarry Smith     if (lindices[inA->bmapping->indices[i]]) {
283*04f1ad80SBarry Smith       nt++;
284*04f1ad80SBarry Smith       r_rmapo[i] = lindices[inA->bmapping->indices[i]];
285*04f1ad80SBarry Smith     }
286*04f1ad80SBarry Smith   }
287*04f1ad80SBarry Smith   if (nt > no) SETERRQ2(1,"Hmm nt %d no %d",nt,n);
288*04f1ad80SBarry Smith   ierr = PetscFree(lindices);CHKERRQ(ierr);
289*04f1ad80SBarry Smith   ierr = PetscMalloc((nt*bs+1)*sizeof(int),&uglyrmapo);CHKERRQ(ierr);
290*04f1ad80SBarry Smith   for (i=0; i<inA->bmapping->n; i++) {
291*04f1ad80SBarry Smith     if (r_rmapo[i]){
292*04f1ad80SBarry Smith       for (j=0; j<bs; j++) {
293*04f1ad80SBarry Smith         uglyrmapo[(r_rmapo[i]-1)*bs+j] = i*bs + j;
294*04f1ad80SBarry Smith       }
295*04f1ad80SBarry Smith     }
296*04f1ad80SBarry Smith   }
297*04f1ad80SBarry Smith   ierr = PetscFree(r_rmapo);CHKERRQ(ierr);
298*04f1ad80SBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,nt*bs,&uglyoo);CHKERRQ(ierr);
299*04f1ad80SBarry Smith 
300*04f1ad80SBarry Smith   PetscFunctionReturn(0);
301*04f1ad80SBarry Smith }
302*04f1ad80SBarry Smith 
303*04f1ad80SBarry Smith #undef __FUNC__
304*04f1ad80SBarry Smith #define __FUNC__ "MatMPIBAIJDiagonalScaleLocal"
305*04f1ad80SBarry Smith int MatMPIBAIJDiagonalScaleLocal(Mat A,Vec scale)
306*04f1ad80SBarry Smith {
307*04f1ad80SBarry Smith   Mat_MPIBAIJ  *a = (Mat_MPIBAIJ*) A->data; /*access private part of matrix */
308*04f1ad80SBarry Smith   int          ierr,n,i;
309*04f1ad80SBarry Smith   PetscScalar  *d,*o,*s;
310*04f1ad80SBarry Smith 
311*04f1ad80SBarry Smith   PetscFunctionBegin;
312*04f1ad80SBarry Smith   ierr = VecGetArray(scale,&s);CHKERRQ(ierr);
313*04f1ad80SBarry Smith 
314*04f1ad80SBarry Smith   ierr = VecGetLocalSize(uglydd,&n);CHKERRQ(ierr);
315*04f1ad80SBarry Smith   ierr = VecGetArray(uglydd,&d);CHKERRQ(ierr);
316*04f1ad80SBarry Smith   for (i=0; i<n; i++) {
317*04f1ad80SBarry Smith     d[i] = s[uglyrmapd[i]]; /* copy "diagonal" (true local) portion of scale into dd vector */
318*04f1ad80SBarry Smith   }
319*04f1ad80SBarry Smith   ierr = VecRestoreArray(uglydd,&d);CHKERRQ(ierr);
320*04f1ad80SBarry Smith   /* column scale "diagonal" portion of local matrix */
321*04f1ad80SBarry Smith   ierr = MatDiagonalScale(a->A,PETSC_NULL,uglydd);CHKERRQ(ierr);
322*04f1ad80SBarry Smith 
323*04f1ad80SBarry Smith   ierr = VecGetLocalSize(uglyoo,&n);CHKERRQ(ierr);
324*04f1ad80SBarry Smith   ierr = VecGetArray(uglyoo,&o);CHKERRQ(ierr);
325*04f1ad80SBarry Smith   for (i=0; i<n; i++) {
326*04f1ad80SBarry Smith     o[i] = s[uglyrmapo[i]]; /* copy "off-diagonal" portion of scale into oo vector */
327*04f1ad80SBarry Smith   }
328*04f1ad80SBarry Smith   ierr = VecRestoreArray(scale,&s);CHKERRQ(ierr);
329*04f1ad80SBarry Smith   ierr = VecRestoreArray(uglyoo,&o);CHKERRQ(ierr);
330*04f1ad80SBarry Smith   /* column scale "off-diagonal" portion of local matrix */
331*04f1ad80SBarry Smith   ierr = MatDiagonalScale(a->B,PETSC_NULL,uglyoo);CHKERRQ(ierr);
332*04f1ad80SBarry Smith 
333*04f1ad80SBarry Smith   PetscFunctionReturn(0);
334*04f1ad80SBarry Smith }
335*04f1ad80SBarry Smith 
3368016bdd1SSatish Balay 
3373eda8832SBarry Smith 
338