xref: /petsc/src/mat/impls/aij/mpi/mmaij.c (revision a3ebf921741f253acd95844bdd6a9601d7f5a522)
1be1d678aSKris Buschelman 
28c79f6d3SBarry Smith /*
38c79f6d3SBarry Smith    Support for the parallel AIJ matrix vector multiply
48c79f6d3SBarry Smith */
5c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h>
6aeda0f58SHong Zhang #include <petsc/private/vecimpl.h>
7af0996ceSBarry Smith #include <petsc/private/isimpl.h>    /* needed because accesses data structure of ISLocalToGlobalMapping directly */
88c79f6d3SBarry Smith 
9dfbe8321SBarry Smith PetscErrorCode MatSetUpMultiply_MPIAIJ(Mat mat)
108c79f6d3SBarry Smith {
1144a69424SLois Curfman McInnes   Mat_MPIAIJ     *aij = (Mat_MPIAIJ*)mat->data;
12ec8511deSBarry Smith   Mat_SeqAIJ     *B   = (Mat_SeqAIJ*)(aij->B->data);
136849ba73SBarry Smith   PetscErrorCode ierr;
14b1d57f15SBarry Smith   PetscInt       i,j,*aj = B->j,ec = 0,*garray;
151eb62cbbSBarry Smith   IS             from,to;
161eb62cbbSBarry Smith   Vec            gvec;
17aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
180f5bd95cSBarry Smith   PetscTable         gid1_lid1;
190f5bd95cSBarry Smith   PetscTablePosition tpos;
20b1d57f15SBarry Smith   PetscInt           gid,lid;
216f531f54SSatish Balay #else
22d0f46423SBarry Smith   PetscInt N = mat->cmap->N,*indices;
232066d6f7SSatish Balay #endif
242066d6f7SSatish Balay 
253a40ed3dSBarry Smith   PetscFunctionBegin;
264b8d542aSHong Zhang   if (!aij->garray) {
27aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
28c5bfad50SMark F. Adams     /* use a table */
29e23dfa41SBarry Smith     ierr = PetscTableCreate(aij->B->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr);
30d0f46423SBarry Smith     for (i=0; i<aij->B->rmap->n; i++) {
312066d6f7SSatish Balay       for (j=0; j<B->ilen[i]; j++) {
32b1d57f15SBarry Smith         PetscInt data,gid1 = aj[B->i[i] + j] + 1;
330f5bd95cSBarry Smith         ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr);
34fa46199cSSatish Balay         if (!data) {
352066d6f7SSatish Balay           /* one based table */
363861aac3SJed Brown           ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr);
372066d6f7SSatish Balay         }
382066d6f7SSatish Balay       }
392066d6f7SSatish Balay     }
402066d6f7SSatish Balay     /* form array of columns we need */
41854ce69bSBarry Smith     ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr);
420f5bd95cSBarry Smith     ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
432066d6f7SSatish Balay     while (tpos) {
440f5bd95cSBarry Smith       ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
45b0a32e0cSBarry Smith       gid--;
46b0a32e0cSBarry Smith       lid--;
472066d6f7SSatish Balay       garray[lid] = gid;
482066d6f7SSatish Balay     }
490064e2bbSSatish Balay     ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */
500f5bd95cSBarry Smith     ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
512066d6f7SSatish Balay     for (i=0; i<ec; i++) {
523861aac3SJed Brown       ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr);
532066d6f7SSatish Balay     }
542066d6f7SSatish Balay     /* compact out the extra columns in B */
55d0f46423SBarry Smith     for (i=0; i<aij->B->rmap->n; i++) {
562066d6f7SSatish Balay       for (j=0; j<B->ilen[i]; j++) {
57b1d57f15SBarry Smith         PetscInt gid1 = aj[B->i[i] + j] + 1;
580f5bd95cSBarry Smith         ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
59fa46199cSSatish Balay         lid--;
60b3fb0a6cSMatthew Knepley         aj[B->i[i] + j] = lid;
612066d6f7SSatish Balay       }
622066d6f7SSatish Balay     }
63d0f46423SBarry Smith     aij->B->cmap->n = aij->B->cmap->N = ec;
64cdce4254SBarry Smith     aij->B->cmap->bs = 1;
652205254eSKarl Rupp 
6626283091SBarry Smith     ierr = PetscLayoutSetUp((aij->B->cmap));CHKERRQ(ierr);
676bc0bbbfSBarry Smith     ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr);
682066d6f7SSatish Balay #else
6911285404SBarry Smith     /* Make an array as long as the number of columns */
701eb62cbbSBarry Smith     /* mark those columns that are in aij->B */
711795a4d1SJed Brown     ierr = PetscCalloc1(N+1,&indices);CHKERRQ(ierr);
72d0f46423SBarry Smith     for (i=0; i<aij->B->rmap->n; i++) {
73d6dfbf8fSBarry Smith       for (j=0; j<B->ilen[i]; j++) {
74bfec09a0SHong Zhang         if (!indices[aj[B->i[i] + j]]) ec++;
75bfec09a0SHong Zhang         indices[aj[B->i[i] + j]] = 1;
76416022c9SBarry Smith       }
771eb62cbbSBarry Smith     }
788c79f6d3SBarry Smith 
791eb62cbbSBarry Smith     /* form array of columns we need */
80854ce69bSBarry Smith     ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr);
811eb62cbbSBarry Smith     ec   = 0;
821eb62cbbSBarry Smith     for (i=0; i<N; i++) {
831eb62cbbSBarry Smith       if (indices[i]) garray[ec++] = i;
841eb62cbbSBarry Smith     }
851eb62cbbSBarry Smith 
861eb62cbbSBarry Smith     /* make indices now point into garray */
871eb62cbbSBarry Smith     for (i=0; i<ec; i++) {
88bfec09a0SHong Zhang       indices[garray[i]] = i;
891eb62cbbSBarry Smith     }
901eb62cbbSBarry Smith 
911eb62cbbSBarry Smith     /* compact out the extra columns in B */
92d0f46423SBarry Smith     for (i=0; i<aij->B->rmap->n; i++) {
93d6dfbf8fSBarry Smith       for (j=0; j<B->ilen[i]; j++) {
94bfec09a0SHong Zhang         aj[B->i[i] + j] = indices[aj[B->i[i] + j]];
951eb62cbbSBarry Smith       }
96d6dfbf8fSBarry Smith     }
97d0f46423SBarry Smith     aij->B->cmap->n = aij->B->cmap->N = ec;
98cd0e7f71SBarry Smith     aij->B->cmap->bs = 1;
992205254eSKarl Rupp 
10026283091SBarry Smith     ierr = PetscLayoutSetUp((aij->B->cmap));CHKERRQ(ierr);
101606d414cSSatish Balay     ierr = PetscFree(indices);CHKERRQ(ierr);
1022066d6f7SSatish Balay #endif
1034b8d542aSHong Zhang   } else {
1044b8d542aSHong Zhang     garray = aij->garray;
1054b8d542aSHong Zhang   }
1064b8d542aSHong Zhang 
1074b8d542aSHong Zhang   if (!aij->lvec) {
1081eb62cbbSBarry Smith     /* create local vector that is used to scatter into */
109029af93fSBarry Smith     ierr = VecCreateSeq(PETSC_COMM_SELF,ec,&aij->lvec);CHKERRQ(ierr);
1104b8d542aSHong Zhang   } else {
1114b8d542aSHong Zhang     ierr = VecGetSize(aij->lvec,&ec);CHKERRQ(ierr);
1124b8d542aSHong Zhang   }
1131eb62cbbSBarry Smith 
114d6dfbf8fSBarry Smith   /* create two temporary Index sets for build scatter gather */
115*a3ebf921SJunchao Zhang   ierr = ISCreateGeneral(PETSC_COMM_SELF,ec,garray,PETSC_COPY_VALUES,&from);CHKERRQ(ierr);
116029af93fSBarry Smith   ierr = ISCreateStride(PETSC_COMM_SELF,ec,0,1,&to);CHKERRQ(ierr);
1171eb62cbbSBarry Smith 
1181eb62cbbSBarry Smith   /* create temporary global vector to generate scatter context */
119b5eb4454SBarry Smith   /* This does not allocate the array's memory so is efficient */
120ce94432eSBarry Smith   ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)mat),1,mat->cmap->n,mat->cmap->N,NULL,&gvec);CHKERRQ(ierr);
1211eb62cbbSBarry Smith 
1222d336d48SLois Curfman McInnes   /* generate the scatter context */
123a78d8160SHong Zhang   if (aij->Mvctx_mpi1_flg) {
12401ad2aeeSHong Zhang     ierr = VecScatterDestroy(&aij->Mvctx_mpi1);CHKERRQ(ierr);
1259448b7f1SJunchao Zhang     ierr = VecScatterCreate(gvec,from,aij->lvec,to,&aij->Mvctx_mpi1);CHKERRQ(ierr);
126803a1b88SHong Zhang     ierr = VecScatterSetType(aij->Mvctx_mpi1,VECSCATTERMPI1);CHKERRQ(ierr);
1274b8d542aSHong Zhang     ierr = PetscLogObjectParent((PetscObject)mat,(PetscObject)aij->Mvctx_mpi1);CHKERRQ(ierr);
1284b8d542aSHong Zhang   } else {
1293f6a6bdaSHong Zhang     ierr = VecScatterDestroy(&aij->Mvctx);CHKERRQ(ierr);
1309448b7f1SJunchao Zhang     ierr = VecScatterCreate(gvec,from,aij->lvec,to,&aij->Mvctx);CHKERRQ(ierr);
1313bb1ff40SBarry Smith     ierr = PetscLogObjectParent((PetscObject)mat,(PetscObject)aij->Mvctx);CHKERRQ(ierr);
1323bb1ff40SBarry Smith     ierr = PetscLogObjectParent((PetscObject)mat,(PetscObject)aij->lvec);CHKERRQ(ierr);
1334b8d542aSHong Zhang     ierr = PetscLogObjectMemory((PetscObject)mat,(ec+1)*sizeof(PetscInt));CHKERRQ(ierr);
1344b8d542aSHong Zhang   }
13567bb5161SHong Zhang   aij->garray = garray;
1364b8d542aSHong Zhang 
1373bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)mat,(PetscObject)from);CHKERRQ(ierr);
1383bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)mat,(PetscObject)to);CHKERRQ(ierr);
1392205254eSKarl Rupp 
1406bf464f9SBarry Smith   ierr = ISDestroy(&from);CHKERRQ(ierr);
1416bf464f9SBarry Smith   ierr = ISDestroy(&to);CHKERRQ(ierr);
1426bf464f9SBarry Smith   ierr = VecDestroy(&gvec);CHKERRQ(ierr);
1433a40ed3dSBarry Smith   PetscFunctionReturn(0);
1448c79f6d3SBarry Smith }
1459e25ed09SBarry Smith 
1462493cbb0SBarry Smith /*
1472493cbb0SBarry Smith      Takes the local part of an already assembled MPIAIJ matrix
1482493cbb0SBarry Smith    and disassembles it. This is to allow new nonzeros into the matrix
1492493cbb0SBarry Smith    that require more communication in the matrix vector multiply.
1502493cbb0SBarry Smith    Thus certain data-structures must be rebuilt.
1512493cbb0SBarry Smith 
1522493cbb0SBarry Smith    Kind of slow! But that's what application programmers get when
1532493cbb0SBarry Smith    they are sloppy.
1542493cbb0SBarry Smith */
155ab9863d7SBarry Smith PetscErrorCode MatDisAssemble_MPIAIJ(Mat A)
1562493cbb0SBarry Smith {
1572493cbb0SBarry Smith   Mat_MPIAIJ     *aij  = (Mat_MPIAIJ*)A->data;
1582493cbb0SBarry Smith   Mat            B     = aij->B,Bnew;
159ec8511deSBarry Smith   Mat_SeqAIJ     *Baij = (Mat_SeqAIJ*)B->data;
160dfbe8321SBarry Smith   PetscErrorCode ierr;
161d0f46423SBarry Smith   PetscInt       i,j,m = B->rmap->n,n = A->cmap->N,col,ct = 0,*garray = aij->garray,*nz,ec;
16287828ca2SBarry Smith   PetscScalar    v;
1632493cbb0SBarry Smith 
1643a40ed3dSBarry Smith   PetscFunctionBegin;
1652493cbb0SBarry Smith   /* free stuff related to matrix-vec multiply */
166b0a32e0cSBarry Smith   ierr = VecGetSize(aij->lvec,&ec);CHKERRQ(ierr); /* needed for PetscLogObjectMemory below */
1675e1f6667SBarry Smith   ierr = VecDestroy(&aij->lvec);CHKERRQ(ierr);
168464493b3SBarry Smith   if (aij->colmap) {
169aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
1706bc0bbbfSBarry Smith     ierr = PetscTableDestroy(&aij->colmap);CHKERRQ(ierr);
1712066d6f7SSatish Balay #else
172606d414cSSatish Balay     ierr = PetscFree(aij->colmap);CHKERRQ(ierr);
1733bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)A,-aij->B->cmap->n*sizeof(PetscInt));CHKERRQ(ierr);
1742066d6f7SSatish Balay #endif
175464493b3SBarry Smith   }
1762493cbb0SBarry Smith 
1772493cbb0SBarry Smith   /* make sure that B is assembled so we can access its values */
1786d4a8577SBarry Smith   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
179fe2f2677SBarry Smith   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1802493cbb0SBarry Smith 
1812493cbb0SBarry Smith   /* invent new B and copy stuff over */
182854ce69bSBarry Smith   ierr = PetscMalloc1(m+1,&nz);CHKERRQ(ierr);
18348b35521SBarry Smith   for (i=0; i<m; i++) {
18448b35521SBarry Smith     nz[i] = Baij->i[i+1] - Baij->i[i];
18548b35521SBarry Smith   }
186f69a0ea3SMatthew Knepley   ierr = MatCreate(PETSC_COMM_SELF,&Bnew);CHKERRQ(ierr);
187f69a0ea3SMatthew Knepley   ierr = MatSetSizes(Bnew,m,n,m,n);CHKERRQ(ierr);
18833d57670SJed Brown   ierr = MatSetBlockSizesFromMats(Bnew,A,A);CHKERRQ(ierr);
1897adad957SLisandro Dalcin   ierr = MatSetType(Bnew,((PetscObject)B)->type_name);CHKERRQ(ierr);
190f204ca49SKris Buschelman   ierr = MatSeqAIJSetPreallocation(Bnew,0,nz);CHKERRQ(ierr);
1912205254eSKarl Rupp 
192b38c15b3SStefano Zampini   if (Baij->nonew >= 0) { /* Inherit insertion error options (if positive). */
193b38c15b3SStefano Zampini     ((Mat_SeqAIJ*)Bnew->data)->nonew = Baij->nonew;
194b38c15b3SStefano Zampini   }
195b38c15b3SStefano Zampini 
19677341eacSDmitry Karpeev   /*
19777341eacSDmitry Karpeev    Ensure that B's nonzerostate is monotonically increasing.
19877341eacSDmitry Karpeev    Or should this follow the MatSetValues() loop to preserve B's nonzerstate across a MatDisAssemble() call?
19977341eacSDmitry Karpeev    */
200f69fde56SShane Stafford   Bnew->nonzerostate = B->nonzerostate;
2012205254eSKarl Rupp 
202606d414cSSatish Balay   ierr = PetscFree(nz);CHKERRQ(ierr);
2032493cbb0SBarry Smith   for (i=0; i<m; i++) {
204bfec09a0SHong Zhang     for (j=Baij->i[i]; j<Baij->i[i+1]; j++) {
205bfec09a0SHong Zhang       col  = garray[Baij->j[ct]];
2062493cbb0SBarry Smith       v    = Baij->a[ct++];
20783271157SBarry Smith       ierr = MatSetValues(Bnew,1,&i,1,&col,&v,B->insertmode);CHKERRQ(ierr);
2082493cbb0SBarry Smith     }
2092493cbb0SBarry Smith   }
210606d414cSSatish Balay   ierr = PetscFree(aij->garray);CHKERRQ(ierr);
2113bb1ff40SBarry Smith   ierr = PetscLogObjectMemory((PetscObject)A,-ec*sizeof(PetscInt));CHKERRQ(ierr);
2126bf464f9SBarry Smith   ierr = MatDestroy(&B);CHKERRQ(ierr);
2133bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)A,(PetscObject)Bnew);CHKERRQ(ierr);
2142205254eSKarl Rupp 
2152493cbb0SBarry Smith   aij->B           = Bnew;
216227d817aSBarry Smith   A->was_assembled = PETSC_FALSE;
2173a40ed3dSBarry Smith   PetscFunctionReturn(0);
2182493cbb0SBarry Smith }
2192493cbb0SBarry Smith 
2202cd6534aSBarry Smith /*      ugly stuff added for Glenn someday we should fix this up */
2212cd6534aSBarry Smith 
2222205254eSKarl Rupp static PetscInt *auglyrmapd = 0,*auglyrmapo = 0; /* mapping from the local ordering to the "diagonal" and "off-diagonal" parts of the local matrix */
2232cd6534aSBarry Smith static Vec auglydd          = 0,auglyoo     = 0; /* work vectors used to scale the two parts of the local matrix */
2242cd6534aSBarry Smith 
2252cd6534aSBarry Smith 
226dfbe8321SBarry Smith PetscErrorCode MatMPIAIJDiagonalScaleLocalSetUp(Mat inA,Vec scale)
2272cd6534aSBarry Smith {
2282cd6534aSBarry Smith   Mat_MPIAIJ     *ina = (Mat_MPIAIJ*) inA->data; /*access private part of matrix */
229dfbe8321SBarry Smith   PetscErrorCode ierr;
230b1d57f15SBarry Smith   PetscInt       i,n,nt,cstart,cend,no,*garray = ina->garray,*lindices;
231b1d57f15SBarry Smith   PetscInt       *r_rmapd,*r_rmapo;
2322cd6534aSBarry Smith 
2332cd6534aSBarry Smith   PetscFunctionBegin;
2342cd6534aSBarry Smith   ierr = MatGetOwnershipRange(inA,&cstart,&cend);CHKERRQ(ierr);
2350298fd71SBarry Smith   ierr = MatGetSize(ina->A,NULL,&n);CHKERRQ(ierr);
2361795a4d1SJed Brown   ierr = PetscCalloc1(inA->rmap->mapping->n+1,&r_rmapd);CHKERRQ(ierr);
2372cd6534aSBarry Smith   nt   = 0;
238992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
239992144d0SBarry Smith     if (inA->rmap->mapping->indices[i] >= cstart && inA->rmap->mapping->indices[i] < cend) {
2402cd6534aSBarry Smith       nt++;
241992144d0SBarry Smith       r_rmapd[i] = inA->rmap->mapping->indices[i] + 1;
2422cd6534aSBarry Smith     }
2432cd6534aSBarry Smith   }
244e32f2f54SBarry Smith   if (nt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Hmm nt %D n %D",nt,n);
245854ce69bSBarry Smith   ierr = PetscMalloc1(n+1,&auglyrmapd);CHKERRQ(ierr);
246992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
2472cd6534aSBarry Smith     if (r_rmapd[i]) {
2482cd6534aSBarry Smith       auglyrmapd[(r_rmapd[i]-1)-cstart] = i;
2492cd6534aSBarry Smith     }
2502cd6534aSBarry Smith   }
2512cd6534aSBarry Smith   ierr = PetscFree(r_rmapd);CHKERRQ(ierr);
2522cd6534aSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,n,&auglydd);CHKERRQ(ierr);
2532cd6534aSBarry Smith 
2541795a4d1SJed Brown   ierr = PetscCalloc1(inA->cmap->N+1,&lindices);CHKERRQ(ierr);
255d0f46423SBarry Smith   for (i=0; i<ina->B->cmap->n; i++) {
2562cd6534aSBarry Smith     lindices[garray[i]] = i+1;
2572cd6534aSBarry Smith   }
258992144d0SBarry Smith   no   = inA->rmap->mapping->n - nt;
2591795a4d1SJed Brown   ierr = PetscCalloc1(inA->rmap->mapping->n+1,&r_rmapo);CHKERRQ(ierr);
2602cd6534aSBarry Smith   nt   = 0;
261992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
262992144d0SBarry Smith     if (lindices[inA->rmap->mapping->indices[i]]) {
2632cd6534aSBarry Smith       nt++;
264992144d0SBarry Smith       r_rmapo[i] = lindices[inA->rmap->mapping->indices[i]];
2652cd6534aSBarry Smith     }
2662cd6534aSBarry Smith   }
267e32f2f54SBarry Smith   if (nt > no) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Hmm nt %D no %D",nt,n);
2682cd6534aSBarry Smith   ierr = PetscFree(lindices);CHKERRQ(ierr);
269854ce69bSBarry Smith   ierr = PetscMalloc1(nt+1,&auglyrmapo);CHKERRQ(ierr);
270992144d0SBarry Smith   for (i=0; i<inA->rmap->mapping->n; i++) {
2712cd6534aSBarry Smith     if (r_rmapo[i]) {
2722cd6534aSBarry Smith       auglyrmapo[(r_rmapo[i]-1)] = i;
2732cd6534aSBarry Smith     }
2742cd6534aSBarry Smith   }
2752cd6534aSBarry Smith   ierr = PetscFree(r_rmapo);CHKERRQ(ierr);
2762cd6534aSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,nt,&auglyoo);CHKERRQ(ierr);
2772cd6534aSBarry Smith   PetscFunctionReturn(0);
2782cd6534aSBarry Smith }
2792cd6534aSBarry Smith 
280dfbe8321SBarry Smith PetscErrorCode MatMPIAIJDiagonalScaleLocal(Mat A,Vec scale)
2812cd6534aSBarry Smith {
28292b32695SKris Buschelman   /* This routine should really be abandoned as it duplicates MatDiagonalScaleLocal */
2834ac538c5SBarry Smith   PetscErrorCode ierr;
28492b32695SKris Buschelman 
28592b32695SKris Buschelman   PetscFunctionBegin;
2864ac538c5SBarry Smith   ierr = PetscTryMethod(A,"MatDiagonalScaleLocal_C",(Mat,Vec),(A,scale));CHKERRQ(ierr);
28792b32695SKris Buschelman   PetscFunctionReturn(0);
28892b32695SKris Buschelman }
28992b32695SKris Buschelman 
2907087cfbeSBarry Smith PetscErrorCode  MatDiagonalScaleLocal_MPIAIJ(Mat A,Vec scale)
29192b32695SKris Buschelman {
2922cd6534aSBarry Smith   Mat_MPIAIJ        *a = (Mat_MPIAIJ*) A->data; /*access private part of matrix */
293dfbe8321SBarry Smith   PetscErrorCode    ierr;
294b1d57f15SBarry Smith   PetscInt          n,i;
295bca11509SBarry Smith   PetscScalar       *d,*o;
296bca11509SBarry Smith   const PetscScalar *s;
2972cd6534aSBarry Smith 
2982cd6534aSBarry Smith   PetscFunctionBegin;
2992cd6534aSBarry Smith   if (!auglyrmapd) {
3002cd6534aSBarry Smith     ierr = MatMPIAIJDiagonalScaleLocalSetUp(A,scale);CHKERRQ(ierr);
3012cd6534aSBarry Smith   }
3022cd6534aSBarry Smith 
303bca11509SBarry Smith   ierr = VecGetArrayRead(scale,&s);CHKERRQ(ierr);
3042cd6534aSBarry Smith 
3052cd6534aSBarry Smith   ierr = VecGetLocalSize(auglydd,&n);CHKERRQ(ierr);
3061ebc52fbSHong Zhang   ierr = VecGetArray(auglydd,&d);CHKERRQ(ierr);
3072cd6534aSBarry Smith   for (i=0; i<n; i++) {
3082cd6534aSBarry Smith     d[i] = s[auglyrmapd[i]]; /* copy "diagonal" (true local) portion of scale into dd vector */
3092cd6534aSBarry Smith   }
3101ebc52fbSHong Zhang   ierr = VecRestoreArray(auglydd,&d);CHKERRQ(ierr);
3112cd6534aSBarry Smith   /* column scale "diagonal" portion of local matrix */
3120298fd71SBarry Smith   ierr = MatDiagonalScale(a->A,NULL,auglydd);CHKERRQ(ierr);
3132cd6534aSBarry Smith 
3142cd6534aSBarry Smith   ierr = VecGetLocalSize(auglyoo,&n);CHKERRQ(ierr);
3151ebc52fbSHong Zhang   ierr = VecGetArray(auglyoo,&o);CHKERRQ(ierr);
3162cd6534aSBarry Smith   for (i=0; i<n; i++) {
3172cd6534aSBarry Smith     o[i] = s[auglyrmapo[i]]; /* copy "off-diagonal" portion of scale into oo vector */
3182cd6534aSBarry Smith   }
319bca11509SBarry Smith   ierr = VecRestoreArrayRead(scale,&s);CHKERRQ(ierr);
3201ebc52fbSHong Zhang   ierr = VecRestoreArray(auglyoo,&o);CHKERRQ(ierr);
3212cd6534aSBarry Smith   /* column scale "off-diagonal" portion of local matrix */
3220298fd71SBarry Smith   ierr = MatDiagonalScale(a->B,NULL,auglyoo);CHKERRQ(ierr);
3232cd6534aSBarry Smith   PetscFunctionReturn(0);
3242cd6534aSBarry Smith }
325