xref: /petsc/src/mat/impls/aij/mpi/fdmpiaij.c (revision f8c2866e654d46b30197bc999c108affa4012b0e)
1a64fbb32SBarry Smith 
2c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h>
30d1c53f1SHong Zhang #include <../src/mat/impls/baij/mpi/mpibaij.h>
40d1c53f1SHong Zhang 
50d1c53f1SHong Zhang #undef __FUNCT__
60d1c53f1SHong Zhang #define __FUNCT__ "MatFDColoringApply_BAIJ_new"
70d1c53f1SHong Zhang PetscErrorCode  MatFDColoringApply_BAIJ_new(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx)
80d1c53f1SHong Zhang {
90d1c53f1SHong Zhang   PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void*))coloring->f;
100d1c53f1SHong Zhang   PetscErrorCode ierr;
110d1c53f1SHong Zhang   PetscInt       k,cstart,cend,l,row,col,nz,spidx,i,j;
120d1c53f1SHong Zhang   PetscScalar    dx=0.0,*y,*xx,*w3_array,*dy_i,*dy=coloring->dy;
130d1c53f1SHong Zhang   PetscScalar    *vscale_array;
140d1c53f1SHong Zhang   PetscReal      epsilon=coloring->error_rel,umin=coloring->umin,unorm;
150d1c53f1SHong Zhang   Vec            w1=coloring->w1,w2=coloring->w2,w3,vscale=coloring->vscale;
160d1c53f1SHong Zhang   void           *fctx=coloring->fctx;
170d1c53f1SHong Zhang   PetscBool      flg=PETSC_FALSE;
180d1c53f1SHong Zhang   PetscInt       ctype=coloring->ctype,nxloc,nrows_k;
190d1c53f1SHong Zhang   Mat_MPIBAIJ    *aij=(Mat_MPIBAIJ*)J->data;
200d1c53f1SHong Zhang   PetscScalar    *valaddr;
210d1c53f1SHong Zhang   MatEntry       *Jentry=coloring->matentry;
220d1c53f1SHong Zhang   const PetscInt ncolors=coloring->ncolors,*ncolumns=coloring->ncolumns,*nrows=coloring->nrows;
230d1c53f1SHong Zhang   PetscInt       bs=J->rmap->bs;
240d1c53f1SHong Zhang 
250d1c53f1SHong Zhang   PetscFunctionBegin;
260d1c53f1SHong Zhang   ierr = MatSetUnfactored(J);CHKERRQ(ierr);
270d1c53f1SHong Zhang   ierr = PetscOptionsGetBool(NULL,"-mat_fd_coloring_dont_rezero",&flg,NULL);CHKERRQ(ierr);
280d1c53f1SHong Zhang   if (flg) {
290d1c53f1SHong Zhang     ierr = PetscInfo(coloring,"Not calling MatZeroEntries()\n");CHKERRQ(ierr);
300d1c53f1SHong Zhang   } else {
310d1c53f1SHong Zhang     PetscBool assembled;
320d1c53f1SHong Zhang     ierr = MatAssembled(J,&assembled);CHKERRQ(ierr);
330d1c53f1SHong Zhang     if (assembled) {
340d1c53f1SHong Zhang       ierr = MatZeroEntries(J);CHKERRQ(ierr);
350d1c53f1SHong Zhang     }
360d1c53f1SHong Zhang   }
370d1c53f1SHong Zhang 
380d1c53f1SHong Zhang   /* create vscale for storing dx */
390d1c53f1SHong Zhang   if (!vscale) {
400d1c53f1SHong Zhang     if (ctype == IS_COLORING_GLOBAL && coloring->htype[0] == 'd') {
410d1c53f1SHong Zhang       ierr = VecCreateGhost(PetscObjectComm((PetscObject)J),J->cmap->n,PETSC_DETERMINE,aij->B->cmap->n,aij->garray,&vscale);CHKERRQ(ierr);
420d1c53f1SHong Zhang 
430d1c53f1SHong Zhang     } else if (ctype == IS_COLORING_GHOSTED) {
440d1c53f1SHong Zhang       ierr = VecDuplicate(x1,&vscale);CHKERRQ(ierr);
450d1c53f1SHong Zhang     }
460d1c53f1SHong Zhang     coloring->vscale = vscale;
470d1c53f1SHong Zhang   }
480d1c53f1SHong Zhang 
490d1c53f1SHong Zhang   /* (1) Set w1 = F(x1) */
500d1c53f1SHong Zhang   if (!coloring->fset) {
510d1c53f1SHong Zhang     ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
520d1c53f1SHong Zhang     ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr);
530d1c53f1SHong Zhang     ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
540d1c53f1SHong Zhang   } else {
550d1c53f1SHong Zhang     coloring->fset = PETSC_FALSE;
560d1c53f1SHong Zhang   }
570d1c53f1SHong Zhang 
580d1c53f1SHong Zhang   /* (2) Compute vscale = 1./dx - the local scale factors, including ghost points */
590d1c53f1SHong Zhang   ierr = VecGetLocalSize(x1,&nxloc);CHKERRQ(ierr);
600d1c53f1SHong Zhang   //PetscMPIInt rank;
610d1c53f1SHong Zhang   //ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRQ(ierr);
620d1c53f1SHong Zhang   //printf("[%d] nxloc %d\n",rank,nxloc);
630d1c53f1SHong Zhang   if (coloring->htype[0] == 'w') {
640d1c53f1SHong Zhang     /* vscale = dx is a constant scalar */
650d1c53f1SHong Zhang     ierr = VecNorm(x1,NORM_2,&unorm);CHKERRQ(ierr);
660d1c53f1SHong Zhang     dx = 1.0/(PetscSqrtReal(1.0 + unorm)*epsilon);
670d1c53f1SHong Zhang   } else {
680d1c53f1SHong Zhang     ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);
690d1c53f1SHong Zhang     ierr = VecGetArray(vscale,&vscale_array);CHKERRQ(ierr);
700d1c53f1SHong Zhang     for (col=0; col<nxloc; col++) {
710d1c53f1SHong Zhang       dx = xx[col];
720d1c53f1SHong Zhang       if (PetscAbsScalar(dx) < umin) {
730d1c53f1SHong Zhang         if (PetscRealPart(dx) >= 0.0)      dx = umin;
740d1c53f1SHong Zhang         else if (PetscRealPart(dx) < 0.0 ) dx = -umin;
750d1c53f1SHong Zhang       }
760d1c53f1SHong Zhang       dx               *= epsilon;
770d1c53f1SHong Zhang       vscale_array[col] = 1.0/dx;
780d1c53f1SHong Zhang     }
790d1c53f1SHong Zhang     ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr);
800d1c53f1SHong Zhang     ierr = VecRestoreArray(vscale,&vscale_array);CHKERRQ(ierr);
810d1c53f1SHong Zhang   }
820d1c53f1SHong Zhang   if (ctype == IS_COLORING_GLOBAL && coloring->htype[0] != 'w') {
830d1c53f1SHong Zhang     ierr = VecGhostUpdateBegin(vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
840d1c53f1SHong Zhang     ierr = VecGhostUpdateEnd(vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
850d1c53f1SHong Zhang   }
860d1c53f1SHong Zhang 
870d1c53f1SHong Zhang   /* (3) Loop over each color */
880d1c53f1SHong Zhang   if (!coloring->w3) {
890d1c53f1SHong Zhang     ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr);
900d1c53f1SHong Zhang     ierr = PetscLogObjectParent((PetscObject)coloring,(PetscObject)coloring->w3);CHKERRQ(ierr);
910d1c53f1SHong Zhang   }
920d1c53f1SHong Zhang   w3 = coloring->w3;
930d1c53f1SHong Zhang 
940d1c53f1SHong Zhang   ierr = VecGetOwnershipRange(x1,&cstart,&cend);CHKERRQ(ierr); /* used by ghosted vscale */
950d1c53f1SHong Zhang   if (vscale) {
960d1c53f1SHong Zhang     ierr = VecGetArray(vscale,&vscale_array);CHKERRQ(ierr);
970d1c53f1SHong Zhang   }
980d1c53f1SHong Zhang   nz   = 0;
990d1c53f1SHong Zhang   for (k=0; k<ncolors; k++) {
1000d1c53f1SHong Zhang     coloring->currentcolor = k;
1010d1c53f1SHong Zhang 
1020d1c53f1SHong Zhang     /*
1030d1c53f1SHong Zhang       (3-1) Loop over each column associated with color
1040d1c53f1SHong Zhang       adding the perturbation to the vector w3 = x1 + dx.
1050d1c53f1SHong Zhang     */
1060d1c53f1SHong Zhang     ierr = VecCopy(x1,w3);CHKERRQ(ierr);
1070d1c53f1SHong Zhang     dy_i = dy;
1080d1c53f1SHong Zhang     for (i=0; i<bs; i++) {     /* Loop over a block of columns */
1090d1c53f1SHong Zhang       //------------------------------------------------
1100d1c53f1SHong Zhang       ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);
1110d1c53f1SHong Zhang       if (ctype == IS_COLORING_GLOBAL) w3_array -= cstart; /* shift pointer so global index can be used */
1120d1c53f1SHong Zhang       if (coloring->htype[0] == 'w') {
1130d1c53f1SHong Zhang         for (l=0; l<ncolumns[k]; l++) {
1140d1c53f1SHong Zhang           col            = i + bs*coloring->columns[k][l];  /* local column (in global index!) of the matrix we are probing for */
1150d1c53f1SHong Zhang           w3_array[col] += 1.0/dx;
1160d1c53f1SHong Zhang 
1170d1c53f1SHong Zhang           if (i) {
1180d1c53f1SHong Zhang             w3_array[col-1] -= 1.0/dx; /* resume original w3[col-1] */
1190d1c53f1SHong Zhang           }
1200d1c53f1SHong Zhang 
1210d1c53f1SHong Zhang         }
1220d1c53f1SHong Zhang       } else { /* htype == 'ds' */
1230d1c53f1SHong Zhang         vscale_array -= cstart; /* shift pointer so global index can be used */
1240d1c53f1SHong Zhang         for (l=0; l<ncolumns[k]; l++) {
125*f8c2866eSHong Zhang           col = i + bs*coloring->columns[k][l]; /* local column (in global index!) of the matrix we are probing for */
1260d1c53f1SHong Zhang           w3_array[col] += 1.0/vscale_array[col];
1270d1c53f1SHong Zhang 
1280d1c53f1SHong Zhang           if (i) {
1290d1c53f1SHong Zhang             w3_array[col-1] -=  1.0/vscale_array[col-1]; /* resume original w3[col-1] */
1300d1c53f1SHong Zhang           }
1310d1c53f1SHong Zhang 
1320d1c53f1SHong Zhang         }
1330d1c53f1SHong Zhang         vscale_array += cstart;
1340d1c53f1SHong Zhang       }
1350d1c53f1SHong Zhang       if (ctype == IS_COLORING_GLOBAL) w3_array += cstart;
1360d1c53f1SHong Zhang       ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr);
1370d1c53f1SHong Zhang 
1380d1c53f1SHong Zhang       /*
1390d1c53f1SHong Zhang        (3-2) Evaluate function at w3 = x1 + dx (here dx is a vector of perturbations)
1400d1c53f1SHong Zhang                            w2 = F(x1 + dx) - F(x1)
1410d1c53f1SHong Zhang        */
1420d1c53f1SHong Zhang       ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
1430d1c53f1SHong Zhang       ierr = VecPlaceArray(w2,dy_i);CHKERRQ(ierr); /* place w2 to the array dy_i */
1440d1c53f1SHong Zhang       ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr);
1450d1c53f1SHong Zhang       ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
1460d1c53f1SHong Zhang       ierr = VecAXPY(w2,-1.0,w1);CHKERRQ(ierr);
1470d1c53f1SHong Zhang       //---------------------------------------------
1480d1c53f1SHong Zhang       ierr = VecResetArray(w2);CHKERRQ(ierr);
1490d1c53f1SHong Zhang       dy_i += nxloc; /* points to dy+i*nxloc */
1500d1c53f1SHong Zhang     }
1510d1c53f1SHong Zhang 
1520d1c53f1SHong Zhang     /*
1530d1c53f1SHong Zhang      (3-3) Loop over rows of vector, putting results into Jacobian matrix
1540d1c53f1SHong Zhang     */
1550d1c53f1SHong Zhang     nrows_k = nrows[k];
1560d1c53f1SHong Zhang     ierr = VecGetArray(w2,&y);CHKERRQ(ierr);
1570d1c53f1SHong Zhang     if (coloring->htype[0] == 'w') {
1580d1c53f1SHong Zhang       for (l=0; l<nrows_k; l++) {
1590d1c53f1SHong Zhang         row     = bs*Jentry[nz].row;   /* local row index */
1600d1c53f1SHong Zhang         valaddr = Jentry[nz].valaddr;
1610d1c53f1SHong Zhang         nz++;
1620d1c53f1SHong Zhang         spidx = 0;
1630d1c53f1SHong Zhang         dy_i  = dy;
1640d1c53f1SHong Zhang         for (i=0; i<bs; i++) {   /* column of the block */
1650d1c53f1SHong Zhang           for (j=0; j<bs; j++) { /* row of the block */
1660d1c53f1SHong Zhang             valaddr[spidx++] = dy_i[row+j]*dx;
1670d1c53f1SHong Zhang           }
168*f8c2866eSHong Zhang           dy_i += nxloc; /* points to dy+i*nxloc */
1690d1c53f1SHong Zhang         }
1700d1c53f1SHong Zhang       }
1710d1c53f1SHong Zhang     } else { /* htype == 'ds' */
1720d1c53f1SHong Zhang       for (l=0; l<nrows_k; l++) {
1730d1c53f1SHong Zhang         row     = bs*Jentry[nz].row;   /* local row index */
1740d1c53f1SHong Zhang         col     = bs*Jentry[nz].col;   /* local column index */
175*f8c2866eSHong Zhang         valaddr = Jentry[nz].valaddr;
1760d1c53f1SHong Zhang         nz++;
177*f8c2866eSHong Zhang         spidx = 0;
178*f8c2866eSHong Zhang         dy_i  = dy;
179*f8c2866eSHong Zhang         for (i=0; i<bs; i++) {   /* column of the block */
180*f8c2866eSHong Zhang           for (j=0; j<bs; j++) { /* row of the block */
181*f8c2866eSHong Zhang             valaddr[spidx++] = dy_i[row+j]*vscale_array[col+i];
182*f8c2866eSHong Zhang           }
183*f8c2866eSHong Zhang           dy_i += nxloc; /* points to dy+i*nxloc */
184*f8c2866eSHong Zhang         }
1850d1c53f1SHong Zhang       }
1860d1c53f1SHong Zhang     }
1870d1c53f1SHong Zhang     ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr);
1880d1c53f1SHong Zhang   }
1890d1c53f1SHong Zhang   ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1900d1c53f1SHong Zhang   ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1910d1c53f1SHong Zhang   if (vscale) {
1920d1c53f1SHong Zhang     ierr = VecRestoreArray(vscale,&vscale_array);CHKERRQ(ierr);
1930d1c53f1SHong Zhang   }
1940d1c53f1SHong Zhang 
1950d1c53f1SHong Zhang   coloring->currentcolor = -1;
1960d1c53f1SHong Zhang   PetscFunctionReturn(0);
1970d1c53f1SHong Zhang }
198a64fbb32SBarry Smith 
199ab9863d7SBarry Smith extern PetscErrorCode MatCreateColmap_MPIAIJ_Private(Mat);
2004a2ae208SSatish Balay #undef __FUNCT__
201c53567a0SHong Zhang #define __FUNCT__ "MatFDColoringApply_AIJ_new"
202c53567a0SHong Zhang PetscErrorCode  MatFDColoringApply_AIJ_new(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx)
203fcd7ac73SHong Zhang {
204fcd7ac73SHong Zhang   PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void*))coloring->f;
205fcd7ac73SHong Zhang   PetscErrorCode ierr;
206a2f2d239SHong Zhang   PetscInt       k,cstart,cend,l,row,col,nz;
2079e917edbSHong Zhang   PetscScalar    dx=0.0,*y,*xx,*w3_array;
208fcd7ac73SHong Zhang   PetscScalar    *vscale_array;
209fcd7ac73SHong Zhang   PetscReal      epsilon=coloring->error_rel,umin=coloring->umin,unorm;
2108bc97078SHong Zhang   Vec            w1=coloring->w1,w2=coloring->w2,w3,vscale=coloring->vscale;
211fcd7ac73SHong Zhang   void           *fctx=coloring->fctx;
212fcd7ac73SHong Zhang   PetscBool      flg=PETSC_FALSE;
213c53567a0SHong Zhang   PetscInt       ctype=coloring->ctype,nxloc,nrows_k;
214f5aae955SHong Zhang   Mat_MPIAIJ     *aij=(Mat_MPIAIJ*)J->data;
215573f477fSHong Zhang   MatEntry       *Jentry=coloring->matentry;
2168bc97078SHong Zhang   const PetscInt ncolors=coloring->ncolors,*ncolumns=coloring->ncolumns,*nrows=coloring->nrows;
217fcd7ac73SHong Zhang 
218fcd7ac73SHong Zhang   PetscFunctionBegin;
219fcd7ac73SHong Zhang   ierr = MatSetUnfactored(J);CHKERRQ(ierr);
220fcd7ac73SHong Zhang   ierr = PetscOptionsGetBool(NULL,"-mat_fd_coloring_dont_rezero",&flg,NULL);CHKERRQ(ierr);
221fcd7ac73SHong Zhang   if (flg) {
222fcd7ac73SHong Zhang     ierr = PetscInfo(coloring,"Not calling MatZeroEntries()\n");CHKERRQ(ierr);
223fcd7ac73SHong Zhang   } else {
224fcd7ac73SHong Zhang     PetscBool assembled;
225fcd7ac73SHong Zhang     ierr = MatAssembled(J,&assembled);CHKERRQ(ierr);
226fcd7ac73SHong Zhang     if (assembled) {
227fcd7ac73SHong Zhang       ierr = MatZeroEntries(J);CHKERRQ(ierr);
228fcd7ac73SHong Zhang     }
229fcd7ac73SHong Zhang   }
230fcd7ac73SHong Zhang 
2319e917edbSHong Zhang   /* create vscale for storing dx */
2329e917edbSHong Zhang   if (!vscale) {
2339e917edbSHong Zhang     if (ctype == IS_COLORING_GLOBAL && coloring->htype[0] == 'd') {
2349e917edbSHong Zhang       ierr = VecCreateGhost(PetscObjectComm((PetscObject)J),J->cmap->n,PETSC_DETERMINE,aij->B->cmap->n,aij->garray,&vscale);CHKERRQ(ierr);
2359e917edbSHong Zhang     } else if (ctype == IS_COLORING_GHOSTED) {
2368bc97078SHong Zhang       ierr = VecDuplicate(x1,&vscale);CHKERRQ(ierr);
2379e917edbSHong Zhang     }
2388bc97078SHong Zhang     coloring->vscale = vscale;
239fcd7ac73SHong Zhang   }
240fcd7ac73SHong Zhang 
2418bc97078SHong Zhang   /* (1) Set w1 = F(x1) */
242fcd7ac73SHong Zhang   if (!coloring->fset) {
243fcd7ac73SHong Zhang     ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
244f6af9589SHong Zhang     ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr);
245fcd7ac73SHong Zhang     ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
246fcd7ac73SHong Zhang   } else {
247fcd7ac73SHong Zhang     coloring->fset = PETSC_FALSE;
248fcd7ac73SHong Zhang   }
249fcd7ac73SHong Zhang 
2508bc97078SHong Zhang   /* (2) Compute vscale = 1./dx - the local scale factors, including ghost points */
251f6af9589SHong Zhang   if (coloring->htype[0] == 'w') {
2529e917edbSHong Zhang     /* vscale = dx is a constant scalar */
253f6af9589SHong Zhang     ierr = VecNorm(x1,NORM_2,&unorm);CHKERRQ(ierr);
254c53567a0SHong Zhang     dx = 1.0/(PetscSqrtReal(1.0 + unorm)*epsilon);
25570e7395fSHong Zhang   } else {
25674d3cef9SHong Zhang     ierr = VecGetLocalSize(x1,&nxloc);CHKERRQ(ierr);
257f6af9589SHong Zhang     ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);
2588bc97078SHong Zhang     ierr = VecGetArray(vscale,&vscale_array);CHKERRQ(ierr);
25974d3cef9SHong Zhang     for (col=0; col<nxloc; col++) {
260fcd7ac73SHong Zhang       dx = xx[col];
26174d3cef9SHong Zhang       if (PetscAbsScalar(dx) < umin) {
26274d3cef9SHong Zhang         if (PetscRealPart(dx) >= 0.0)      dx = umin;
26374d3cef9SHong Zhang         else if (PetscRealPart(dx) < 0.0 ) dx = -umin;
26474d3cef9SHong Zhang       }
265fcd7ac73SHong Zhang       dx               *= epsilon;
26674d3cef9SHong Zhang       vscale_array[col] = 1.0/dx;
267f6af9589SHong Zhang     }
26874d3cef9SHong Zhang     ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr);
2698bc97078SHong Zhang     ierr = VecRestoreArray(vscale,&vscale_array);CHKERRQ(ierr);
27070e7395fSHong Zhang   }
2719e917edbSHong Zhang   if (ctype == IS_COLORING_GLOBAL && coloring->htype[0] != 'w') {
2728bc97078SHong Zhang     ierr = VecGhostUpdateBegin(vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2738bc97078SHong Zhang     ierr = VecGhostUpdateEnd(vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
274fcd7ac73SHong Zhang   }
275fcd7ac73SHong Zhang 
2768bc97078SHong Zhang   /* (3) Loop over each color */
2778bc97078SHong Zhang   if (!coloring->w3) {
2788bc97078SHong Zhang     ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr);
2798bc97078SHong Zhang     ierr = PetscLogObjectParent((PetscObject)coloring,(PetscObject)coloring->w3);CHKERRQ(ierr);
2808bc97078SHong Zhang   }
2818bc97078SHong Zhang   w3 = coloring->w3;
282fcd7ac73SHong Zhang 
2838bc97078SHong Zhang   ierr = VecGetOwnershipRange(x1,&cstart,&cend);CHKERRQ(ierr); /* used by ghosted vscale */
2849e917edbSHong Zhang   if (vscale) {
2858bc97078SHong Zhang     ierr = VecGetArray(vscale,&vscale_array);CHKERRQ(ierr);
2869e917edbSHong Zhang   }
2878bc97078SHong Zhang   nz   = 0;
2888bc97078SHong Zhang   for (k=0; k<ncolors; k++) {
2898bc97078SHong Zhang     coloring->currentcolor = k;
2909e917edbSHong Zhang 
291fcd7ac73SHong Zhang     /*
2928bc97078SHong Zhang       (3-1) Loop over each column associated with color
293f6af9589SHong Zhang       adding the perturbation to the vector w3 = x1 + dx.
294fcd7ac73SHong Zhang     */
295f6af9589SHong Zhang     ierr = VecCopy(x1,w3);CHKERRQ(ierr);
296f6af9589SHong Zhang     ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);
297a2f2d239SHong Zhang     if (ctype == IS_COLORING_GLOBAL) w3_array -= cstart; /* shift pointer so global index can be used */
298b039d6c4SHong Zhang     if (coloring->htype[0] == 'w') {
2998bc97078SHong Zhang       for (l=0; l<ncolumns[k]; l++) {
300f6af9589SHong Zhang         col = coloring->columns[k][l]; /* local column (in global index!) of the matrix we are probing for */
3019e917edbSHong Zhang         w3_array[col] += 1.0/dx;
3029e917edbSHong Zhang       }
303b039d6c4SHong Zhang     } else { /* htype == 'ds' */
304a2f2d239SHong Zhang       vscale_array -= cstart; /* shift pointer so global index can be used */
305b039d6c4SHong Zhang       for (l=0; l<ncolumns[k]; l++) {
306b039d6c4SHong Zhang         col = coloring->columns[k][l]; /* local column (in global index!) of the matrix we are probing for */
307a2f2d239SHong Zhang         w3_array[col] += 1.0/vscale_array[col];
30870e7395fSHong Zhang       }
309a2f2d239SHong Zhang       vscale_array += cstart;
310fcd7ac73SHong Zhang     }
311a2f2d239SHong Zhang     if (ctype == IS_COLORING_GLOBAL) w3_array += cstart;
312fcd7ac73SHong Zhang     ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr);
3139e917edbSHong Zhang 
314fcd7ac73SHong Zhang     /*
3158bc97078SHong Zhang       (3-2) Evaluate function at w3 = x1 + dx (here dx is a vector of perturbations)
316fcd7ac73SHong Zhang                            w2 = F(x1 + dx) - F(x1)
317fcd7ac73SHong Zhang     */
318fcd7ac73SHong Zhang     ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
319fcd7ac73SHong Zhang     ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr);
320fcd7ac73SHong Zhang     ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr);
321fcd7ac73SHong Zhang     ierr = VecAXPY(w2,-1.0,w1);CHKERRQ(ierr);
3229e917edbSHong Zhang 
3238bc97078SHong Zhang     /*
3248bc97078SHong Zhang      (3-3) Loop over rows of vector, putting results into Jacobian matrix
3258bc97078SHong Zhang     */
326c53567a0SHong Zhang     nrows_k = nrows[k];
327fcd7ac73SHong Zhang     ierr = VecGetArray(w2,&y);CHKERRQ(ierr);
328b039d6c4SHong Zhang     if (coloring->htype[0] == 'w') {
329c53567a0SHong Zhang       for (l=0; l<nrows_k; l++) {
330573f477fSHong Zhang         row                     = Jentry[nz].row;   /* local row index */
331b039d6c4SHong Zhang         *(Jentry[nz++].valaddr) = y[row]*dx;
3329e917edbSHong Zhang       }
333b039d6c4SHong Zhang     } else { /* htype == 'ds' */
334c53567a0SHong Zhang       for (l=0; l<nrows_k; l++) {
335b039d6c4SHong Zhang         row                   = Jentry[nz].row;   /* local row index */
336b039d6c4SHong Zhang         *(Jentry[nz].valaddr) = y[row]*vscale_array[Jentry[nz].col];
337573f477fSHong Zhang         nz++;
338fcd7ac73SHong Zhang       }
339b039d6c4SHong Zhang     }
340fcd7ac73SHong Zhang     ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr);
3418bc97078SHong Zhang   }
342f5aae955SHong Zhang   ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
343f5aae955SHong Zhang   ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3449e917edbSHong Zhang   if (vscale) {
3458bc97078SHong Zhang     ierr = VecRestoreArray(vscale,&vscale_array);CHKERRQ(ierr);
3469e917edbSHong Zhang   }
347fcd7ac73SHong Zhang 
348fcd7ac73SHong Zhang   coloring->currentcolor = -1;
349fcd7ac73SHong Zhang   PetscFunctionReturn(0);
350fcd7ac73SHong Zhang }
351fcd7ac73SHong Zhang 
352fcd7ac73SHong Zhang #undef __FUNCT__
353fcd7ac73SHong Zhang #define __FUNCT__ "MatFDColoringCreate_MPIAIJ_new"
354fcd7ac73SHong Zhang PetscErrorCode MatFDColoringCreate_MPIAIJ_new(Mat mat,ISColoring iscoloring,MatFDColoring c)
355fcd7ac73SHong Zhang {
3560d1c53f1SHong Zhang   //Mat_MPIAIJ             *aij=(Mat_MPIAIJ*)mat->data;
357fcd7ac73SHong Zhang   PetscErrorCode         ierr;
358fcd7ac73SHong Zhang   PetscMPIInt            size,*ncolsonproc,*disp,nn;
3594b2e90caSHong Zhang   PetscInt               i,n,nrows,nrows_i,j,k,m,ncols,col;
36072c15787SHong Zhang   const PetscInt         *is,*A_ci,*A_cj,*B_ci,*B_cj,*row = NULL,*ltog=NULL;
361fcd7ac73SHong Zhang   PetscInt               nis=iscoloring->n,nctot,*cols;
362d3825b63SHong Zhang   PetscInt               *rowhit,cstart,cend,colb;
363fcd7ac73SHong Zhang   IS                     *isa;
364fcd7ac73SHong Zhang   ISLocalToGlobalMapping map=mat->cmap->mapping;
365fcd7ac73SHong Zhang   PetscInt               ctype=c->ctype;
3660d1c53f1SHong Zhang   Mat                    A,B;
3670d1c53f1SHong Zhang   //Mat                    A=aij->A,B=aij->B;
3680d1c53f1SHong Zhang   //Mat_SeqAIJ             *spA=(Mat_SeqAIJ*)A->data,*spB=(Mat_SeqAIJ*)B->data;
3690d1c53f1SHong Zhang   //PetscScalar            *A_val=spA->a,*B_val=spB->a;
3700d1c53f1SHong Zhang   PetscScalar            *A_val,*B_val;
371fcd7ac73SHong Zhang   PetscInt               spidx;
3720d1c53f1SHong Zhang   PetscInt               *spidxA,*spidxB,nz,bs,bs2;
373d3825b63SHong Zhang   PetscScalar            **valaddrhit;
374573f477fSHong Zhang   MatEntry               *Jentry;
3750d1c53f1SHong Zhang   PetscBool              isBAIJ;
3760d1c53f1SHong Zhang #if defined(PETSC_USE_CTABLE)
3770d1c53f1SHong Zhang   PetscTable             colmap=NULL;
3780d1c53f1SHong Zhang #else
3790d1c53f1SHong Zhang   PetscInt               *colmap=NULL;     /* local col number of off-diag col */
3800d1c53f1SHong Zhang #endif
381fcd7ac73SHong Zhang 
382fcd7ac73SHong Zhang   PetscFunctionBegin;
38372c15787SHong Zhang   if (ctype == IS_COLORING_GHOSTED) {
38472c15787SHong Zhang     if (!map) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"When using ghosted differencing matrix must have local to global mapping provided with MatSetLocalToGlobalMapping");
38572c15787SHong Zhang     ierr = ISLocalToGlobalMappingGetIndices(map,&ltog);CHKERRQ(ierr);
38672c15787SHong Zhang   }
387fcd7ac73SHong Zhang 
3880d1c53f1SHong Zhang   ierr = MatGetBlockSize(mat,&bs);CHKERRQ(ierr);
3890d1c53f1SHong Zhang   ierr = PetscObjectTypeCompare((PetscObject)mat,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);
3900d1c53f1SHong Zhang   if (!isBAIJ) {
3910d1c53f1SHong Zhang     bs = 1; /* only bs=1 is supported for non MPIBAIJ matrix */
3920d1c53f1SHong Zhang     Mat_MPIAIJ             *aij=(Mat_MPIAIJ*)mat->data;
3930d1c53f1SHong Zhang     A=aij->A; B=aij->B;
3940d1c53f1SHong Zhang     Mat_SeqAIJ             *spA=(Mat_SeqAIJ*)A->data,*spB=(Mat_SeqAIJ*)B->data;
3950d1c53f1SHong Zhang     A_val=spA->a; B_val=spB->a;
3960d1c53f1SHong Zhang     nz         = spA->nz + spB->nz; /* total nonzero entries of mat */
3970d1c53f1SHong Zhang     if (!aij->colmap) {
3980d1c53f1SHong Zhang       ierr = MatCreateColmap_MPIAIJ_Private(mat);CHKERRQ(ierr);
3990d1c53f1SHong Zhang       colmap = aij->colmap;
4000d1c53f1SHong Zhang     }
4010d1c53f1SHong Zhang     ierr = MatGetColumnIJ_SeqAIJ_Color(A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&spidxA,NULL);CHKERRQ(ierr);
4020d1c53f1SHong Zhang     ierr = MatGetColumnIJ_SeqAIJ_Color(B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&spidxB,NULL);CHKERRQ(ierr);
4030d1c53f1SHong Zhang   } else {
4040d1c53f1SHong Zhang     Mat_MPIBAIJ             *aij=(Mat_MPIBAIJ*)mat->data;
4050d1c53f1SHong Zhang     A=aij->A; B=aij->B;
4060d1c53f1SHong Zhang     Mat_SeqBAIJ             *spA=(Mat_SeqBAIJ*)A->data,*spB=(Mat_SeqBAIJ*)B->data;
4070d1c53f1SHong Zhang     A_val=spA->a; B_val=spB->a;
4080d1c53f1SHong Zhang     nz         = spA->nz + spB->nz; /* total nonzero entries of mat */
4090d1c53f1SHong Zhang     if (!aij->colmap) {
4100d1c53f1SHong Zhang       ierr = MatCreateColmap_MPIBAIJ_Private(mat);CHKERRQ(ierr);
4110d1c53f1SHong Zhang       colmap = aij->colmap;
4120d1c53f1SHong Zhang     }
4130d1c53f1SHong Zhang     ierr = MatGetColumnIJ_SeqBAIJ_Color(A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&spidxA,NULL);CHKERRQ(ierr);
4140d1c53f1SHong Zhang     ierr = MatGetColumnIJ_SeqBAIJ_Color(B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&spidxB,NULL);CHKERRQ(ierr);
4150d1c53f1SHong Zhang   }
4160d1c53f1SHong Zhang 
4170d1c53f1SHong Zhang   m         = mat->rmap->n/bs;
4180d1c53f1SHong Zhang   cstart    = mat->cmap->rstart/bs;
4190d1c53f1SHong Zhang   cend      = mat->cmap->rend/bs;
4200d1c53f1SHong Zhang   c->M      = mat->rmap->N/bs;         /* set the global rows and columns and local rows */
4210d1c53f1SHong Zhang   c->N      = mat->cmap->N/bs;
422d3825b63SHong Zhang   c->m      = m;
4230d1c53f1SHong Zhang   c->rstart = mat->rmap->rstart/bs;
424fcd7ac73SHong Zhang 
425fcd7ac73SHong Zhang   c->ncolors = nis;
426fcd7ac73SHong Zhang   ierr       = PetscMalloc(nis*sizeof(PetscInt),&c->ncolumns);CHKERRQ(ierr);
427fcd7ac73SHong Zhang   ierr       = PetscMalloc(nis*sizeof(PetscInt*),&c->columns);CHKERRQ(ierr);
428fcd7ac73SHong Zhang   ierr       = PetscMalloc(nis*sizeof(PetscInt),&c->nrows);CHKERRQ(ierr);
4298bc97078SHong Zhang   ierr       = PetscLogObjectMemory((PetscObject)c,3*nis*sizeof(PetscInt));CHKERRQ(ierr);
430fcd7ac73SHong Zhang 
4310d1c53f1SHong Zhang   //nz         = spA->nz + spB->nz; /* total nonzero entries of mat */
432573f477fSHong Zhang   ierr       = PetscMalloc(nz*sizeof(MatEntry),&Jentry);CHKERRQ(ierr);
4338bc97078SHong Zhang   ierr       = PetscLogObjectMemory((PetscObject)c,nz*sizeof(MatEntry));CHKERRQ(ierr);
4348bc97078SHong Zhang   c->matentry = Jentry;
435a774a6f1SHong Zhang 
436d3825b63SHong Zhang   /* Allow access to data structures of local part of matrix
437d3825b63SHong Zhang    - creates aij->colmap which maps global column number to local number in part B */
4380d1c53f1SHong Zhang   //if (!aij->colmap) {
4390d1c53f1SHong Zhang   //  ierr = MatCreateColmap_MPIAIJ_Private(mat);CHKERRQ(ierr);
4400d1c53f1SHong Zhang   //}
4410d1c53f1SHong Zhang   //ierr = MatGetColumnIJ_SeqAIJ_Color(aij->A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&spidxA,NULL);CHKERRQ(ierr);
4420d1c53f1SHong Zhang   //ierr = MatGetColumnIJ_SeqAIJ_Color(aij->B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&spidxB,NULL);CHKERRQ(ierr);
443fcd7ac73SHong Zhang 
444d3825b63SHong Zhang   ierr = PetscMalloc2(m+1,PetscInt,&rowhit,m+1,PetscScalar*,&valaddrhit);CHKERRQ(ierr);
445fcd7ac73SHong Zhang   nz = 0;
44672c15787SHong Zhang   ierr = ISColoringGetIS(iscoloring,PETSC_IGNORE,&isa);CHKERRQ(ierr);
447d3825b63SHong Zhang   for (i=0; i<nis; i++) { /* for each local color */
448fcd7ac73SHong Zhang     ierr = ISGetLocalSize(isa[i],&n);CHKERRQ(ierr);
449fcd7ac73SHong Zhang     ierr = ISGetIndices(isa[i],&is);CHKERRQ(ierr);
450fcd7ac73SHong Zhang 
451fcd7ac73SHong Zhang     c->ncolumns[i] = n; /* local number of columns of this color on this process */
452fcd7ac73SHong Zhang     if (n) {
453fcd7ac73SHong Zhang       ierr = PetscMalloc(n*sizeof(PetscInt),&c->columns[i]);CHKERRQ(ierr);
454fcd7ac73SHong Zhang       ierr = PetscLogObjectMemory((PetscObject)c,n*sizeof(PetscInt));CHKERRQ(ierr);
455fcd7ac73SHong Zhang       ierr = PetscMemcpy(c->columns[i],is,n*sizeof(PetscInt));CHKERRQ(ierr);
456a2f2d239SHong Zhang       /* convert global column indices to local ones! */
457a2f2d239SHong Zhang 
458fcd7ac73SHong Zhang     } else {
459fcd7ac73SHong Zhang       c->columns[i] = 0;
460fcd7ac73SHong Zhang     }
461fcd7ac73SHong Zhang 
462fcd7ac73SHong Zhang     if (ctype == IS_COLORING_GLOBAL) {
463d3825b63SHong Zhang       /* Determine nctot, the total (parallel) number of columns of this color */
464fcd7ac73SHong Zhang       ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&size);CHKERRQ(ierr);
465fcd7ac73SHong Zhang       ierr = PetscMalloc2(size,PetscMPIInt,&ncolsonproc,size,PetscMPIInt,&disp);CHKERRQ(ierr);
466fcd7ac73SHong Zhang 
467d3825b63SHong Zhang       /* ncolsonproc[j]: local ncolumns on proc[j] of this color */
468fcd7ac73SHong Zhang       ierr  = PetscMPIIntCast(n,&nn);CHKERRQ(ierr);
469fcd7ac73SHong Zhang       ierr  = MPI_Allgather(&nn,1,MPI_INT,ncolsonproc,1,MPI_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
470fcd7ac73SHong Zhang       nctot = 0; for (j=0; j<size; j++) nctot += ncolsonproc[j];
471fcd7ac73SHong Zhang       if (!nctot) {
472fcd7ac73SHong Zhang         ierr = PetscInfo(mat,"Coloring of matrix has some unneeded colors with no corresponding rows\n");CHKERRQ(ierr);
473fcd7ac73SHong Zhang       }
474fcd7ac73SHong Zhang 
475fcd7ac73SHong Zhang       disp[0] = 0;
476fcd7ac73SHong Zhang       for (j=1; j<size; j++) {
477fcd7ac73SHong Zhang         disp[j] = disp[j-1] + ncolsonproc[j-1];
478fcd7ac73SHong Zhang       }
479fcd7ac73SHong Zhang 
480d3825b63SHong Zhang       /* Get cols, the complete list of columns for this color on each process */
481fcd7ac73SHong Zhang       ierr = PetscMalloc((nctot+1)*sizeof(PetscInt),&cols);CHKERRQ(ierr);
482fcd7ac73SHong Zhang       ierr = MPI_Allgatherv((void*)is,n,MPIU_INT,cols,ncolsonproc,disp,MPIU_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
483fcd7ac73SHong Zhang       ierr = PetscFree2(ncolsonproc,disp);CHKERRQ(ierr);
484fcd7ac73SHong Zhang     } else if (ctype == IS_COLORING_GHOSTED) {
485fcd7ac73SHong Zhang       /* Determine local number of columns of this color on this process, including ghost points */
486fcd7ac73SHong Zhang       nctot = n;
487fcd7ac73SHong Zhang       ierr  = PetscMalloc((nctot+1)*sizeof(PetscInt),&cols);CHKERRQ(ierr);
488fcd7ac73SHong Zhang       ierr  = PetscMemcpy(cols,is,n*sizeof(PetscInt));CHKERRQ(ierr);
489fcd7ac73SHong Zhang     } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not provided for this MatFDColoring type");
490fcd7ac73SHong Zhang 
4911b97d346SHong Zhang     /* Mark all rows affect by these columns */
492d3825b63SHong Zhang     ierr = PetscMemzero(rowhit,m*sizeof(PetscInt));CHKERRQ(ierr);
4930d1c53f1SHong Zhang     bs2     = bs*bs;
4944b2e90caSHong Zhang     nrows_i = 0;
4951b97d346SHong Zhang     for (j=0; j<nctot; j++) { /* loop over columns*/
496fcd7ac73SHong Zhang       if (ctype == IS_COLORING_GHOSTED) {
497fcd7ac73SHong Zhang         col = ltog[cols[j]];
498fcd7ac73SHong Zhang       } else {
499fcd7ac73SHong Zhang         col = cols[j];
500fcd7ac73SHong Zhang       }
501fcd7ac73SHong Zhang       if (col >= cstart && col < cend) { /* column is in diagonal block of matrix A */
502d3825b63SHong Zhang         row      = A_cj + A_ci[col-cstart];
503d3825b63SHong Zhang         nrows    = A_ci[col-cstart+1] - A_ci[col-cstart];
5044b2e90caSHong Zhang         nrows_i += nrows;
505fcd7ac73SHong Zhang         /* loop over columns of A marking them in rowhit */
506d3825b63SHong Zhang         for (k=0; k<nrows; k++) {
507d3825b63SHong Zhang           /* set valaddrhit for part A */
508fcd7ac73SHong Zhang           spidx            = spidxA[A_ci[col-cstart] + k];
5090d1c53f1SHong Zhang           valaddrhit[*row] = &A_val[bs2*spidx];
510a774a6f1SHong Zhang           rowhit[*row++]   = col - cstart + 1; /* local column index */
511fcd7ac73SHong Zhang         }
512fcd7ac73SHong Zhang       } else { /* column is in off-diagonal block of matrix B */
513fcd7ac73SHong Zhang #if defined(PETSC_USE_CTABLE)
5140d1c53f1SHong Zhang         //ierr = PetscTableFind(aij->colmap,col+1,&colb);CHKERRQ(ierr);
5150d1c53f1SHong Zhang         ierr = PetscTableFind(colmap,col+1,&colb);CHKERRQ(ierr);
516fcd7ac73SHong Zhang         colb--;
517fcd7ac73SHong Zhang #else
5180d1c53f1SHong Zhang         //colb = aij->colmap[col] - 1; /* local column index */
5190d1c53f1SHong Zhang         colb = colmap[col] - 1; /* local column index */
520fcd7ac73SHong Zhang #endif
521fcd7ac73SHong Zhang         if (colb == -1) {
522d3825b63SHong Zhang           nrows = 0;
523fcd7ac73SHong Zhang         } else {
5240d1c53f1SHong Zhang           colb  = colb/bs;
525d3825b63SHong Zhang           row   = B_cj + B_ci[colb];
526d3825b63SHong Zhang           nrows = B_ci[colb+1] - B_ci[colb];
527fcd7ac73SHong Zhang         }
5284b2e90caSHong Zhang         nrows_i += nrows;
529fcd7ac73SHong Zhang         /* loop over columns of B marking them in rowhit */
530d3825b63SHong Zhang         for (k=0; k<nrows; k++) {
531d3825b63SHong Zhang           /* set valaddrhit for part B */
532fcd7ac73SHong Zhang           spidx            = spidxB[B_ci[colb] + k];
5330d1c53f1SHong Zhang           valaddrhit[*row] = &B_val[bs2*spidx];
53470e7395fSHong Zhang           rowhit[*row++]   = colb + 1 + cend - cstart; /* local column index */
535fcd7ac73SHong Zhang         }
536fcd7ac73SHong Zhang       }
537fcd7ac73SHong Zhang     }
5384b2e90caSHong Zhang     c->nrows[i] = nrows_i;
5398bc97078SHong Zhang 
540d3825b63SHong Zhang     for (j=0; j<m; j++) {
541fcd7ac73SHong Zhang       if (rowhit[j]) {
542573f477fSHong Zhang         Jentry[nz].row     = j;              /* local row index */
543573f477fSHong Zhang         Jentry[nz].col     = rowhit[j] - 1;  /* local column index */
544573f477fSHong Zhang         Jentry[nz].valaddr = valaddrhit[j];  /* address of mat value for this entry */
545573f477fSHong Zhang         nz++;
546fcd7ac73SHong Zhang       }
547fcd7ac73SHong Zhang     }
548fcd7ac73SHong Zhang     ierr = PetscFree(cols);CHKERRQ(ierr);
549fcd7ac73SHong Zhang   }
5508bc97078SHong Zhang   ierr = ISColoringRestoreIS(iscoloring,&isa);CHKERRQ(ierr);
5510d1c53f1SHong Zhang   //if (nz != spA->nz + spB->nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"nz %d != mat->nz %d\n",nz,spA->nz+spB->nz);
552fcd7ac73SHong Zhang 
553d3825b63SHong Zhang   ierr = PetscFree2(rowhit,valaddrhit);CHKERRQ(ierr);
5540d1c53f1SHong Zhang   if (isBAIJ) {
5550d1c53f1SHong Zhang     ierr = MatRestoreColumnIJ_SeqBAIJ_Color(A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&spidxA,NULL);CHKERRQ(ierr);
5560d1c53f1SHong Zhang     ierr = MatRestoreColumnIJ_SeqBAIJ_Color(B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&spidxB,NULL);CHKERRQ(ierr);
5570d1c53f1SHong Zhang     ierr = PetscMalloc(bs*mat->cmap->n*sizeof(PetscScalar),&c->dy);CHKERRQ(ierr);
5580d1c53f1SHong Zhang     mat->ops->fdcoloringapply = MatFDColoringApply_BAIJ_new;
5590d1c53f1SHong Zhang   } else {
5600d1c53f1SHong Zhang     ierr = MatRestoreColumnIJ_SeqAIJ_Color(A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&spidxA,NULL);CHKERRQ(ierr);
5610d1c53f1SHong Zhang     ierr = MatRestoreColumnIJ_SeqAIJ_Color(B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&spidxB,NULL);CHKERRQ(ierr);
5620d1c53f1SHong Zhang     mat->ops->fdcoloringapply = MatFDColoringApply_AIJ_new;
5630d1c53f1SHong Zhang   }
5640d1c53f1SHong Zhang 
56572c15787SHong Zhang   if (ctype == IS_COLORING_GHOSTED) {
56672c15787SHong Zhang     ierr = ISLocalToGlobalMappingRestoreIndices(map,&ltog);CHKERRQ(ierr);
56772c15787SHong Zhang   }
568fcd7ac73SHong Zhang   PetscFunctionReturn(0);
569fcd7ac73SHong Zhang }
570fcd7ac73SHong Zhang 
571fcd7ac73SHong Zhang /*------------------------------------------------------*/
572fcd7ac73SHong Zhang #undef __FUNCT__
5734a2ae208SSatish Balay #define __FUNCT__ "MatFDColoringCreate_MPIAIJ"
574dfbe8321SBarry Smith PetscErrorCode MatFDColoringCreate_MPIAIJ(Mat mat,ISColoring iscoloring,MatFDColoring c)
575a64fbb32SBarry Smith {
5766eaac0f3SBarry Smith   Mat_MPIAIJ             *aij = (Mat_MPIAIJ*)mat->data;
5776849ba73SBarry Smith   PetscErrorCode         ierr;
578b1d57f15SBarry Smith   PetscMPIInt            size,*ncolsonproc,*disp,nn;
5791a83f524SJed Brown   PetscInt               i,n,nrows,j,k,m,ncols,col;
580afcb2eb5SJed Brown   const PetscInt         *is,*A_ci,*A_cj,*B_ci,*B_cj,*rows = 0,*ltog;
5811a83f524SJed Brown   PetscInt               nis = iscoloring->n,nctot,*cols;
582f6d58c54SBarry Smith   PetscInt               *rowhit,M,cstart,cend,colb;
583b1d57f15SBarry Smith   PetscInt               *columnsforrow,l;
584b9617806SBarry Smith   IS                     *isa;
585ace3abfcSBarry Smith   PetscBool              done,flg;
586992144d0SBarry Smith   ISLocalToGlobalMapping map   = mat->cmap->mapping;
587afcb2eb5SJed Brown   PetscInt               ctype=c->ctype;
588fcd7ac73SHong Zhang   PetscBool              new_impl=PETSC_FALSE;
589a64fbb32SBarry Smith 
5903a40ed3dSBarry Smith   PetscFunctionBegin;
591fcd7ac73SHong Zhang   ierr = PetscOptionsName("-new","using new impls","",&new_impl);CHKERRQ(ierr);
592fcd7ac73SHong Zhang   if (new_impl){
593fcd7ac73SHong Zhang     ierr =  MatFDColoringCreate_MPIAIJ_new(mat,iscoloring,c);CHKERRQ(ierr);
594fcd7ac73SHong Zhang     PetscFunctionReturn(0);
595fcd7ac73SHong Zhang   }
596ce94432eSBarry Smith   if (ctype == IS_COLORING_GHOSTED && !map) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"When using ghosted differencing matrix must have local to global mapping provided with MatSetLocalToGlobalMapping");
597522c5e43SBarry Smith 
598afcb2eb5SJed Brown   if (map) {ierr = ISLocalToGlobalMappingGetIndices(map,&ltog);CHKERRQ(ierr);}
599afcb2eb5SJed Brown   else     ltog = NULL;
600b9617806SBarry Smith   ierr = ISColoringGetIS(iscoloring,PETSC_IGNORE,&isa);CHKERRQ(ierr);
6013acb8795SBarry Smith 
602f6d58c54SBarry Smith   M         = mat->rmap->n;
603f6d58c54SBarry Smith   cstart    = mat->cmap->rstart;
604f6d58c54SBarry Smith   cend      = mat->cmap->rend;
605f6d58c54SBarry Smith   c->M      = mat->rmap->N;         /* set the global rows and columns and local rows */
606f6d58c54SBarry Smith   c->N      = mat->cmap->N;
607f6d58c54SBarry Smith   c->m      = mat->rmap->n;
608f6d58c54SBarry Smith   c->rstart = mat->rmap->rstart;
609005c665bSBarry Smith 
610a64fbb32SBarry Smith   c->ncolors = nis;
611b1d57f15SBarry Smith   ierr       = PetscMalloc(nis*sizeof(PetscInt),&c->ncolumns);CHKERRQ(ierr);
612b1d57f15SBarry Smith   ierr       = PetscMalloc(nis*sizeof(PetscInt*),&c->columns);CHKERRQ(ierr);
613b1d57f15SBarry Smith   ierr       = PetscMalloc(nis*sizeof(PetscInt),&c->nrows);CHKERRQ(ierr);
614b1d57f15SBarry Smith   ierr       = PetscMalloc(nis*sizeof(PetscInt*),&c->rows);CHKERRQ(ierr);
615b1d57f15SBarry Smith   ierr       = PetscMalloc(nis*sizeof(PetscInt*),&c->columnsforrow);CHKERRQ(ierr);
6163bb1ff40SBarry Smith   ierr       = PetscLogObjectMemory((PetscObject)c,5*nis*sizeof(PetscInt));CHKERRQ(ierr);
6176eaac0f3SBarry Smith 
6186eaac0f3SBarry Smith   /* Allow access to data structures of local part of matrix */
6196eaac0f3SBarry Smith   if (!aij->colmap) {
620ab9863d7SBarry Smith     ierr = MatCreateColmap_MPIAIJ_Private(mat);CHKERRQ(ierr);
6216eaac0f3SBarry Smith   }
6223acb8795SBarry Smith   ierr = MatGetColumnIJ(aij->A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&done);CHKERRQ(ierr);
6233acb8795SBarry Smith   ierr = MatGetColumnIJ(aij->B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&done);CHKERRQ(ierr);
6246eaac0f3SBarry Smith 
625b1d57f15SBarry Smith   ierr = PetscMalloc((M+1)*sizeof(PetscInt),&rowhit);CHKERRQ(ierr);
626b1d57f15SBarry Smith   ierr = PetscMalloc((M+1)*sizeof(PetscInt),&columnsforrow);CHKERRQ(ierr);
6276eaac0f3SBarry Smith 
628a64fbb32SBarry Smith   for (i=0; i<nis; i++) {
629b9b97703SBarry Smith     ierr = ISGetLocalSize(isa[i],&n);CHKERRQ(ierr);
630a64fbb32SBarry Smith     ierr = ISGetIndices(isa[i],&is);CHKERRQ(ierr);
6312205254eSKarl Rupp 
632fcd7ac73SHong Zhang     c->ncolumns[i] = n; /* local number of columns of this color on this process */
633a64fbb32SBarry Smith     if (n) {
634b1d57f15SBarry Smith       ierr = PetscMalloc(n*sizeof(PetscInt),&c->columns[i]);CHKERRQ(ierr);
6353bb1ff40SBarry Smith       ierr = PetscLogObjectMemory((PetscObject)c,n*sizeof(PetscInt));CHKERRQ(ierr);
636b1d57f15SBarry Smith       ierr = PetscMemcpy(c->columns[i],is,n*sizeof(PetscInt));CHKERRQ(ierr);
637a64fbb32SBarry Smith     } else {
638a64fbb32SBarry Smith       c->columns[i] = 0;
639a64fbb32SBarry Smith     }
640a64fbb32SBarry Smith 
6418ee2e534SBarry Smith     if (ctype == IS_COLORING_GLOBAL) {
6426eaac0f3SBarry Smith       /* Determine the total (parallel) number of columns of this color */
643ce94432eSBarry Smith       ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&size);CHKERRQ(ierr);
644687f1162SBarry Smith       ierr = PetscMalloc2(size,PetscMPIInt,&ncolsonproc,size,PetscMPIInt,&disp);CHKERRQ(ierr);
645b8f8c88eSHong Zhang 
6464dc2109aSBarry Smith       ierr  = PetscMPIIntCast(n,&nn);CHKERRQ(ierr);
647ce94432eSBarry Smith       ierr  = MPI_Allgather(&nn,1,MPI_INT,ncolsonproc,1,MPI_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
6482205254eSKarl Rupp       nctot = 0; for (j=0; j<size; j++) nctot += ncolsonproc[j];
6493a7fca6bSBarry Smith       if (!nctot) {
650ae15b995SBarry Smith         ierr = PetscInfo(mat,"Coloring of matrix has some unneeded colors with no corresponding rows\n");CHKERRQ(ierr);
6513a7fca6bSBarry Smith       }
6526eaac0f3SBarry Smith 
6536eaac0f3SBarry Smith       disp[0] = 0;
6546eaac0f3SBarry Smith       for (j=1; j<size; j++) {
6556eaac0f3SBarry Smith         disp[j] = disp[j-1] + ncolsonproc[j-1];
6566eaac0f3SBarry Smith       }
6576eaac0f3SBarry Smith 
6586eaac0f3SBarry Smith       /* Get complete list of columns for color on each processor */
659b1d57f15SBarry Smith       ierr = PetscMalloc((nctot+1)*sizeof(PetscInt),&cols);CHKERRQ(ierr);
660ce94432eSBarry Smith       ierr = MPI_Allgatherv((void*)is,n,MPIU_INT,cols,ncolsonproc,disp,MPIU_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
6611d79065fSBarry Smith       ierr = PetscFree2(ncolsonproc,disp);CHKERRQ(ierr);
662b8f8c88eSHong Zhang     } else if (ctype == IS_COLORING_GHOSTED) {
663b8f8c88eSHong Zhang       /* Determine local number of columns of this color on this process, including ghost points */
664b8f8c88eSHong Zhang       nctot = n;
665b8f8c88eSHong Zhang       ierr  = PetscMalloc((nctot+1)*sizeof(PetscInt),&cols);CHKERRQ(ierr);
666b8f8c88eSHong Zhang       ierr  = PetscMemcpy(cols,is,n*sizeof(PetscInt));CHKERRQ(ierr);
667f23aa3ddSBarry Smith     } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not provided for this MatFDColoring type");
6686eaac0f3SBarry Smith 
6696eaac0f3SBarry Smith     /*
6706eaac0f3SBarry Smith        Mark all rows affect by these columns
6716eaac0f3SBarry Smith     */
672b8f8c88eSHong Zhang     /* Temporary option to allow for debugging/testing */
67390d69ab7SBarry Smith     flg  = PETSC_FALSE;
6740298fd71SBarry Smith     ierr = PetscOptionsGetBool(NULL,"-matfdcoloring_slow",&flg,NULL);CHKERRQ(ierr);
675f158e583SBarry Smith     if (!flg) { /*-----------------------------------------------------------------------------*/
676f158e583SBarry Smith       /* crude, fast version */
677b1d57f15SBarry Smith       ierr = PetscMemzero(rowhit,M*sizeof(PetscInt));CHKERRQ(ierr);
678a64fbb32SBarry Smith       /* loop over columns*/
6796eaac0f3SBarry Smith       for (j=0; j<nctot; j++) {
680b8f8c88eSHong Zhang         if (ctype == IS_COLORING_GHOSTED) {
681b8f8c88eSHong Zhang           col = ltog[cols[j]];
682b8f8c88eSHong Zhang         } else {
6836eaac0f3SBarry Smith           col = cols[j];
684b8f8c88eSHong Zhang         }
6856eaac0f3SBarry Smith         if (col >= cstart && col < cend) {
6866eaac0f3SBarry Smith           /* column is in diagonal block of matrix */
6876eaac0f3SBarry Smith           rows = A_cj + A_ci[col-cstart];
6886eaac0f3SBarry Smith           m    = A_ci[col-cstart+1] - A_ci[col-cstart];
6896eaac0f3SBarry Smith         } else {
690aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
691cb9801acSJed Brown           ierr = PetscTableFind(aij->colmap,col+1,&colb);CHKERRQ(ierr);
692fa46199cSSatish Balay           colb--;
693b3d2dc96SSatish Balay #else
6946eaac0f3SBarry Smith           colb = aij->colmap[col] - 1;
695b3d2dc96SSatish Balay #endif
6966eaac0f3SBarry Smith           if (colb == -1) {
6976eaac0f3SBarry Smith             m = 0;
6986eaac0f3SBarry Smith           } else {
6996eaac0f3SBarry Smith             rows = B_cj + B_ci[colb];
7006eaac0f3SBarry Smith             m    = B_ci[colb+1] - B_ci[colb];
7016eaac0f3SBarry Smith           }
7026eaac0f3SBarry Smith         }
703a64fbb32SBarry Smith         /* loop over columns marking them in rowhit */
704a64fbb32SBarry Smith         for (k=0; k<m; k++) {
705a64fbb32SBarry Smith           rowhit[*rows++] = col + 1;
706a64fbb32SBarry Smith         }
707a64fbb32SBarry Smith       }
7086eaac0f3SBarry Smith 
709a64fbb32SBarry Smith       /* count the number of hits */
710a64fbb32SBarry Smith       nrows = 0;
7116eaac0f3SBarry Smith       for (j=0; j<M; j++) {
712a64fbb32SBarry Smith         if (rowhit[j]) nrows++;
713a64fbb32SBarry Smith       }
714a64fbb32SBarry Smith       c->nrows[i] = nrows;
715b1d57f15SBarry Smith       ierr        = PetscMalloc((nrows+1)*sizeof(PetscInt),&c->rows[i]);CHKERRQ(ierr);
716b1d57f15SBarry Smith       ierr        = PetscMalloc((nrows+1)*sizeof(PetscInt),&c->columnsforrow[i]);CHKERRQ(ierr);
7173bb1ff40SBarry Smith       ierr        = PetscLogObjectMemory((PetscObject)c,2*(nrows+1)*sizeof(PetscInt));CHKERRQ(ierr);
718a64fbb32SBarry Smith       nrows       = 0;
7196eaac0f3SBarry Smith       for (j=0; j<M; j++) {
720a64fbb32SBarry Smith         if (rowhit[j]) {
721fcd7ac73SHong Zhang           c->rows[i][nrows]          = j;              /* local row index */
722fcd7ac73SHong Zhang           c->columnsforrow[i][nrows] = rowhit[j] - 1;  /* global column index */
723a64fbb32SBarry Smith           nrows++;
724a64fbb32SBarry Smith         }
725a64fbb32SBarry Smith       }
726a64fbb32SBarry Smith     } else { /*-------------------------------------------------------------------------------*/
727f158e583SBarry Smith       /* slow version, using rowhit as a linked list */
728b1d57f15SBarry Smith       PetscInt currentcol,fm,mfm;
7296eaac0f3SBarry Smith       rowhit[M] = M;
730a64fbb32SBarry Smith       nrows     = 0;
731a64fbb32SBarry Smith       /* loop over columns*/
7326eaac0f3SBarry Smith       for (j=0; j<nctot; j++) {
733b8f8c88eSHong Zhang         if (ctype == IS_COLORING_GHOSTED) {
734b8f8c88eSHong Zhang           col = ltog[cols[j]];
735b8f8c88eSHong Zhang         } else {
7366eaac0f3SBarry Smith           col = cols[j];
737b8f8c88eSHong Zhang         }
7386eaac0f3SBarry Smith         if (col >= cstart && col < cend) {
7396eaac0f3SBarry Smith           /* column is in diagonal block of matrix */
7406eaac0f3SBarry Smith           rows = A_cj + A_ci[col-cstart];
7416eaac0f3SBarry Smith           m    = A_ci[col-cstart+1] - A_ci[col-cstart];
7426eaac0f3SBarry Smith         } else {
743aa482453SBarry Smith #if defined(PETSC_USE_CTABLE)
7440f5bd95cSBarry Smith           ierr = PetscTableFind(aij->colmap,col+1,&colb);CHKERRQ(ierr);
745fa46199cSSatish Balay           colb--;
746b3d2dc96SSatish Balay #else
7476eaac0f3SBarry Smith           colb = aij->colmap[col] - 1;
748b3d2dc96SSatish Balay #endif
7496eaac0f3SBarry Smith           if (colb == -1) {
7506eaac0f3SBarry Smith             m = 0;
7516eaac0f3SBarry Smith           } else {
7526eaac0f3SBarry Smith             rows = B_cj + B_ci[colb];
7536eaac0f3SBarry Smith             m    = B_ci[colb+1] - B_ci[colb];
7546eaac0f3SBarry Smith           }
7556eaac0f3SBarry Smith         }
756b8f8c88eSHong Zhang 
757a64fbb32SBarry Smith         /* loop over columns marking them in rowhit */
7586eaac0f3SBarry Smith         fm = M;    /* fm points to first entry in linked list */
759a64fbb32SBarry Smith         for (k=0; k<m; k++) {
760a64fbb32SBarry Smith           currentcol = *rows++;
761a64fbb32SBarry Smith           /* is it already in the list? */
762a64fbb32SBarry Smith           do {
763a64fbb32SBarry Smith             mfm = fm;
764a64fbb32SBarry Smith             fm  = rowhit[fm];
765a64fbb32SBarry Smith           } while (fm < currentcol);
766a64fbb32SBarry Smith           /* not in list so add it */
767a64fbb32SBarry Smith           if (fm != currentcol) {
768a64fbb32SBarry Smith             nrows++;
769a64fbb32SBarry Smith             columnsforrow[currentcol] = col;
770a64fbb32SBarry Smith             /* next three lines insert new entry into linked list */
771a64fbb32SBarry Smith             rowhit[mfm]        = currentcol;
772a64fbb32SBarry Smith             rowhit[currentcol] = fm;
773a64fbb32SBarry Smith             fm                 = currentcol;
774a64fbb32SBarry Smith             /* fm points to present position in list since we know the columns are sorted */
775f23aa3ddSBarry Smith           } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Invalid coloring of matrix detected");
776a64fbb32SBarry Smith         }
777a64fbb32SBarry Smith       }
778a64fbb32SBarry Smith       c->nrows[i] = nrows;
7792205254eSKarl Rupp 
780b1d57f15SBarry Smith       ierr = PetscMalloc((nrows+1)*sizeof(PetscInt),&c->rows[i]);CHKERRQ(ierr);
781b1d57f15SBarry Smith       ierr = PetscMalloc((nrows+1)*sizeof(PetscInt),&c->columnsforrow[i]);CHKERRQ(ierr);
7823bb1ff40SBarry Smith       ierr = PetscLogObjectMemory((PetscObject)c,(nrows+1)*sizeof(PetscInt));CHKERRQ(ierr);
783a64fbb32SBarry Smith       /* now store the linked list of rows into c->rows[i] */
784a64fbb32SBarry Smith       nrows = 0;
7856eaac0f3SBarry Smith       fm    = rowhit[M];
786a64fbb32SBarry Smith       do {
787a64fbb32SBarry Smith         c->rows[i][nrows]            = fm;
788a64fbb32SBarry Smith         c->columnsforrow[i][nrows++] = columnsforrow[fm];
789a64fbb32SBarry Smith         fm                           = rowhit[fm];
7906eaac0f3SBarry Smith       } while (fm < M);
7916eaac0f3SBarry Smith     } /* ---------------------------------------------------------------------------------------*/
792606d414cSSatish Balay     ierr = PetscFree(cols);CHKERRQ(ierr);
7936eaac0f3SBarry Smith   }
79430b34957SBarry Smith 
79530b34957SBarry Smith   /* Optimize by adding the vscale, and scaleforrow[][] fields */
79630b34957SBarry Smith   /*
79730b34957SBarry Smith        vscale will contain the "diagonal" on processor scalings followed by the off processor
79830b34957SBarry Smith   */
7998ee2e534SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
800ce94432eSBarry Smith     ierr = VecCreateGhost(PetscObjectComm((PetscObject)mat),aij->A->rmap->n,PETSC_DETERMINE,aij->B->cmap->n,aij->garray,&c->vscale);CHKERRQ(ierr);
801b1d57f15SBarry Smith     ierr = PetscMalloc(c->ncolors*sizeof(PetscInt*),&c->vscaleforrow);CHKERRQ(ierr);
80230b34957SBarry Smith     for (k=0; k<c->ncolors; k++) {
803b1d57f15SBarry Smith       ierr = PetscMalloc((c->nrows[k]+1)*sizeof(PetscInt),&c->vscaleforrow[k]);CHKERRQ(ierr);
80430b34957SBarry Smith       for (l=0; l<c->nrows[k]; l++) {
80530b34957SBarry Smith         col = c->columnsforrow[k][l];
80630b34957SBarry Smith         if (col >= cstart && col < cend) {
80730b34957SBarry Smith           /* column is in diagonal block of matrix */
80830b34957SBarry Smith           colb = col - cstart;
80930b34957SBarry Smith         } else {
81030b34957SBarry Smith           /* column  is in "off-processor" part */
81130b34957SBarry Smith #if defined(PETSC_USE_CTABLE)
81230b34957SBarry Smith           ierr = PetscTableFind(aij->colmap,col+1,&colb);CHKERRQ(ierr);
81330b34957SBarry Smith           colb--;
81430b34957SBarry Smith #else
81530b34957SBarry Smith           colb = aij->colmap[col] - 1;
81630b34957SBarry Smith #endif
81730b34957SBarry Smith           colb += cend - cstart;
81830b34957SBarry Smith         }
81930b34957SBarry Smith         c->vscaleforrow[k][l] = colb;
82030b34957SBarry Smith       }
82130b34957SBarry Smith     }
822b8f8c88eSHong Zhang   } else if (ctype == IS_COLORING_GHOSTED) {
823b8f8c88eSHong Zhang     /* Get gtol mapping */
824afcb2eb5SJed Brown     PetscInt N = mat->cmap->N,nlocal,*gtol;
825b8f8c88eSHong Zhang     ierr = PetscMalloc((N+1)*sizeof(PetscInt),&gtol);CHKERRQ(ierr);
826b8f8c88eSHong Zhang     for (i=0; i<N; i++) gtol[i] = -1;
827afcb2eb5SJed Brown     ierr = ISLocalToGlobalMappingGetSize(map,&nlocal);CHKERRQ(ierr);
828afcb2eb5SJed Brown     for (i=0; i<nlocal; i++) gtol[ltog[i]] = i;
829b8f8c88eSHong Zhang 
830b8f8c88eSHong Zhang     c->vscale = 0; /* will be created in MatFDColoringApply() */
831b8f8c88eSHong Zhang     ierr      = PetscMalloc(c->ncolors*sizeof(PetscInt*),&c->vscaleforrow);CHKERRQ(ierr);
832b8f8c88eSHong Zhang     for (k=0; k<c->ncolors; k++) {
833b8f8c88eSHong Zhang       ierr = PetscMalloc((c->nrows[k]+1)*sizeof(PetscInt),&c->vscaleforrow[k]);CHKERRQ(ierr);
834b8f8c88eSHong Zhang       for (l=0; l<c->nrows[k]; l++) {
835b8f8c88eSHong Zhang         col = c->columnsforrow[k][l];      /* global column index */
836b8f8c88eSHong Zhang         c->vscaleforrow[k][l] = gtol[col]; /* local column index */
837b8f8c88eSHong Zhang       }
838b8f8c88eSHong Zhang     }
839b8f8c88eSHong Zhang     ierr = PetscFree(gtol);CHKERRQ(ierr);
840b8f8c88eSHong Zhang   }
841b9617806SBarry Smith   ierr = ISColoringRestoreIS(iscoloring,&isa);CHKERRQ(ierr);
84230b34957SBarry Smith 
843606d414cSSatish Balay   ierr = PetscFree(rowhit);CHKERRQ(ierr);
844606d414cSSatish Balay   ierr = PetscFree(columnsforrow);CHKERRQ(ierr);
8453acb8795SBarry Smith   ierr = MatRestoreColumnIJ(aij->A,0,PETSC_FALSE,PETSC_FALSE,&ncols,&A_ci,&A_cj,&done);CHKERRQ(ierr);
8463acb8795SBarry Smith   ierr = MatRestoreColumnIJ(aij->B,0,PETSC_FALSE,PETSC_FALSE,&ncols,&B_ci,&B_cj,&done);CHKERRQ(ierr);
847afcb2eb5SJed Brown   if (map) {ierr = ISLocalToGlobalMappingRestoreIndices(map,&ltog);CHKERRQ(ierr);}
8483a40ed3dSBarry Smith   PetscFunctionReturn(0);
849a64fbb32SBarry Smith }
850a64fbb32SBarry Smith 
851b9617806SBarry Smith 
852b9617806SBarry Smith 
853b9617806SBarry Smith 
854b9617806SBarry Smith 
855b9617806SBarry Smith 
856