1be1d678aSKris Buschelman #define PETSCMAT_DLL 2b3cc6726SBarry Smith 3d5d45c9bSBarry Smith /* 43369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 5d5d45c9bSBarry Smith matrix storage format. 6d5d45c9bSBarry Smith */ 73369ce9aSBarry Smith 89e070d67SMatthew Knepley #include "src/mat/impls/aij/seq/aij.h" /*I "petscmat.h" I*/ 9f5eb4b81SSatish Balay #include "src/inline/spops.h" 108d195f9aSBarry Smith #include "src/inline/dot.h" 110a835dfdSSatish Balay #include "petscbt.h" 1217ab2063SBarry Smith 134a2ae208SSatish Balay #undef __FUNCT__ 144a2ae208SSatish Balay #define __FUNCT__ "MatGetRowIJ_SeqAIJ" 1597f1f81fSBarry Smith PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscTruth symmetric,PetscInt *m,PetscInt *ia[],PetscInt *ja[],PetscTruth *done) 1617ab2063SBarry Smith { 17416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 18dfbe8321SBarry Smith PetscErrorCode ierr; 1997f1f81fSBarry Smith PetscInt i,ishift; 2017ab2063SBarry Smith 213a40ed3dSBarry Smith PetscFunctionBegin; 2231625ec5SSatish Balay *m = A->m; 233a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 24bfeeae90SHong Zhang ishift = 0; 2553e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 26273d9f13SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->m,a->i,a->j,ishift,oshift,ia,ja);CHKERRQ(ierr); 27bfeeae90SHong Zhang } else if (oshift == 1) { 2897f1f81fSBarry Smith PetscInt nz = a->i[A->m]; 293b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 3097f1f81fSBarry Smith ierr = PetscMalloc((A->m+1)*sizeof(PetscInt),ia);CHKERRQ(ierr); 3197f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),ja);CHKERRQ(ierr); 323b2fbd54SBarry Smith for (i=0; i<nz; i++) (*ja)[i] = a->j[i] + 1; 33273d9f13SBarry Smith for (i=0; i<A->m+1; i++) (*ia)[i] = a->i[i] + 1; 346945ee14SBarry Smith } else { 356945ee14SBarry Smith *ia = a->i; *ja = a->j; 36a2ce50c7SBarry Smith } 373a40ed3dSBarry Smith PetscFunctionReturn(0); 38a2744918SBarry Smith } 
39a2744918SBarry Smith 404a2ae208SSatish Balay #undef __FUNCT__ 414a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRowIJ_SeqAIJ" 4297f1f81fSBarry Smith PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscTruth symmetric,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscTruth *done) 436945ee14SBarry Smith { 44dfbe8321SBarry Smith PetscErrorCode ierr; 456945ee14SBarry Smith 463a40ed3dSBarry Smith PetscFunctionBegin; 473a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 48bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 49606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 50606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 51bcd2baecSBarry Smith } 523a40ed3dSBarry Smith PetscFunctionReturn(0); 5317ab2063SBarry Smith } 5417ab2063SBarry Smith 554a2ae208SSatish Balay #undef __FUNCT__ 564a2ae208SSatish Balay #define __FUNCT__ "MatGetColumnIJ_SeqAIJ" 5797f1f81fSBarry Smith PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscTruth symmetric,PetscInt *nn,PetscInt *ia[],PetscInt *ja[],PetscTruth *done) 583b2fbd54SBarry Smith { 593b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 60dfbe8321SBarry Smith PetscErrorCode ierr; 6197f1f81fSBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->n,m = A->m; 6297f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 633b2fbd54SBarry Smith 643a40ed3dSBarry Smith PetscFunctionBegin; 653b2fbd54SBarry Smith *nn = A->n; 663a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 673b2fbd54SBarry Smith if (symmetric) { 68bfeeae90SHong Zhang ierr = MatToSymmetricIJ_SeqAIJ(A->m,a->i,a->j,0,oshift,ia,ja);CHKERRQ(ierr); 693b2fbd54SBarry Smith } else { 7097f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&collengths);CHKERRQ(ierr); 7197f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 7297f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&cia);CHKERRQ(ierr); 7397f1f81fSBarry Smith ierr = 
PetscMalloc((nz+1)*sizeof(PetscInt),&cja);CHKERRQ(ierr); 743b2fbd54SBarry Smith jj = a->j; 753b2fbd54SBarry Smith for (i=0; i<nz; i++) { 76bfeeae90SHong Zhang collengths[jj[i]]++; 773b2fbd54SBarry Smith } 783b2fbd54SBarry Smith cia[0] = oshift; 793b2fbd54SBarry Smith for (i=0; i<n; i++) { 803b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 813b2fbd54SBarry Smith } 8297f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 833b2fbd54SBarry Smith jj = a->j; 84a93ec695SBarry Smith for (row=0; row<m; row++) { 85a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 86a93ec695SBarry Smith for (i=0; i<mr; i++) { 87bfeeae90SHong Zhang col = *jj++; 883b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 893b2fbd54SBarry Smith } 903b2fbd54SBarry Smith } 91606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 923b2fbd54SBarry Smith *ia = cia; *ja = cja; 933b2fbd54SBarry Smith } 943a40ed3dSBarry Smith PetscFunctionReturn(0); 953b2fbd54SBarry Smith } 963b2fbd54SBarry Smith 974a2ae208SSatish Balay #undef __FUNCT__ 984a2ae208SSatish Balay #define __FUNCT__ "MatRestoreColumnIJ_SeqAIJ" 9997f1f81fSBarry Smith PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscTruth symmetric,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscTruth *done) 1003b2fbd54SBarry Smith { 101dfbe8321SBarry Smith PetscErrorCode ierr; 102606d414cSSatish Balay 1033a40ed3dSBarry Smith PetscFunctionBegin; 1043a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 1053b2fbd54SBarry Smith 106606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 107606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 1083b2fbd54SBarry Smith 1093a40ed3dSBarry Smith PetscFunctionReturn(0); 1103b2fbd54SBarry Smith } 1113b2fbd54SBarry Smith 112227d817aSBarry Smith #define CHUNKSIZE 15 11317ab2063SBarry Smith 1144a2ae208SSatish Balay #undef __FUNCT__ 1154a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqAIJ" 11697f1f81fSBarry Smith 
PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 11717ab2063SBarry Smith { 118416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 119e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 12097f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 1216849ba73SBarry Smith PetscErrorCode ierr; 122e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 12387828ca2SBarry Smith PetscScalar *ap,value,*aa = a->a; 12436db0b34SBarry Smith PetscTruth ignorezeroentries = ((a->ignorezeroentries && is == ADD_VALUES) ? PETSC_TRUE:PETSC_FALSE); 125273d9f13SBarry Smith PetscTruth roworiented = a->roworiented; 12617ab2063SBarry Smith 1273a40ed3dSBarry Smith PetscFunctionBegin; 12817ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 129416022c9SBarry Smith row = im[k]; 1305ef9f2a5SBarry Smith if (row < 0) continue; 1312515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 13277431f27SBarry Smith if (row >= A->m) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->m-1); 1333b2fbd54SBarry Smith #endif 134bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 13517ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 136416022c9SBarry Smith low = 0; 137c71e6ed7SBarry Smith high = nrow; 13817ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 1395ef9f2a5SBarry Smith if (in[l] < 0) continue; 1402515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 14177431f27SBarry Smith if (in[l] >= A->n) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->n-1); 1423b2fbd54SBarry Smith #endif 143bfeeae90SHong Zhang col = in[l]; 1444b0e389bSBarry Smith if (roworiented) { 1455ef9f2a5SBarry Smith value = v[l + k*n]; 146bef8e0ddSBarry Smith } else { 1474b0e389bSBarry Smith value = v[k + l*m]; 1484b0e389bSBarry Smith } 149abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries && 
(is == ADD_VALUES)) continue; 15036db0b34SBarry Smith 151c71e6ed7SBarry Smith if (col < lastcol) low = 0; else high = nrow; 152e2ee6c50SBarry Smith lastcol = col; 153416022c9SBarry Smith while (high-low > 5) { 154416022c9SBarry Smith t = (low+high)/2; 155416022c9SBarry Smith if (rp[t] > col) high = t; 156416022c9SBarry Smith else low = t; 15717ab2063SBarry Smith } 158416022c9SBarry Smith for (i=low; i<high; i++) { 15917ab2063SBarry Smith if (rp[i] > col) break; 16017ab2063SBarry Smith if (rp[i] == col) { 161416022c9SBarry Smith if (is == ADD_VALUES) ap[i] += value; 16217ab2063SBarry Smith else ap[i] = value; 16317ab2063SBarry Smith goto noinsert; 16417ab2063SBarry Smith } 16517ab2063SBarry Smith } 166abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 167c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 16877431f27SBarry Smith else if (nonew == -1) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 16917ab2063SBarry Smith if (nrow >= rmax) { 17017ab2063SBarry Smith /* there is no extra room in row, therefore enlarge */ 17197f1f81fSBarry Smith PetscInt new_nz = ai[A->m] + CHUNKSIZE,*new_i,*new_j; 172a7ed9263SMatthew Knepley size_t len; 17387828ca2SBarry Smith PetscScalar *new_a; 17417ab2063SBarry Smith 17577431f27SBarry Smith if (nonew == -2) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix requiring new malloc()",row,col); 17696854ed6SLois Curfman McInnes 17717ab2063SBarry Smith /* malloc new storage space */ 178a96a251dSBarry Smith ierr = PetscMalloc3(new_nz,PetscScalar,&new_a,new_nz,PetscInt,&new_j,A->m+1,PetscInt,&new_i);CHKERRQ(ierr); 17917ab2063SBarry Smith 18017ab2063SBarry Smith /* copy over old data into new slots */ 18117ab2063SBarry Smith for (ii=0; ii<row+1; ii++) {new_i[ii] = ai[ii];} 182273d9f13SBarry Smith for (ii=row+1; ii<A->m+1; ii++) {new_i[ii] = ai[ii]+CHUNKSIZE;} 18397f1f81fSBarry Smith ierr = 
PetscMemcpy(new_j,aj,(ai[row]+nrow)*sizeof(PetscInt));CHKERRQ(ierr); 184bfeeae90SHong Zhang len = (((size_t) new_nz) - CHUNKSIZE - ai[row] - nrow ); 18597f1f81fSBarry Smith ierr = PetscMemcpy(new_j+ai[row]+nrow+CHUNKSIZE,aj+ai[row]+nrow,len*sizeof(PetscInt));CHKERRQ(ierr); 186bfeeae90SHong Zhang ierr = PetscMemcpy(new_a,aa,(((size_t) ai[row])+nrow)*sizeof(PetscScalar));CHKERRQ(ierr); 187bfeeae90SHong Zhang ierr = PetscMemcpy(new_a+ai[row]+nrow+CHUNKSIZE,aa+ai[row]+nrow,len*sizeof(PetscScalar));CHKERRQ(ierr); 18817ab2063SBarry Smith /* free up old matrix storage */ 189606d414cSSatish Balay if (!a->singlemalloc) { 190a96a251dSBarry Smith ierr = PetscFree(a->a);CHKERRQ(ierr); 191606d414cSSatish Balay ierr = PetscFree(a->i);CHKERRQ(ierr); 192606d414cSSatish Balay ierr = PetscFree(a->j);CHKERRQ(ierr); 193a96a251dSBarry Smith } else { 194a96a251dSBarry Smith ierr = PetscFree3(a->a,a->i,a->j);CHKERRQ(ierr); 195606d414cSSatish Balay } 196416022c9SBarry Smith aa = a->a = new_a; ai = a->i = new_i; aj = a->j = new_j; 197f1e2ffcdSBarry Smith a->singlemalloc = PETSC_TRUE; 19817ab2063SBarry Smith 199bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row] ; 200416022c9SBarry Smith rmax = imax[row] = imax[row] + CHUNKSIZE; 20152e6d16bSBarry Smith ierr = PetscLogObjectMemory(A,CHUNKSIZE*(sizeof(PetscInt) + sizeof(PetscScalar)));CHKERRQ(ierr); 202416022c9SBarry Smith a->maxnz += CHUNKSIZE; 203b810aeb4SBarry Smith a->reallocs++; 20417ab2063SBarry Smith } 205416022c9SBarry Smith N = nrow++ - 1; a->nz++; 206416022c9SBarry Smith /* shift up all the later entries in this row */ 207416022c9SBarry Smith for (ii=N; ii>=i; ii--) { 20817ab2063SBarry Smith rp[ii+1] = rp[ii]; 20917ab2063SBarry Smith ap[ii+1] = ap[ii]; 21017ab2063SBarry Smith } 21117ab2063SBarry Smith rp[i] = col; 21217ab2063SBarry Smith ap[i] = value; 21317ab2063SBarry Smith noinsert:; 214416022c9SBarry Smith low = i + 1; 21517ab2063SBarry Smith } 21617ab2063SBarry Smith ailen[row] = nrow; 21717ab2063SBarry Smith } 
21888e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 2193a40ed3dSBarry Smith PetscFunctionReturn(0); 22017ab2063SBarry Smith } 22117ab2063SBarry Smith 2224a2ae208SSatish Balay #undef __FUNCT__ 2234a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqAIJ" 22497f1f81fSBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 2257eb43aa7SLois Curfman McInnes { 2267eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22797f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 22897f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 22987828ca2SBarry Smith PetscScalar *ap,*aa = a->a,zero = 0.0; 2307eb43aa7SLois Curfman McInnes 2313a40ed3dSBarry Smith PetscFunctionBegin; 2327eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 2337eb43aa7SLois Curfman McInnes row = im[k]; 23477431f27SBarry Smith if (row < 0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); 23577431f27SBarry Smith if (row >= A->m) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->m-1); 236bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 2377eb43aa7SLois Curfman McInnes nrow = ailen[row]; 2387eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 23977431f27SBarry Smith if (in[l] < 0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); 24077431f27SBarry Smith if (in[l] >= A->n) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->n-1); 241bfeeae90SHong Zhang col = in[l] ; 2427eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 2437eb43aa7SLois Curfman McInnes while (high-low > 5) { 2447eb43aa7SLois Curfman McInnes t = (low+high)/2; 2457eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 2467eb43aa7SLois Curfman McInnes else low = t; 2477eb43aa7SLois Curfman McInnes } 2487eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 2497eb43aa7SLois Curfman 
McInnes if (rp[i] > col) break; 2507eb43aa7SLois Curfman McInnes if (rp[i] == col) { 251b49de8d1SLois Curfman McInnes *v++ = ap[i]; 2527eb43aa7SLois Curfman McInnes goto finished; 2537eb43aa7SLois Curfman McInnes } 2547eb43aa7SLois Curfman McInnes } 255b49de8d1SLois Curfman McInnes *v++ = zero; 2567eb43aa7SLois Curfman McInnes finished:; 2577eb43aa7SLois Curfman McInnes } 2587eb43aa7SLois Curfman McInnes } 2593a40ed3dSBarry Smith PetscFunctionReturn(0); 2607eb43aa7SLois Curfman McInnes } 2617eb43aa7SLois Curfman McInnes 26217ab2063SBarry Smith 2634a2ae208SSatish Balay #undef __FUNCT__ 2644a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Binary" 265dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer) 26617ab2063SBarry Smith { 267416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2686849ba73SBarry Smith PetscErrorCode ierr; 2696f69ff64SBarry Smith PetscInt i,*col_lens; 2706f69ff64SBarry Smith int fd; 27117ab2063SBarry Smith 2723a40ed3dSBarry Smith PetscFunctionBegin; 273b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 27497f1f81fSBarry Smith ierr = PetscMalloc((4+A->m)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 275552e946dSBarry Smith col_lens[0] = MAT_FILE_COOKIE; 276273d9f13SBarry Smith col_lens[1] = A->m; 277273d9f13SBarry Smith col_lens[2] = A->n; 278416022c9SBarry Smith col_lens[3] = a->nz; 279416022c9SBarry Smith 280416022c9SBarry Smith /* store lengths of each row and write (including header) to file */ 281273d9f13SBarry Smith for (i=0; i<A->m; i++) { 282416022c9SBarry Smith col_lens[4+i] = a->i[i+1] - a->i[i]; 28317ab2063SBarry Smith } 2846f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+A->m,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 285606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 286416022c9SBarry Smith 287416022c9SBarry Smith /* store column indices (zero start index) */ 2886f69ff64SBarry Smith ierr = 
PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 289416022c9SBarry Smith 290416022c9SBarry Smith /* store nonzero values */ 2916f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 2923a40ed3dSBarry Smith PetscFunctionReturn(0); 29317ab2063SBarry Smith } 294416022c9SBarry Smith 295dfbe8321SBarry Smith EXTERN PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 296cd155464SBarry Smith 2974a2ae208SSatish Balay #undef __FUNCT__ 2984a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_ASCII" 299dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 300416022c9SBarry Smith { 301416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 302dfbe8321SBarry Smith PetscErrorCode ierr; 30397f1f81fSBarry Smith PetscInt i,j,m = A->m,shift=0; 304fb9695e5SSatish Balay char *name; 305f3ef73ceSBarry Smith PetscViewerFormat format; 30617ab2063SBarry Smith 3073a40ed3dSBarry Smith PetscFunctionBegin; 308435da068SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 309b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 31071c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 31197f1f81fSBarry Smith PetscInt nofinalvalue = 0; 312273d9f13SBarry Smith if ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->n-!shift)) { 313d00d2cf4SBarry Smith nofinalvalue = 1; 314d00d2cf4SBarry Smith } 315b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 31677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->n);CHKERRQ(ierr); 31777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 31877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 319b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 32017ab2063SBarry Smith 32117ab2063SBarry Smith 
for (i=0; i<m; i++) { 322416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 323aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 32477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e + %18.16ei \n",i+1,a->j[j]+!shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 32517ab2063SBarry Smith #else 32677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+!shift,a->a[j]);CHKERRQ(ierr); 32717ab2063SBarry Smith #endif 32817ab2063SBarry Smith } 32917ab2063SBarry Smith } 330d00d2cf4SBarry Smith if (nofinalvalue) { 33177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->n,0.0);CHKERRQ(ierr); 332d00d2cf4SBarry Smith } 333fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 334b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 33568369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 336cd155464SBarry Smith PetscFunctionReturn(0); 337fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 338b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 33944cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 34077431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 34144cd7ae7SLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 342aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 34336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 34477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 34536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 34677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g 
i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 34736db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 34877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 3496831982aSBarry Smith } 35044cd7ae7SLois Curfman McInnes #else 35177431f27SBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr);} 35244cd7ae7SLois Curfman McInnes #endif 35344cd7ae7SLois Curfman McInnes } 354b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 35544cd7ae7SLois Curfman McInnes } 356b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 357fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 35897f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 359b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 36097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&sptr);CHKERRQ(ierr); 361496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 362496be53dSLois Curfman McInnes sptr[i] = nzd+1; 363496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 364496be53dSLois Curfman McInnes if (a->j[j] >= i) { 365aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 36636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 367496be53dSLois Curfman McInnes #else 368496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 369496be53dSLois Curfman McInnes #endif 370496be53dSLois Curfman McInnes } 371496be53dSLois Curfman McInnes } 372496be53dSLois Curfman McInnes } 3732e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 37477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 3752e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 37677431f27SBarry Smith if (i+4<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D 
%D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr);} 37777431f27SBarry Smith else if (i+3<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr);} 37877431f27SBarry Smith else if (i+2<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr);} 37977431f27SBarry Smith else if (i+1<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr);} 38077431f27SBarry Smith else if (i<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr);} 38177431f27SBarry Smith else {ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr);} 382496be53dSLois Curfman McInnes } 383b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 384606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 385496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 386496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 38777431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 388496be53dSLois Curfman McInnes } 389b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 390496be53dSLois Curfman McInnes } 391b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 392496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 393496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 394496be53dSLois Curfman McInnes if (a->j[j] >= i) { 395aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 39636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 397b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 3986831982aSBarry Smith } 399496be53dSLois Curfman McInnes #else 400b0a32e0cSBarry 
Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",a->a[j]);CHKERRQ(ierr);} 401496be53dSLois Curfman McInnes #endif 402496be53dSLois Curfman McInnes } 403496be53dSLois Curfman McInnes } 404b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 405496be53dSLois Curfman McInnes } 406b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 407fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 40897f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 40987828ca2SBarry Smith PetscScalar value; 41002594712SBarry Smith 411b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 41202594712SBarry Smith for (i=0; i<m; i++) { 41302594712SBarry Smith jcnt = 0; 414273d9f13SBarry Smith for (j=0; j<A->n; j++) { 415e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 41602594712SBarry Smith value = a->a[cnt++]; 417e24b481bSBarry Smith jcnt++; 41802594712SBarry Smith } else { 41902594712SBarry Smith value = 0.0; 42002594712SBarry Smith } 421aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 422b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",PetscRealPart(value),PetscImaginaryPart(value));CHKERRQ(ierr); 42302594712SBarry Smith #else 424b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",value);CHKERRQ(ierr); 42502594712SBarry Smith #endif 42602594712SBarry Smith } 427b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 42802594712SBarry Smith } 429b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 4303a40ed3dSBarry Smith } else { 431b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 43217ab2063SBarry Smith for (i=0; i<m; i++) { 43377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 434416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 435aa482453SBarry Smith #if 
defined(PETSC_USE_COMPLEX) 43636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 43777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 43836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 43977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 4403a40ed3dSBarry Smith } else { 44177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 44217ab2063SBarry Smith } 44317ab2063SBarry Smith #else 44477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 44517ab2063SBarry Smith #endif 44617ab2063SBarry Smith } 447b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 44817ab2063SBarry Smith } 449b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 45017ab2063SBarry Smith } 451b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 4523a40ed3dSBarry Smith PetscFunctionReturn(0); 453416022c9SBarry Smith } 454416022c9SBarry Smith 4554a2ae208SSatish Balay #undef __FUNCT__ 4564a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw_Zoom" 457dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 458416022c9SBarry Smith { 459480ef9eaSBarry Smith Mat A = (Mat) Aa; 460416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 461dfbe8321SBarry Smith PetscErrorCode ierr; 46297f1f81fSBarry Smith PetscInt i,j,m = A->m,color; 46336db0b34SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,maxv = 0.0; 464b0a32e0cSBarry Smith PetscViewer viewer; 465f3ef73ceSBarry Smith PetscViewerFormat format; 466cddf8d76SBarry Smith 4673a40ed3dSBarry Smith PetscFunctionBegin; 468480ef9eaSBarry Smith ierr = 
PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 469b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 47019bcc07fSBarry Smith 471b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 472416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 4730513a670SBarry Smith 474fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 4750513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 476b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 477416022c9SBarry Smith for (i=0; i<m; i++) { 478cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 479bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 480bfeeae90SHong Zhang x_l = a->j[j] ; x_r = x_l + 1.0; 481aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 48236db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 483cddf8d76SBarry Smith #else 484cddf8d76SBarry Smith if (a->a[j] >= 0.) continue; 485cddf8d76SBarry Smith #endif 486b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 487cddf8d76SBarry Smith } 488cddf8d76SBarry Smith } 489b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 490cddf8d76SBarry Smith for (i=0; i<m; i++) { 491cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 492bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 493bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 494cddf8d76SBarry Smith if (a->a[j] != 0.) 
continue; 495b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 496cddf8d76SBarry Smith } 497cddf8d76SBarry Smith } 498b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 499cddf8d76SBarry Smith for (i=0; i<m; i++) { 500cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 501bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 502bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 503aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 50436db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 505cddf8d76SBarry Smith #else 506cddf8d76SBarry Smith if (a->a[j] <= 0.) continue; 507cddf8d76SBarry Smith #endif 508b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 509416022c9SBarry Smith } 510416022c9SBarry Smith } 5110513a670SBarry Smith } else { 5120513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 5130513a670SBarry Smith /* first determine max of all nonzero values */ 51497f1f81fSBarry Smith PetscInt nz = a->nz,count; 515b0a32e0cSBarry Smith PetscDraw popup; 51636db0b34SBarry Smith PetscReal scale; 5170513a670SBarry Smith 5180513a670SBarry Smith for (i=0; i<nz; i++) { 5190513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 5200513a670SBarry Smith } 521b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 522b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 523b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 5240513a670SBarry Smith count = 0; 5250513a670SBarry Smith for (i=0; i<m; i++) { 5260513a670SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 527bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 528bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 52997f1f81fSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (PetscInt)(scale*PetscAbsScalar(a->a[count])); 530b0a32e0cSBarry Smith ierr = 
PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 5310513a670SBarry Smith count++; 5320513a670SBarry Smith } 5330513a670SBarry Smith } 5340513a670SBarry Smith } 535480ef9eaSBarry Smith PetscFunctionReturn(0); 536480ef9eaSBarry Smith } 537cddf8d76SBarry Smith 5384a2ae208SSatish Balay #undef __FUNCT__ 5394a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw" 540dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 541480ef9eaSBarry Smith { 542dfbe8321SBarry Smith PetscErrorCode ierr; 543b0a32e0cSBarry Smith PetscDraw draw; 54436db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 545480ef9eaSBarry Smith PetscTruth isnull; 546480ef9eaSBarry Smith 547480ef9eaSBarry Smith PetscFunctionBegin; 548b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 549b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 550480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 551480ef9eaSBarry Smith 552480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 553273d9f13SBarry Smith xr = A->n; yr = A->m; h = yr/10.0; w = xr/10.0; 554480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 555b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 556b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 557480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 5583a40ed3dSBarry Smith PetscFunctionReturn(0); 559416022c9SBarry Smith } 560416022c9SBarry Smith 5614a2ae208SSatish Balay #undef __FUNCT__ 5624a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ" 563dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 564416022c9SBarry Smith { 565416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 566dfbe8321SBarry Smith PetscErrorCode ierr; 56732077d6dSBarry Smith PetscTruth 
issocket,iascii,isbinary,isdraw; 568416022c9SBarry Smith 5693a40ed3dSBarry Smith PetscFunctionBegin; 570b0a32e0cSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_SOCKET,&issocket);CHKERRQ(ierr); 57132077d6dSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&iascii);CHKERRQ(ierr); 572fb9695e5SSatish Balay ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_BINARY,&isbinary);CHKERRQ(ierr); 573fb9695e5SSatish Balay ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_DRAW,&isdraw);CHKERRQ(ierr); 574c45a1595SBarry Smith if (iascii) { 5753a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 576c45a1595SBarry Smith #if defined(PETSC_HAVE_SOCKET) 577c45a1595SBarry Smith } else if (issocket) { 578c45a1595SBarry Smith ierr = PetscViewerSocketPutSparse_Private(viewer,A->m,A->n,a->nz,a->a,a->i,a->j);CHKERRQ(ierr); 579c45a1595SBarry Smith #endif 5800f5bd95cSBarry Smith } else if (isbinary) { 5813a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 5820f5bd95cSBarry Smith } else if (isdraw) { 5833a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 5845cd90555SBarry Smith } else { 585958c9bccSBarry Smith SETERRQ1(PETSC_ERR_SUP,"Viewer type %s not supported by SeqAIJ matrices",((PetscObject)viewer)->type_name); 58617ab2063SBarry Smith } 5874846f1f5SKris Buschelman ierr = MatView_Inode(A,viewer);CHKERRQ(ierr); 5883a40ed3dSBarry Smith PetscFunctionReturn(0); 58917ab2063SBarry Smith } 59019bcc07fSBarry Smith 5914a2ae208SSatish Balay #undef __FUNCT__ 5924a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyEnd_SeqAIJ" 593dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 59417ab2063SBarry Smith { 595416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 5966849ba73SBarry Smith PetscErrorCode ierr; 59797f1f81fSBarry Smith PetscInt fshift = 0,i,j,*ai = a->i,*aj = a->j,*imax = a->imax; 59897f1f81fSBarry Smith PetscInt m = 
A->m,*ip,N,*ailen = a->ilen,rmax = 0; 59987828ca2SBarry Smith PetscScalar *aa = a->a,*ap; 6003447b6efSHong Zhang PetscReal ratio=0.6; 60117ab2063SBarry Smith 6023a40ed3dSBarry Smith PetscFunctionBegin; 6033a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 60417ab2063SBarry Smith 60543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 60617ab2063SBarry Smith for (i=1; i<m; i++) { 607416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 60817ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 60994a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 61017ab2063SBarry Smith if (fshift) { 611bfeeae90SHong Zhang ip = aj + ai[i] ; 612bfeeae90SHong Zhang ap = aa + ai[i] ; 61317ab2063SBarry Smith N = ailen[i]; 61417ab2063SBarry Smith for (j=0; j<N; j++) { 61517ab2063SBarry Smith ip[j-fshift] = ip[j]; 61617ab2063SBarry Smith ap[j-fshift] = ap[j]; 61717ab2063SBarry Smith } 61817ab2063SBarry Smith } 61917ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 62017ab2063SBarry Smith } 62117ab2063SBarry Smith if (m) { 62217ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 62317ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 62417ab2063SBarry Smith } 62517ab2063SBarry Smith /* reset ilen and imax for each row */ 62617ab2063SBarry Smith for (i=0; i<m; i++) { 62717ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 62817ab2063SBarry Smith } 629bfeeae90SHong Zhang a->nz = ai[m]; 63017ab2063SBarry Smith 63117ab2063SBarry Smith /* diagonals may have moved, so kill the diagonal pointers */ 632416022c9SBarry Smith if (fshift && a->diag) { 633606d414cSSatish Balay ierr = PetscFree(a->diag);CHKERRQ(ierr); 63452e6d16bSBarry Smith ierr = PetscLogObjectMemory(A,-(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 635416022c9SBarry Smith a->diag = 0; 63617ab2063SBarry Smith } 63763ba0a88SBarry Smith ierr = PetscLogInfo((A,"MatAssemblyEnd_SeqAIJ:Matrix size: %D X %D; storage space: %D unneeded,%D 
used\n",m,A->n,fshift,a->nz));CHKERRQ(ierr); 63863ba0a88SBarry Smith ierr = PetscLogInfo((A,"MatAssemblyEnd_SeqAIJ:Number of mallocs during MatSetValues() is %D\n",a->reallocs));CHKERRQ(ierr); 63963ba0a88SBarry Smith ierr = PetscLogInfo((A,"MatAssemblyEnd_SeqAIJ:Maximum nonzeros in any row is %D\n",rmax));CHKERRQ(ierr); 640dd5f02e7SSatish Balay a->reallocs = 0; 6414e220ebcSLois Curfman McInnes A->info.nz_unneeded = (double)fshift; 64236db0b34SBarry Smith a->rmax = rmax; 6434e220ebcSLois Curfman McInnes 644cb5d8e9eSHong Zhang /* check for zero rows. If found a large number of zero rows, use CompressedRow functions */ 645317fbc4cSHong Zhang ierr = Mat_CheckCompressedRow(A,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 64688e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 64771c2f376SKris Buschelman 6484846f1f5SKris Buschelman ierr = MatAssemblyEnd_Inode(A,mode);CHKERRQ(ierr); 6493a40ed3dSBarry Smith PetscFunctionReturn(0); 65017ab2063SBarry Smith } 65117ab2063SBarry Smith 6524a2ae208SSatish Balay #undef __FUNCT__ 6534a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqAIJ" 654dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 65517ab2063SBarry Smith { 656416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 657dfbe8321SBarry Smith PetscErrorCode ierr; 6583a40ed3dSBarry Smith 6593a40ed3dSBarry Smith PetscFunctionBegin; 660bfeeae90SHong Zhang ierr = PetscMemzero(a->a,(a->i[A->m])*sizeof(PetscScalar));CHKERRQ(ierr); 6613a40ed3dSBarry Smith PetscFunctionReturn(0); 66217ab2063SBarry Smith } 663416022c9SBarry Smith 6644a2ae208SSatish Balay #undef __FUNCT__ 6654a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_SeqAIJ" 666dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 66717ab2063SBarry Smith { 668416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 669dfbe8321SBarry Smith PetscErrorCode ierr; 670d5d45c9bSBarry Smith 6713a40ed3dSBarry Smith PetscFunctionBegin; 672aa482453SBarry Smith #if defined(PETSC_USE_LOG) 67377431f27SBarry 
Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->m,A->n,a->nz); 67417ab2063SBarry Smith #endif 67536db0b34SBarry Smith if (a->freedata) { 676606d414cSSatish Balay if (!a->singlemalloc) { 677*ab93d7beSBarry Smith if (a->a) {ierr = PetscFree(a->a);CHKERRQ(ierr);} 678*ab93d7beSBarry Smith if (a->i) {ierr = PetscFree(a->i);CHKERRQ(ierr);} 679*ab93d7beSBarry Smith if (a->j) {ierr = PetscFree(a->j);CHKERRQ(ierr);} 680a96a251dSBarry Smith } else { 681a96a251dSBarry Smith ierr = PetscFree3(a->a,a->j,a->i);CHKERRQ(ierr); 682606d414cSSatish Balay } 68336db0b34SBarry Smith } 684c38d4ed2SBarry Smith if (a->row) { 685c38d4ed2SBarry Smith ierr = ISDestroy(a->row);CHKERRQ(ierr); 686c38d4ed2SBarry Smith } 687c38d4ed2SBarry Smith if (a->col) { 688c38d4ed2SBarry Smith ierr = ISDestroy(a->col);CHKERRQ(ierr); 689c38d4ed2SBarry Smith } 690606d414cSSatish Balay if (a->diag) {ierr = PetscFree(a->diag);CHKERRQ(ierr);} 691*ab93d7beSBarry Smith if (a->ilen) {ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr);} 692273d9f13SBarry Smith if (a->idiag) {ierr = PetscFree(a->idiag);CHKERRQ(ierr);} 693606d414cSSatish Balay if (a->solve_work) {ierr = PetscFree(a->solve_work);CHKERRQ(ierr);} 69482bf6240SBarry Smith if (a->icol) {ierr = ISDestroy(a->icol);CHKERRQ(ierr);} 695606d414cSSatish Balay if (a->saved_values) {ierr = PetscFree(a->saved_values);CHKERRQ(ierr);} 696cc8ba8e1SBarry Smith if (a->coloring) {ierr = ISColoringDestroy(a->coloring);CHKERRQ(ierr);} 697a30b2313SHong Zhang if (a->xtoy) {ierr = PetscFree(a->xtoy);CHKERRQ(ierr);} 698d487561eSHong Zhang if (a->compressedrow.use){ierr = PetscFree(a->compressedrow.i);} 699a30b2313SHong Zhang 7004846f1f5SKris Buschelman ierr = MatDestroy_Inode(A);CHKERRQ(ierr); 7014846f1f5SKris Buschelman 702606d414cSSatish Balay ierr = PetscFree(a);CHKERRQ(ierr); 703901853e0SKris Buschelman 704901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetColumnIndices_C","",PETSC_NULL);CHKERRQ(ierr); 
705901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatStoreValues_C","",PETSC_NULL);CHKERRQ(ierr); 706901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatRetrieveValues_C","",PETSC_NULL);CHKERRQ(ierr); 707901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqsbaij_C","",PETSC_NULL);CHKERRQ(ierr); 708901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqbaij_C","",PETSC_NULL);CHKERRQ(ierr); 709901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatIsTranspose_C","",PETSC_NULL);CHKERRQ(ierr); 710901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 711901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatReorderForNonzeroDiagonal_C","",PETSC_NULL);CHKERRQ(ierr); 7123a40ed3dSBarry Smith PetscFunctionReturn(0); 71317ab2063SBarry Smith } 71417ab2063SBarry Smith 7154a2ae208SSatish Balay #undef __FUNCT__ 7164a2ae208SSatish Balay #define __FUNCT__ "MatCompress_SeqAIJ" 717dfbe8321SBarry Smith PetscErrorCode MatCompress_SeqAIJ(Mat A) 71817ab2063SBarry Smith { 7193a40ed3dSBarry Smith PetscFunctionBegin; 7203a40ed3dSBarry Smith PetscFunctionReturn(0); 72117ab2063SBarry Smith } 72217ab2063SBarry Smith 7234a2ae208SSatish Balay #undef __FUNCT__ 7244a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqAIJ" 725dfbe8321SBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op) 72617ab2063SBarry Smith { 727416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7284846f1f5SKris Buschelman PetscErrorCode ierr; 7293a40ed3dSBarry Smith 7303a40ed3dSBarry Smith PetscFunctionBegin; 731a65d3064SKris Buschelman switch (op) { 732a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 733a65d3064SKris Buschelman a->roworiented = PETSC_TRUE; 734a65d3064SKris Buschelman break; 
735a65d3064SKris Buschelman case MAT_KEEP_ZEROED_ROWS: 736a65d3064SKris Buschelman a->keepzeroedrows = PETSC_TRUE; 737a65d3064SKris Buschelman break; 738a65d3064SKris Buschelman case MAT_COLUMN_ORIENTED: 739a65d3064SKris Buschelman a->roworiented = PETSC_FALSE; 740a65d3064SKris Buschelman break; 741a65d3064SKris Buschelman case MAT_COLUMNS_SORTED: 742a65d3064SKris Buschelman a->sorted = PETSC_TRUE; 743a65d3064SKris Buschelman break; 744a65d3064SKris Buschelman case MAT_COLUMNS_UNSORTED: 745a65d3064SKris Buschelman a->sorted = PETSC_FALSE; 746a65d3064SKris Buschelman break; 747a65d3064SKris Buschelman case MAT_NO_NEW_NONZERO_LOCATIONS: 748a65d3064SKris Buschelman a->nonew = 1; 749a65d3064SKris Buschelman break; 750a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 751a65d3064SKris Buschelman a->nonew = -1; 752a65d3064SKris Buschelman break; 753a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 754a65d3064SKris Buschelman a->nonew = -2; 755a65d3064SKris Buschelman break; 756a65d3064SKris Buschelman case MAT_YES_NEW_NONZERO_LOCATIONS: 757a65d3064SKris Buschelman a->nonew = 0; 758a65d3064SKris Buschelman break; 759a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 760a65d3064SKris Buschelman a->ignorezeroentries = PETSC_TRUE; 761a65d3064SKris Buschelman break; 762d487561eSHong Zhang case MAT_USE_COMPRESSEDROW: 763d487561eSHong Zhang a->compressedrow.use = PETSC_TRUE; 764d487561eSHong Zhang break; 765d487561eSHong Zhang case MAT_DO_NOT_USE_COMPRESSEDROW: 766d487561eSHong Zhang a->compressedrow.use = PETSC_FALSE; 767d487561eSHong Zhang break; 768a65d3064SKris Buschelman case MAT_ROWS_SORTED: 769a65d3064SKris Buschelman case MAT_ROWS_UNSORTED: 770a65d3064SKris Buschelman case MAT_YES_NEW_DIAGONALS: 771a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 772a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 77363ba0a88SBarry Smith ierr = PetscLogInfo((A,"MatSetOption_SeqAIJ:Option ignored\n"));CHKERRQ(ierr); 774a65d3064SKris Buschelman break; 
775a65d3064SKris Buschelman case MAT_NO_NEW_DIAGONALS: 77629bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"MAT_NO_NEW_DIAGONALS"); 777a65d3064SKris Buschelman default: 77871c2f376SKris Buschelman break; 779a65d3064SKris Buschelman } 7804846f1f5SKris Buschelman ierr = MatSetOption_Inode(A,op);CHKERRQ(ierr); 7813a40ed3dSBarry Smith PetscFunctionReturn(0); 78217ab2063SBarry Smith } 78317ab2063SBarry Smith 7844a2ae208SSatish Balay #undef __FUNCT__ 7854a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqAIJ" 786dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 78717ab2063SBarry Smith { 788416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7896849ba73SBarry Smith PetscErrorCode ierr; 79097f1f81fSBarry Smith PetscInt i,j,n; 79187828ca2SBarry Smith PetscScalar *x,zero = 0.0; 79217ab2063SBarry Smith 7933a40ed3dSBarry Smith PetscFunctionBegin; 7943a40ed3dSBarry Smith ierr = VecSet(&zero,v);CHKERRQ(ierr); 7951ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 79636db0b34SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 797273d9f13SBarry Smith if (n != A->m) SETERRQ(PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 798273d9f13SBarry Smith for (i=0; i<A->m; i++) { 799bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 800bfeeae90SHong Zhang if (a->j[j] == i) { 801416022c9SBarry Smith x[i] = a->a[j]; 80217ab2063SBarry Smith break; 80317ab2063SBarry Smith } 80417ab2063SBarry Smith } 80517ab2063SBarry Smith } 8061ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 8073a40ed3dSBarry Smith PetscFunctionReturn(0); 80817ab2063SBarry Smith } 80917ab2063SBarry Smith 8104a2ae208SSatish Balay #undef __FUNCT__ 8114a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqAIJ" 812dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 81317ab2063SBarry Smith { 814416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 8155c897100SBarry Smith PetscScalar *x,*y; 816dfbe8321SBarry Smith 
PetscErrorCode ierr; 81797f1f81fSBarry Smith PetscInt m = A->m; 8185c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 8195c897100SBarry Smith PetscScalar *v,alpha; 8207b2bb3b9SHong Zhang PetscInt n,i,*idx,*ii,*ridx=PETSC_NULL; 8213447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 8224eb6d288SHong Zhang PetscTruth usecprow = cprow.use; 8235c897100SBarry Smith #endif 82417ab2063SBarry Smith 8253a40ed3dSBarry Smith PetscFunctionBegin; 8262e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 8271ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 8281ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8295c897100SBarry Smith 8305c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 831bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 8325c897100SBarry Smith #else 8333447b6efSHong Zhang if (usecprow){ 8343447b6efSHong Zhang m = cprow.nrows; 8353447b6efSHong Zhang ii = cprow.i; 8367b2bb3b9SHong Zhang ridx = cprow.rindex; 8373447b6efSHong Zhang } else { 8383447b6efSHong Zhang ii = a->i; 8393447b6efSHong Zhang } 84017ab2063SBarry Smith for (i=0; i<m; i++) { 8413447b6efSHong Zhang idx = a->j + ii[i] ; 8423447b6efSHong Zhang v = a->a + ii[i] ; 8433447b6efSHong Zhang n = ii[i+1] - ii[i]; 8443447b6efSHong Zhang if (usecprow){ 8457b2bb3b9SHong Zhang alpha = x[ridx[i]]; 8463447b6efSHong Zhang } else { 84717ab2063SBarry Smith alpha = x[i]; 8483447b6efSHong Zhang } 84917ab2063SBarry Smith while (n-->0) {y[*idx++] += alpha * *v++;} 85017ab2063SBarry Smith } 8515c897100SBarry Smith #endif 852efee365bSSatish Balay ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 8531ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 8541ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 8553a40ed3dSBarry Smith PetscFunctionReturn(0); 85617ab2063SBarry Smith } 85717ab2063SBarry Smith 8584a2ae208SSatish Balay #undef __FUNCT__ 8595c897100SBarry Smith #define 
__FUNCT__ "MatMultTranspose_SeqAIJ" 860dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 8615c897100SBarry Smith { 8628d5b0100SBarry Smith PetscScalar zero = 0.0; 863dfbe8321SBarry Smith PetscErrorCode ierr; 8645c897100SBarry Smith 8655c897100SBarry Smith PetscFunctionBegin; 8665c897100SBarry Smith ierr = VecSet(&zero,yy);CHKERRQ(ierr); 8675c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 8685c897100SBarry Smith PetscFunctionReturn(0); 8695c897100SBarry Smith } 8705c897100SBarry Smith 8715c897100SBarry Smith 8725c897100SBarry Smith #undef __FUNCT__ 8734a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqAIJ" 874dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 87517ab2063SBarry Smith { 876416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 87797952fefSHong Zhang PetscScalar *x,*y,*aa; 878dfbe8321SBarry Smith PetscErrorCode ierr; 87997952fefSHong Zhang PetscInt m=A->m,*aj,*ii; 880aa482453SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 88197952fefSHong Zhang PetscInt n,i,jrow,j,*ridx=PETSC_NULL; 882362ced78SSatish Balay PetscScalar sum; 88397952fefSHong Zhang PetscTruth usecprow=a->compressedrow.use; 884e36a17ebSSatish Balay #endif 88517ab2063SBarry Smith 886b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 88797952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 888fee21e36SBarry Smith #endif 889fee21e36SBarry Smith 8903a40ed3dSBarry Smith PetscFunctionBegin; 8911ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 8921ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 89397952fefSHong Zhang aj = a->j; 89497952fefSHong Zhang aa = a->a; 895416022c9SBarry Smith ii = a->i; 896aa482453SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 89797952fefSHong Zhang fortranmultaij_(&m,x,ii,aj,aa,y); 8988d195f9aSBarry Smith #else 8994eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 90097952fefSHong Zhang m = a->compressedrow.nrows; 
90197952fefSHong Zhang ii = a->compressedrow.i; 90297952fefSHong Zhang ridx = a->compressedrow.rindex; 90397952fefSHong Zhang for (i=0; i<m; i++){ 90497952fefSHong Zhang n = ii[i+1] - ii[i]; 90597952fefSHong Zhang aj = a->j + ii[i]; 90697952fefSHong Zhang aa = a->a + ii[i]; 90797952fefSHong Zhang sum = 0.0; 90897952fefSHong Zhang for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; 90997952fefSHong Zhang y[*ridx++] = sum; 91097952fefSHong Zhang } 91197952fefSHong Zhang } else { /* do not use compressed row format */ 91217ab2063SBarry Smith for (i=0; i<m; i++) { 9139ea0dfa2SSatish Balay jrow = ii[i]; 9149ea0dfa2SSatish Balay n = ii[i+1] - jrow; 91517ab2063SBarry Smith sum = 0.0; 9169ea0dfa2SSatish Balay for (j=0; j<n; j++) { 91797952fefSHong Zhang sum += aa[jrow]*x[aj[jrow]]; jrow++; 9189ea0dfa2SSatish Balay } 91917ab2063SBarry Smith y[i] = sum; 92017ab2063SBarry Smith } 92197952fefSHong Zhang } 9228d195f9aSBarry Smith #endif 923efee365bSSatish Balay ierr = PetscLogFlops(2*a->nz - m);CHKERRQ(ierr); 9241ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 9251ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 9263a40ed3dSBarry Smith PetscFunctionReturn(0); 92717ab2063SBarry Smith } 92817ab2063SBarry Smith 9294a2ae208SSatish Balay #undef __FUNCT__ 9304a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqAIJ" 931dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 93217ab2063SBarry Smith { 933416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 93497952fefSHong Zhang PetscScalar *x,*y,*z,*aa; 935dfbe8321SBarry Smith PetscErrorCode ierr; 93697952fefSHong Zhang PetscInt m = A->m,*aj,*ii; 937aa482453SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 93897952fefSHong Zhang PetscInt n,i,jrow,j,*ridx=PETSC_NULL; 939362ced78SSatish Balay PetscScalar sum; 94097952fefSHong Zhang PetscTruth usecprow=a->compressedrow.use; 941e36a17ebSSatish Balay #endif 9429ea0dfa2SSatish Balay 9433a40ed3dSBarry Smith 
PetscFunctionBegin; 9441ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 9451ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 9462e8a6d31SBarry Smith if (zz != yy) { 9471ebc52fbSHong Zhang ierr = VecGetArray(zz,&z);CHKERRQ(ierr); 9482e8a6d31SBarry Smith } else { 9492e8a6d31SBarry Smith z = y; 9502e8a6d31SBarry Smith } 951bfeeae90SHong Zhang 95297952fefSHong Zhang aj = a->j; 95397952fefSHong Zhang aa = a->a; 954cddf8d76SBarry Smith ii = a->i; 955aa482453SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 95697952fefSHong Zhang fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 95702ab625aSSatish Balay #else 9584eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 9594eb6d288SHong Zhang if (zz != yy){ 9604eb6d288SHong Zhang ierr = PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 9614eb6d288SHong Zhang } 96297952fefSHong Zhang m = a->compressedrow.nrows; 96397952fefSHong Zhang ii = a->compressedrow.i; 96497952fefSHong Zhang ridx = a->compressedrow.rindex; 96597952fefSHong Zhang for (i=0; i<m; i++){ 96697952fefSHong Zhang n = ii[i+1] - ii[i]; 96797952fefSHong Zhang aj = a->j + ii[i]; 96897952fefSHong Zhang aa = a->a + ii[i]; 96997952fefSHong Zhang sum = y[*ridx]; 97097952fefSHong Zhang for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; 97197952fefSHong Zhang z[*ridx++] = sum; 97297952fefSHong Zhang } 97397952fefSHong Zhang } else { /* do not use compressed row format */ 97417ab2063SBarry Smith for (i=0; i<m; i++) { 9759ea0dfa2SSatish Balay jrow = ii[i]; 9769ea0dfa2SSatish Balay n = ii[i+1] - jrow; 97717ab2063SBarry Smith sum = y[i]; 9789ea0dfa2SSatish Balay for (j=0; j<n; j++) { 97997952fefSHong Zhang sum += aa[jrow]*x[aj[jrow]]; jrow++; 9809ea0dfa2SSatish Balay } 98117ab2063SBarry Smith z[i] = sum; 98217ab2063SBarry Smith } 98397952fefSHong Zhang } 98402ab625aSSatish Balay #endif 985efee365bSSatish Balay ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 9861ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 9871ebc52fbSHong 
Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 9882e8a6d31SBarry Smith if (zz != yy) { 9891ebc52fbSHong Zhang ierr = VecRestoreArray(zz,&z);CHKERRQ(ierr); 9902e8a6d31SBarry Smith } 9913a40ed3dSBarry Smith PetscFunctionReturn(0); 99217ab2063SBarry Smith } 99317ab2063SBarry Smith 99417ab2063SBarry Smith /* 99517ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 99617ab2063SBarry Smith */ 9974a2ae208SSatish Balay #undef __FUNCT__ 9984a2ae208SSatish Balay #define __FUNCT__ "MatMarkDiagonal_SeqAIJ" 999dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 100017ab2063SBarry Smith { 1001416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10026849ba73SBarry Smith PetscErrorCode ierr; 100397f1f81fSBarry Smith PetscInt i,j,*diag,m = A->m; 100417ab2063SBarry Smith 10053a40ed3dSBarry Smith PetscFunctionBegin; 1006f1e2ffcdSBarry Smith if (a->diag) PetscFunctionReturn(0); 1007f1e2ffcdSBarry Smith 100897f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&diag);CHKERRQ(ierr); 100952e6d16bSBarry Smith ierr = PetscLogObjectMemory(A,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 1010273d9f13SBarry Smith for (i=0; i<A->m; i++) { 101135b0346bSBarry Smith diag[i] = a->i[i+1]; 1012bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1013bfeeae90SHong Zhang if (a->j[j] == i) { 1014bfeeae90SHong Zhang diag[i] = j; 101517ab2063SBarry Smith break; 101617ab2063SBarry Smith } 101717ab2063SBarry Smith } 101817ab2063SBarry Smith } 1019416022c9SBarry Smith a->diag = diag; 10203a40ed3dSBarry Smith PetscFunctionReturn(0); 102117ab2063SBarry Smith } 102217ab2063SBarry Smith 1023be5855fcSBarry Smith /* 1024be5855fcSBarry Smith Checks for missing diagonals 1025be5855fcSBarry Smith */ 10264a2ae208SSatish Balay #undef __FUNCT__ 10274a2ae208SSatish Balay #define __FUNCT__ "MatMissingDiagonal_SeqAIJ" 1028dfbe8321SBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A) 1029be5855fcSBarry Smith { 1030be5855fcSBarry Smith Mat_SeqAIJ *a = 
(Mat_SeqAIJ*)A->data; 10316849ba73SBarry Smith PetscErrorCode ierr; 103297f1f81fSBarry Smith PetscInt *diag,*jj = a->j,i; 1033be5855fcSBarry Smith 1034be5855fcSBarry Smith PetscFunctionBegin; 1035f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1036f1e2ffcdSBarry Smith diag = a->diag; 1037273d9f13SBarry Smith for (i=0; i<A->m; i++) { 1038bfeeae90SHong Zhang if (jj[diag[i]] != i) { 103977431f27SBarry Smith SETERRQ1(PETSC_ERR_PLIB,"Matrix is missing diagonal number %D",i); 1040be5855fcSBarry Smith } 1041be5855fcSBarry Smith } 1042be5855fcSBarry Smith PetscFunctionReturn(0); 1043be5855fcSBarry Smith } 1044be5855fcSBarry Smith 10454a2ae208SSatish Balay #undef __FUNCT__ 10464a2ae208SSatish Balay #define __FUNCT__ "MatRelax_SeqAIJ" 104797f1f81fSBarry Smith PetscErrorCode MatRelax_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 104817ab2063SBarry Smith { 1049416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1050beeb8507SBarry Smith PetscScalar *x,d,*xs,sum,*t,scale,*idiag=0,*mdiag; 1051beeb8507SBarry Smith const PetscScalar *v = a->a, *b, *bs,*xb, *ts; 1052dfbe8321SBarry Smith PetscErrorCode ierr; 105397f1f81fSBarry Smith PetscInt n = A->n,m = A->m,i; 105497f1f81fSBarry Smith const PetscInt *idx,*diag; 105517ab2063SBarry Smith 10563a40ed3dSBarry Smith PetscFunctionBegin; 1057b965ef7fSBarry Smith its = its*lits; 105877431f27SBarry Smith if (its <= 0) SETERRQ2(PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 105991723122SBarry Smith 1060ed480e8bSBarry Smith if (!a->diag) {ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);} 1061ed480e8bSBarry Smith diag = a->diag; 1062ed480e8bSBarry Smith if (!a->idiag) { 1063ed480e8bSBarry Smith ierr = PetscMalloc(3*m*sizeof(PetscScalar),&a->idiag);CHKERRQ(ierr); 1064ed480e8bSBarry Smith a->ssor = a->idiag + m; 1065ed480e8bSBarry Smith mdiag = a->ssor + m; 1066ed480e8bSBarry Smith 1067ed480e8bSBarry Smith v = 
a->a; 1068ed480e8bSBarry Smith 1069ed480e8bSBarry Smith /* this is wrong when fshift omega changes each iteration */ 1070958c9bccSBarry Smith if (omega == 1.0 && !fshift) { 1071ed480e8bSBarry Smith for (i=0; i<m; i++) { 1072ed480e8bSBarry Smith mdiag[i] = v[diag[i]]; 1073ed480e8bSBarry Smith a->idiag[i] = 1.0/v[diag[i]]; 1074ed480e8bSBarry Smith } 1075efee365bSSatish Balay ierr = PetscLogFlops(m);CHKERRQ(ierr); 1076ed480e8bSBarry Smith } else { 1077ed480e8bSBarry Smith for (i=0; i<m; i++) { 1078ed480e8bSBarry Smith mdiag[i] = v[diag[i]]; 1079beeb8507SBarry Smith a->idiag[i] = omega/(fshift + v[diag[i]]); 1080ed480e8bSBarry Smith } 1081efee365bSSatish Balay ierr = PetscLogFlops(2*m);CHKERRQ(ierr); 1082beeb8507SBarry Smith } 1083ed480e8bSBarry Smith } 1084ed480e8bSBarry Smith t = a->ssor; 1085ed480e8bSBarry Smith idiag = a->idiag; 1086ed480e8bSBarry Smith mdiag = a->idiag + 2*m; 1087ed480e8bSBarry Smith 10881ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 1089fb2e594dSBarry Smith if (xx != bb) { 10901ebc52fbSHong Zhang ierr = VecGetArray(bb,(PetscScalar**)&b);CHKERRQ(ierr); 1091fb2e594dSBarry Smith } else { 1092fb2e594dSBarry Smith b = x; 1093fb2e594dSBarry Smith } 1094fb2e594dSBarry Smith 1095ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 1096ed480e8bSBarry Smith xs = x; 109717ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 109817ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1099ed480e8bSBarry Smith bs = b; 110017ab2063SBarry Smith for (i=0; i<m; i++) { 1101ed480e8bSBarry Smith d = fshift + a->a[diag[i]]; 1102416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1103ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1104ed480e8bSBarry Smith v = a->a + diag[i] + 1; 110517ab2063SBarry Smith sum = b[i]*d/omega; 110617ab2063SBarry Smith SPARSEDENSEDOT(sum,bs,v,idx,n); 110717ab2063SBarry Smith x[i] = sum; 110817ab2063SBarry Smith } 11091ebc52fbSHong Zhang ierr = 
VecRestoreArray(xx,&x);CHKERRQ(ierr); 11101ebc52fbSHong Zhang if (bb != xx) {ierr = VecRestoreArray(bb,(PetscScalar**)&b);CHKERRQ(ierr);} 1111efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 11123a40ed3dSBarry Smith PetscFunctionReturn(0); 111317ab2063SBarry Smith } 1114c783ea89SBarry Smith 1115ed480e8bSBarry Smith 1116fc3d8934SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 1117fc3d8934SBarry Smith U is upper triangular, E is diagonal; This routine applies 1118fc3d8934SBarry Smith 1119fc3d8934SBarry Smith (L + E)^{-1} A (U + E)^{-1} 1120fc3d8934SBarry Smith 1121fc3d8934SBarry Smith to a vector efficiently using Eisenstat's trick. This is for 1122fc3d8934SBarry Smith the case of SSOR preconditioner, so E is D/omega where omega 112348af12d7SBarry Smith is the relaxation factor. 1124fc3d8934SBarry Smith */ 1125fc3d8934SBarry Smith 112648af12d7SBarry Smith if (flag == SOR_APPLY_LOWER) { 112729bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 11283a40ed3dSBarry Smith } else if (flag & SOR_EISENSTAT) { 112917ab2063SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 113017ab2063SBarry Smith U is upper triangular, E is diagonal; This routine applies 113117ab2063SBarry Smith 113217ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 113317ab2063SBarry Smith 113417ab2063SBarry Smith to a vector efficiently using Eisenstat's trick. This is for 113517ab2063SBarry Smith the case of SSOR preconditioner, so E is D/omega where omega 113617ab2063SBarry Smith is the relaxation factor. 
113717ab2063SBarry Smith */ 113817ab2063SBarry Smith scale = (2.0/omega) - 1.0; 113917ab2063SBarry Smith 114017ab2063SBarry Smith /* x = (E + U)^{-1} b */ 114117ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1142416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1143ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1144ed480e8bSBarry Smith v = a->a + diag[i] + 1; 114517ab2063SBarry Smith sum = b[i]; 114617ab2063SBarry Smith SPARSEDENSEMDOT(sum,xs,v,idx,n); 1147ed480e8bSBarry Smith x[i] = sum*idiag[i]; 114817ab2063SBarry Smith } 114917ab2063SBarry Smith 115017ab2063SBarry Smith /* t = b - (2*E - D)x */ 1151416022c9SBarry Smith v = a->a; 1152ed480e8bSBarry Smith for (i=0; i<m; i++) { t[i] = b[i] - scale*(v[*diag++])*x[i]; } 115317ab2063SBarry Smith 115417ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1155ed480e8bSBarry Smith ts = t; 1156416022c9SBarry Smith diag = a->diag; 115717ab2063SBarry Smith for (i=0; i<m; i++) { 1158416022c9SBarry Smith n = diag[i] - a->i[i]; 1159ed480e8bSBarry Smith idx = a->j + a->i[i]; 1160ed480e8bSBarry Smith v = a->a + a->i[i]; 116117ab2063SBarry Smith sum = t[i]; 116217ab2063SBarry Smith SPARSEDENSEMDOT(sum,ts,v,idx,n); 1163ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1164733d66baSBarry Smith /* x = x + t */ 1165733d66baSBarry Smith x[i] += t[i]; 116617ab2063SBarry Smith } 116717ab2063SBarry Smith 1168efee365bSSatish Balay ierr = PetscLogFlops(6*m-1 + 2*a->nz);CHKERRQ(ierr); 11691ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 11701ebc52fbSHong Zhang if (bb != xx) {ierr = VecRestoreArray(bb,(PetscScalar**)&b);CHKERRQ(ierr);} 11713a40ed3dSBarry Smith PetscFunctionReturn(0); 117217ab2063SBarry Smith } 117317ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 117417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 117577d8c4bbSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_RELAXAIJ) 117697f1f81fSBarry Smith fortranrelaxaijforwardzero_(&m,&omega,x,a->i,a->j,(PetscInt*)diag,idiag,a->a,(void*)b); 
117777d8c4bbSBarry Smith #else 117817ab2063SBarry Smith for (i=0; i<m; i++) { 1179416022c9SBarry Smith n = diag[i] - a->i[i]; 1180ed480e8bSBarry Smith idx = a->j + a->i[i]; 1181ed480e8bSBarry Smith v = a->a + a->i[i]; 118217ab2063SBarry Smith sum = b[i]; 118317ab2063SBarry Smith SPARSEDENSEMDOT(sum,xs,v,idx,n); 1184ed480e8bSBarry Smith x[i] = sum*idiag[i]; 118517ab2063SBarry Smith } 118677d8c4bbSBarry Smith #endif 118717ab2063SBarry Smith xb = x; 1188efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 11893a40ed3dSBarry Smith } else xb = b; 119017ab2063SBarry Smith if ((flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) && 119117ab2063SBarry Smith (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP)) { 119217ab2063SBarry Smith for (i=0; i<m; i++) { 1193ed480e8bSBarry Smith x[i] *= mdiag[i]; 119417ab2063SBarry Smith } 1195efee365bSSatish Balay ierr = PetscLogFlops(m);CHKERRQ(ierr); 119617ab2063SBarry Smith } 119717ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 119877d8c4bbSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_RELAXAIJ) 119997f1f81fSBarry Smith fortranrelaxaijbackwardzero_(&m,&omega,x,a->i,a->j,(PetscInt*)diag,idiag,a->a,(void*)xb); 120077d8c4bbSBarry Smith #else 120117ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1202416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1203ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1204ed480e8bSBarry Smith v = a->a + diag[i] + 1; 120517ab2063SBarry Smith sum = xb[i]; 120617ab2063SBarry Smith SPARSEDENSEMDOT(sum,xs,v,idx,n); 1207ed480e8bSBarry Smith x[i] = sum*idiag[i]; 120817ab2063SBarry Smith } 120977d8c4bbSBarry Smith #endif 1210efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 121117ab2063SBarry Smith } 121217ab2063SBarry Smith its--; 121317ab2063SBarry Smith } 121417ab2063SBarry Smith while (its--) { 121517ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 121677d8c4bbSBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_RELAXAIJ) 121797f1f81fSBarry Smith fortranrelaxaijforward_(&m,&omega,x,a->i,a->j,(PetscInt*)diag,a->a,(void*)b); 121877d8c4bbSBarry Smith #else 121917ab2063SBarry Smith for (i=0; i<m; i++) { 1220ed480e8bSBarry Smith d = fshift + a->a[diag[i]]; 1221416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1222ed480e8bSBarry Smith idx = a->j + a->i[i]; 1223ed480e8bSBarry Smith v = a->a + a->i[i]; 122417ab2063SBarry Smith sum = b[i]; 122517ab2063SBarry Smith SPARSEDENSEMDOT(sum,xs,v,idx,n); 1226ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 122717ab2063SBarry Smith } 122877d8c4bbSBarry Smith #endif 1229efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 123017ab2063SBarry Smith } 123117ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 123277d8c4bbSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_RELAXAIJ) 123397f1f81fSBarry Smith fortranrelaxaijbackward_(&m,&omega,x,a->i,a->j,(PetscInt*)diag,a->a,(void*)b); 123477d8c4bbSBarry Smith #else 123517ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1236ed480e8bSBarry Smith d = fshift + a->a[diag[i]]; 1237416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1238ed480e8bSBarry Smith idx = a->j + a->i[i]; 1239ed480e8bSBarry Smith v = a->a + a->i[i]; 124017ab2063SBarry Smith sum = b[i]; 124117ab2063SBarry Smith SPARSEDENSEMDOT(sum,xs,v,idx,n); 1242ed480e8bSBarry Smith x[i] = (1. 
- omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 124317ab2063SBarry Smith } 124477d8c4bbSBarry Smith #endif 1245efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 124617ab2063SBarry Smith } 124717ab2063SBarry Smith } 12481ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 12491ebc52fbSHong Zhang if (bb != xx) {ierr = VecRestoreArray(bb,(PetscScalar**)&b);CHKERRQ(ierr);} 12503a40ed3dSBarry Smith PetscFunctionReturn(0); 125117ab2063SBarry Smith } 125217ab2063SBarry Smith 12534a2ae208SSatish Balay #undef __FUNCT__ 12544a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqAIJ" 1255dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 125617ab2063SBarry Smith { 1257416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12584e220ebcSLois Curfman McInnes 12593a40ed3dSBarry Smith PetscFunctionBegin; 1260273d9f13SBarry Smith info->rows_global = (double)A->m; 1261273d9f13SBarry Smith info->columns_global = (double)A->n; 1262273d9f13SBarry Smith info->rows_local = (double)A->m; 1263273d9f13SBarry Smith info->columns_local = (double)A->n; 12644e220ebcSLois Curfman McInnes info->block_size = 1.0; 12654e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 12664e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 12674e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 12684e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 12694e220ebcSLois Curfman McInnes info->mallocs = (double)a->reallocs; 12704e220ebcSLois Curfman McInnes info->memory = A->mem; 12714e220ebcSLois Curfman McInnes if (A->factor) { 12724e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 12734e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 12744e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 12754e220ebcSLois Curfman McInnes } else { 12764e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 
12774e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 12784e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 12794e220ebcSLois Curfman McInnes } 12803a40ed3dSBarry Smith PetscFunctionReturn(0); 128117ab2063SBarry Smith } 128217ab2063SBarry Smith 12834a2ae208SSatish Balay #undef __FUNCT__ 12844a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqAIJ" 1285dfbe8321SBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,IS is,const PetscScalar *diag) 128617ab2063SBarry Smith { 1287416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12886849ba73SBarry Smith PetscErrorCode ierr; 128997f1f81fSBarry Smith PetscInt i,N,*rows,m = A->m - 1; 129017ab2063SBarry Smith 12913a40ed3dSBarry Smith PetscFunctionBegin; 1292b9b97703SBarry Smith ierr = ISGetLocalSize(is,&N);CHKERRQ(ierr); 129317ab2063SBarry Smith ierr = ISGetIndices(is,&rows);CHKERRQ(ierr); 1294f1e2ffcdSBarry Smith if (a->keepzeroedrows) { 1295f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 129677431f27SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1297bfeeae90SHong Zhang ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 1298f1e2ffcdSBarry Smith } 1299f1e2ffcdSBarry Smith if (diag) { 1300f1e2ffcdSBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1301f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1302f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1303f1e2ffcdSBarry Smith a->a[a->diag[rows[i]]] = *diag; 1304f1e2ffcdSBarry Smith } 1305f1e2ffcdSBarry Smith } 130688e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 1307f1e2ffcdSBarry Smith } else { 130817ab2063SBarry Smith if (diag) { 130917ab2063SBarry Smith for (i=0; i<N; i++) { 131077431f27SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 13117ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 1312416022c9SBarry Smith a->ilen[rows[i]] = 1; 1313bfeeae90SHong Zhang 
a->a[a->i[rows[i]]] = *diag; 1314bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 13157ae801bdSBarry Smith } else { /* in case row was completely empty */ 1316d64ed03dSBarry Smith ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],diag,INSERT_VALUES);CHKERRQ(ierr); 131717ab2063SBarry Smith } 131817ab2063SBarry Smith } 13193a40ed3dSBarry Smith } else { 132017ab2063SBarry Smith for (i=0; i<N; i++) { 132177431f27SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1322416022c9SBarry Smith a->ilen[rows[i]] = 0; 132317ab2063SBarry Smith } 132417ab2063SBarry Smith } 132588e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 1326f1e2ffcdSBarry Smith } 13277ae801bdSBarry Smith ierr = ISRestoreIndices(is,&rows);CHKERRQ(ierr); 132843a90d84SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13293a40ed3dSBarry Smith PetscFunctionReturn(0); 133017ab2063SBarry Smith } 133117ab2063SBarry Smith 13324a2ae208SSatish Balay #undef __FUNCT__ 13334a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqAIJ" 133497f1f81fSBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 133517ab2063SBarry Smith { 1336416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 133797f1f81fSBarry Smith PetscInt *itmp; 133817ab2063SBarry Smith 13393a40ed3dSBarry Smith PetscFunctionBegin; 134077431f27SBarry Smith if (row < 0 || row >= A->m) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 134117ab2063SBarry Smith 1342416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 1343bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 134417ab2063SBarry Smith if (idx) { 1345bfeeae90SHong Zhang itmp = a->j + a->i[row]; 1346bfeeae90SHong Zhang if (*nz) { 13474e093b46SBarry Smith *idx = itmp; 134817ab2063SBarry Smith } 134917ab2063SBarry Smith else *idx = 0; 135017ab2063SBarry Smith } 13513a40ed3dSBarry Smith PetscFunctionReturn(0); 135217ab2063SBarry Smith } 
135317ab2063SBarry Smith 1354bfeeae90SHong Zhang /* remove this function? */ 13554a2ae208SSatish Balay #undef __FUNCT__ 13564a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqAIJ" 135797f1f81fSBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 135817ab2063SBarry Smith { 13593a40ed3dSBarry Smith PetscFunctionBegin; 13603a40ed3dSBarry Smith PetscFunctionReturn(0); 136117ab2063SBarry Smith } 136217ab2063SBarry Smith 13634a2ae208SSatish Balay #undef __FUNCT__ 13644a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqAIJ" 1365dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 136617ab2063SBarry Smith { 1367416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 136887828ca2SBarry Smith PetscScalar *v = a->a; 136936db0b34SBarry Smith PetscReal sum = 0.0; 13706849ba73SBarry Smith PetscErrorCode ierr; 137197f1f81fSBarry Smith PetscInt i,j; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 137417ab2063SBarry Smith if (type == NORM_FROBENIUS) { 1375416022c9SBarry Smith for (i=0; i<a->nz; i++) { 1376aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 137736db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 137817ab2063SBarry Smith #else 137917ab2063SBarry Smith sum += (*v)*(*v); v++; 138017ab2063SBarry Smith #endif 138117ab2063SBarry Smith } 1382064f8208SBarry Smith *nrm = sqrt(sum); 13833a40ed3dSBarry Smith } else if (type == NORM_1) { 138436db0b34SBarry Smith PetscReal *tmp; 138597f1f81fSBarry Smith PetscInt *jj = a->j; 1386b0a32e0cSBarry Smith ierr = PetscMalloc((A->n+1)*sizeof(PetscReal),&tmp);CHKERRQ(ierr); 1387273d9f13SBarry Smith ierr = PetscMemzero(tmp,A->n*sizeof(PetscReal));CHKERRQ(ierr); 1388064f8208SBarry Smith *nrm = 0.0; 1389416022c9SBarry Smith for (j=0; j<a->nz; j++) { 1390bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 139117ab2063SBarry Smith } 1392273d9f13SBarry Smith for (j=0; j<A->n; j++) { 
1393064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 139417ab2063SBarry Smith } 1395606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 13963a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1397064f8208SBarry Smith *nrm = 0.0; 1398273d9f13SBarry Smith for (j=0; j<A->m; j++) { 1399bfeeae90SHong Zhang v = a->a + a->i[j]; 140017ab2063SBarry Smith sum = 0.0; 1401416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 1402cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 140317ab2063SBarry Smith } 1404064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 140517ab2063SBarry Smith } 14063a40ed3dSBarry Smith } else { 140729bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"No support for two norm"); 140817ab2063SBarry Smith } 14093a40ed3dSBarry Smith PetscFunctionReturn(0); 141017ab2063SBarry Smith } 141117ab2063SBarry Smith 14124a2ae208SSatish Balay #undef __FUNCT__ 14134a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqAIJ" 1414dfbe8321SBarry Smith PetscErrorCode MatTranspose_SeqAIJ(Mat A,Mat *B) 141517ab2063SBarry Smith { 1416416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1417416022c9SBarry Smith Mat C; 14186849ba73SBarry Smith PetscErrorCode ierr; 141997f1f81fSBarry Smith PetscInt i,*aj = a->j,*ai = a->i,m = A->m,len,*col; 142087828ca2SBarry Smith PetscScalar *array = a->a; 142117ab2063SBarry Smith 14223a40ed3dSBarry Smith PetscFunctionBegin; 1423273d9f13SBarry Smith if (!B && m != A->n) SETERRQ(PETSC_ERR_ARG_SIZ,"Square matrix only for in-place"); 142497f1f81fSBarry Smith ierr = PetscMalloc((1+A->n)*sizeof(PetscInt),&col);CHKERRQ(ierr); 142597f1f81fSBarry Smith ierr = PetscMemzero(col,(1+A->n)*sizeof(PetscInt));CHKERRQ(ierr); 1426bfeeae90SHong Zhang 1427bfeeae90SHong Zhang for (i=0; i<ai[m]; i++) col[aj[i]] += 1; 1428f204ca49SKris Buschelman ierr = MatCreate(A->comm,A->n,m,A->n,m,&C);CHKERRQ(ierr); 1429f204ca49SKris Buschelman ierr = MatSetType(C,A->type_name);CHKERRQ(ierr); 1430*ab93d7beSBarry Smith ierr = 
MatSeqAIJSetPreallocation_SeqAIJ(C,0,col);CHKERRQ(ierr); 1431606d414cSSatish Balay ierr = PetscFree(col);CHKERRQ(ierr); 143217ab2063SBarry Smith for (i=0; i<m; i++) { 143317ab2063SBarry Smith len = ai[i+1]-ai[i]; 1434416022c9SBarry Smith ierr = MatSetValues(C,len,aj,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 1435b9b97703SBarry Smith array += len; 1436b9b97703SBarry Smith aj += len; 143717ab2063SBarry Smith } 143817ab2063SBarry Smith 14396d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14406d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 144117ab2063SBarry Smith 1442f1e2ffcdSBarry Smith if (B) { 1443416022c9SBarry Smith *B = C; 144417ab2063SBarry Smith } else { 1445273d9f13SBarry Smith ierr = MatHeaderCopy(A,C);CHKERRQ(ierr); 144617ab2063SBarry Smith } 14473a40ed3dSBarry Smith PetscFunctionReturn(0); 144817ab2063SBarry Smith } 144917ab2063SBarry Smith 1450cd0d46ebSvictorle EXTERN_C_BEGIN 1451cd0d46ebSvictorle #undef __FUNCT__ 14525fbd3699SBarry Smith #define __FUNCT__ "MatIsTranspose_SeqAIJ" 1453be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscTruth *f) 1454cd0d46ebSvictorle { 1455cd0d46ebSvictorle Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 145697f1f81fSBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; PetscScalar *va,*vb; 14576849ba73SBarry Smith PetscErrorCode ierr; 145897f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 1459cd0d46ebSvictorle 1460cd0d46ebSvictorle PetscFunctionBegin; 1461cd0d46ebSvictorle bij = (Mat_SeqAIJ *) B->data; 1462cd0d46ebSvictorle 1463cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 1464cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 14655485867bSBarry Smith if (ma!=nb || na!=mb){ 14665485867bSBarry Smith *f = PETSC_FALSE; 14675485867bSBarry Smith PetscFunctionReturn(0); 14685485867bSBarry Smith } 1469cd0d46ebSvictorle aii = aij->i; bii = bij->i; 
1470cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 1471cd0d46ebSvictorle va = aij->a; vb = bij->a; 147297f1f81fSBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 147397f1f81fSBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 1474cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 1475cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 1476cd0d46ebSvictorle 1477cd0d46ebSvictorle *f = PETSC_TRUE; 1478cd0d46ebSvictorle for (i=0; i<ma; i++) { 1479cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 148097f1f81fSBarry Smith PetscInt idc,idr; 14815485867bSBarry Smith PetscScalar vc,vr; 1482cd0d46ebSvictorle /* column/row index/value */ 14835485867bSBarry Smith idc = adx[aptr[i]]; 14845485867bSBarry Smith idr = bdx[bptr[idc]]; 14855485867bSBarry Smith vc = va[aptr[i]]; 14865485867bSBarry Smith vr = vb[bptr[idc]]; 14875485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 14885485867bSBarry Smith *f = PETSC_FALSE; 14895485867bSBarry Smith goto done; 1490cd0d46ebSvictorle } else { 14915485867bSBarry Smith aptr[i]++; 14925485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 1493cd0d46ebSvictorle } 1494cd0d46ebSvictorle } 1495cd0d46ebSvictorle } 1496cd0d46ebSvictorle done: 1497cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 14983aeef889SHong Zhang if (B) { 14993aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 15003aeef889SHong Zhang } 1501cd0d46ebSvictorle PetscFunctionReturn(0); 1502cd0d46ebSvictorle } 1503cd0d46ebSvictorle EXTERN_C_END 1504cd0d46ebSvictorle 15059e29f15eSvictorle #undef __FUNCT__ 15069e29f15eSvictorle #define __FUNCT__ "MatIsSymmetric_SeqAIJ" 1507dfbe8321SBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscTruth *f) 15089e29f15eSvictorle { 1509dfbe8321SBarry Smith PetscErrorCode ierr; 15109e29f15eSvictorle PetscFunctionBegin; 15115485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 15129e29f15eSvictorle PetscFunctionReturn(0); 
15139e29f15eSvictorle } 15149e29f15eSvictorle 15154a2ae208SSatish Balay #undef __FUNCT__ 15164a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqAIJ" 1517dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 151817ab2063SBarry Smith { 1519416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 152087828ca2SBarry Smith PetscScalar *l,*r,x,*v; 1521dfbe8321SBarry Smith PetscErrorCode ierr; 152297f1f81fSBarry Smith PetscInt i,j,m = A->m,n = A->n,M,nz = a->nz,*jj; 152317ab2063SBarry Smith 15243a40ed3dSBarry Smith PetscFunctionBegin; 152517ab2063SBarry Smith if (ll) { 15263ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 15273ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 1528e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 1529273d9f13SBarry Smith if (m != A->m) SETERRQ(PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 15301ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 1531416022c9SBarry Smith v = a->a; 153217ab2063SBarry Smith for (i=0; i<m; i++) { 153317ab2063SBarry Smith x = l[i]; 1534416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 153517ab2063SBarry Smith for (j=0; j<M; j++) { (*v++) *= x;} 153617ab2063SBarry Smith } 15371ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 1538efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 153917ab2063SBarry Smith } 154017ab2063SBarry Smith if (rr) { 1541e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 1542273d9f13SBarry Smith if (n != A->n) SETERRQ(PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 15431ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 1544416022c9SBarry Smith v = a->a; jj = a->j; 154517ab2063SBarry Smith for (i=0; i<nz; i++) { 1546bfeeae90SHong Zhang (*v++) *= r[*jj++]; 154717ab2063SBarry Smith } 15481ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 1549efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 
155017ab2063SBarry Smith } 15513a40ed3dSBarry Smith PetscFunctionReturn(0); 155217ab2063SBarry Smith } 155317ab2063SBarry Smith 15544a2ae208SSatish Balay #undef __FUNCT__ 15554a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqAIJ" 155697f1f81fSBarry Smith PetscErrorCode MatGetSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 155717ab2063SBarry Smith { 1558db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 15596849ba73SBarry Smith PetscErrorCode ierr; 156097f1f81fSBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->n,*lens; 156197f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 156297f1f81fSBarry Smith PetscInt *irow,*icol,nrows,ncols; 156397f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 156487828ca2SBarry Smith PetscScalar *a_new,*mat_a; 1565416022c9SBarry Smith Mat C; 1566fee21e36SBarry Smith PetscTruth stride; 156717ab2063SBarry Smith 15683a40ed3dSBarry Smith PetscFunctionBegin; 1569d64ed03dSBarry Smith ierr = ISSorted(isrow,(PetscTruth*)&i);CHKERRQ(ierr); 157029bbc08cSBarry Smith if (!i) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"ISrow is not sorted"); 1571d64ed03dSBarry Smith ierr = ISSorted(iscol,(PetscTruth*)&i);CHKERRQ(ierr); 157229bbc08cSBarry Smith if (!i) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"IScol is not sorted"); 157399141d43SSatish Balay 157417ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 1575b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 1576b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 157717ab2063SBarry Smith 1578fee21e36SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 1579fee21e36SBarry Smith ierr = ISStride(iscol,&stride);CHKERRQ(ierr); 1580fee21e36SBarry Smith if (stride && step == 1) { 158102834360SBarry Smith /* special case of contiguous rows */ 158297f1f81fSBarry Smith ierr = 
PetscMalloc((2*nrows+1)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 158331ebf83bSSatish Balay starts = lens + nrows; 158402834360SBarry Smith /* loop over new rows determining lens and starting points */ 158502834360SBarry Smith for (i=0; i<nrows; i++) { 1586bfeeae90SHong Zhang kstart = ai[irow[i]]; 1587a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 158802834360SBarry Smith for (k=kstart; k<kend; k++) { 1589bfeeae90SHong Zhang if (aj[k] >= first) { 159002834360SBarry Smith starts[i] = k; 159102834360SBarry Smith break; 159202834360SBarry Smith } 159302834360SBarry Smith } 1594a2744918SBarry Smith sum = 0; 159502834360SBarry Smith while (k < kend) { 1596bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 1597a2744918SBarry Smith sum++; 159802834360SBarry Smith } 1599a2744918SBarry Smith lens[i] = sum; 160002834360SBarry Smith } 160102834360SBarry Smith /* create submatrix */ 1602cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 160397f1f81fSBarry Smith PetscInt n_cols,n_rows; 160408480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 160529bbc08cSBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 1606d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 160708480c60SBarry Smith C = *B; 16083a40ed3dSBarry Smith } else { 1609e2d9671bSKris Buschelman ierr = MatCreate(A->comm,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE,&C);CHKERRQ(ierr); 1610e2d9671bSKris Buschelman ierr = MatSetType(C,A->type_name);CHKERRQ(ierr); 1611*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 161208480c60SBarry Smith } 1613db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 1614db02288aSLois Curfman McInnes 161502834360SBarry Smith /* loop over rows inserting into submatrix */ 1616db02288aSLois Curfman McInnes a_new = c->a; 1617db02288aSLois Curfman McInnes j_new = c->j; 1618db02288aSLois Curfman McInnes i_new = c->i; 1619bfeeae90SHong Zhang 162002834360SBarry 
Smith for (i=0; i<nrows; i++) { 1621a2744918SBarry Smith ii = starts[i]; 1622a2744918SBarry Smith lensi = lens[i]; 1623a2744918SBarry Smith for (k=0; k<lensi; k++) { 1624a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 162502834360SBarry Smith } 162687828ca2SBarry Smith ierr = PetscMemcpy(a_new,a->a + starts[i],lensi*sizeof(PetscScalar));CHKERRQ(ierr); 1627a2744918SBarry Smith a_new += lensi; 1628a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 1629a2744918SBarry Smith c->ilen[i] = lensi; 163002834360SBarry Smith } 1631606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 16323a40ed3dSBarry Smith } else { 163302834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 163497f1f81fSBarry Smith ierr = PetscMalloc((1+oldcols)*sizeof(PetscInt),&smap);CHKERRQ(ierr); 1635bfeeae90SHong Zhang 163697f1f81fSBarry Smith ierr = PetscMalloc((1+nrows)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 163797f1f81fSBarry Smith ierr = PetscMemzero(smap,oldcols*sizeof(PetscInt));CHKERRQ(ierr); 163817ab2063SBarry Smith for (i=0; i<ncols; i++) smap[icol[i]] = i+1; 163902834360SBarry Smith /* determine lens of each row */ 164002834360SBarry Smith for (i=0; i<nrows; i++) { 1641bfeeae90SHong Zhang kstart = ai[irow[i]]; 164202834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 164302834360SBarry Smith lens[i] = 0; 164402834360SBarry Smith for (k=kstart; k<kend; k++) { 1645bfeeae90SHong Zhang if (smap[aj[k]]) { 164602834360SBarry Smith lens[i]++; 164702834360SBarry Smith } 164802834360SBarry Smith } 164902834360SBarry Smith } 165017ab2063SBarry Smith /* Create and fill new matrix */ 1651a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 16520f5bd95cSBarry Smith PetscTruth equal; 16530f5bd95cSBarry Smith 165499141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 1655273d9f13SBarry Smith if ((*B)->m != nrows || (*B)->n != ncols) SETERRQ(PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. 
wrong size"); 165697f1f81fSBarry Smith ierr = PetscMemcmp(c->ilen,lens,(*B)->m*sizeof(PetscInt),&equal);CHKERRQ(ierr); 16570f5bd95cSBarry Smith if (!equal) { 165829bbc08cSBarry Smith SETERRQ(PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 165999141d43SSatish Balay } 166097f1f81fSBarry Smith ierr = PetscMemzero(c->ilen,(*B)->m*sizeof(PetscInt));CHKERRQ(ierr); 166108480c60SBarry Smith C = *B; 16623a40ed3dSBarry Smith } else { 1663e2d9671bSKris Buschelman ierr = MatCreate(A->comm,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE,&C);CHKERRQ(ierr); 1664e2d9671bSKris Buschelman ierr = MatSetType(C,A->type_name);CHKERRQ(ierr); 1665*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 166608480c60SBarry Smith } 166799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 166817ab2063SBarry Smith for (i=0; i<nrows; i++) { 166999141d43SSatish Balay row = irow[i]; 1670bfeeae90SHong Zhang kstart = ai[row]; 167199141d43SSatish Balay kend = kstart + a->ilen[row]; 1672bfeeae90SHong Zhang mat_i = c->i[i]; 167399141d43SSatish Balay mat_j = c->j + mat_i; 167499141d43SSatish Balay mat_a = c->a + mat_i; 167599141d43SSatish Balay mat_ilen = c->ilen + i; 167617ab2063SBarry Smith for (k=kstart; k<kend; k++) { 1677bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 1678ed480e8bSBarry Smith *mat_j++ = tcol - 1; 167999141d43SSatish Balay *mat_a++ = a->a[k]; 168099141d43SSatish Balay (*mat_ilen)++; 168199141d43SSatish Balay 168217ab2063SBarry Smith } 168317ab2063SBarry Smith } 168417ab2063SBarry Smith } 168502834360SBarry Smith /* Free work space */ 168602834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 1687606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 1688606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 168902834360SBarry Smith } 16906d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 16916d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 
169217ab2063SBarry Smith 169317ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 1694416022c9SBarry Smith *B = C; 16953a40ed3dSBarry Smith PetscFunctionReturn(0); 169617ab2063SBarry Smith } 169717ab2063SBarry Smith 1698a871dcd8SBarry Smith /* 1699a871dcd8SBarry Smith */ 17004a2ae208SSatish Balay #undef __FUNCT__ 17014a2ae208SSatish Balay #define __FUNCT__ "MatILUFactor_SeqAIJ" 1702dfbe8321SBarry Smith PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,MatFactorInfo *info) 1703a871dcd8SBarry Smith { 170463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 1705dfbe8321SBarry Smith PetscErrorCode ierr; 170663b91edcSBarry Smith Mat outA; 1707b8a78c4aSBarry Smith PetscTruth row_identity,col_identity; 170863b91edcSBarry Smith 17093a40ed3dSBarry Smith PetscFunctionBegin; 1710d3d32019SBarry Smith if (info->levels != 0) SETERRQ(PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 1711b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 1712b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 1713b8a78c4aSBarry Smith if (!row_identity || !col_identity) { 1714634064b4SBarry Smith SETERRQ(PETSC_ERR_ARG_WRONG,"Row and column permutations must be identity for in-place ILU"); 1715b8a78c4aSBarry Smith } 1716a871dcd8SBarry Smith 171763b91edcSBarry Smith outA = inA; 171863b91edcSBarry Smith inA->factor = FACTOR_LU; 171963b91edcSBarry Smith a->row = row; 172063b91edcSBarry Smith a->col = col; 1721c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 1722c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 172363b91edcSBarry Smith 172436db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 1725b9b97703SBarry Smith if (a->icol) {ierr = ISDestroy(a->icol);CHKERRQ(ierr);} /* need to remove old one */ 17264c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 
172752e6d16bSBarry Smith ierr = PetscLogObjectParent(inA,a->icol);CHKERRQ(ierr); 1728f0ec6fceSSatish Balay 172994a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 173087828ca2SBarry Smith ierr = PetscMalloc((inA->m+1)*sizeof(PetscScalar),&a->solve_work);CHKERRQ(ierr); 173194a9d846SBarry Smith } 173263b91edcSBarry Smith 173308480c60SBarry Smith if (!a->diag) { 1734f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 173563b91edcSBarry Smith } 1736af281ebdSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ(inA,info,&outA);CHKERRQ(ierr); 17373a40ed3dSBarry Smith PetscFunctionReturn(0); 1738a871dcd8SBarry Smith } 1739a871dcd8SBarry Smith 1740d9eff348SSatish Balay #include "petscblaslapack.h" 17414a2ae208SSatish Balay #undef __FUNCT__ 17424a2ae208SSatish Balay #define __FUNCT__ "MatScale_SeqAIJ" 1743dfbe8321SBarry Smith PetscErrorCode MatScale_SeqAIJ(const PetscScalar *alpha,Mat inA) 1744f0b747eeSBarry Smith { 1745f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 17464ce68768SBarry Smith PetscBLASInt bnz = (PetscBLASInt)a->nz,one = 1; 1747efee365bSSatish Balay PetscErrorCode ierr; 1748efee365bSSatish Balay 17493a40ed3dSBarry Smith 17503a40ed3dSBarry Smith PetscFunctionBegin; 175171044d3cSBarry Smith BLASscal_(&bnz,(PetscScalar*)alpha,a->a,&one); 1752efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 17533a40ed3dSBarry Smith PetscFunctionReturn(0); 1754f0b747eeSBarry Smith } 1755f0b747eeSBarry Smith 17564a2ae208SSatish Balay #undef __FUNCT__ 17574a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqAIJ" 175897f1f81fSBarry Smith PetscErrorCode MatGetSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 1759cddf8d76SBarry Smith { 1760dfbe8321SBarry Smith PetscErrorCode ierr; 176197f1f81fSBarry Smith PetscInt i; 1762cddf8d76SBarry Smith 17633a40ed3dSBarry Smith PetscFunctionBegin; 1764cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 
1765b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 1766cddf8d76SBarry Smith } 1767cddf8d76SBarry Smith 1768cddf8d76SBarry Smith for (i=0; i<n; i++) { 17696a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 1770cddf8d76SBarry Smith } 17713a40ed3dSBarry Smith PetscFunctionReturn(0); 1772cddf8d76SBarry Smith } 1773cddf8d76SBarry Smith 17744a2ae208SSatish Balay #undef __FUNCT__ 17754a2ae208SSatish Balay #define __FUNCT__ "MatIncreaseOverlap_SeqAIJ" 177697f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 17774dcbc457SBarry Smith { 1778e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17796849ba73SBarry Smith PetscErrorCode ierr; 178097f1f81fSBarry Smith PetscInt row,i,j,k,l,m,n,*idx,*nidx,isz,val; 178197f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 1782f1af5d2fSBarry Smith PetscBT table; 1783bbd702dbSSatish Balay 17843a40ed3dSBarry Smith PetscFunctionBegin; 1785273d9f13SBarry Smith m = A->m; 1786e4d965acSSatish Balay ai = a->i; 1787bfeeae90SHong Zhang aj = a->j; 17888a047759SSatish Balay 1789a45adfd6SMatthew Knepley if (ov < 0) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 179006763907SSatish Balay 179197f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nidx);CHKERRQ(ierr); 17926831982aSBarry Smith ierr = PetscBTCreate(m,table);CHKERRQ(ierr); 179306763907SSatish Balay 1794e4d965acSSatish Balay for (i=0; i<is_max; i++) { 1795b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 1796e4d965acSSatish Balay isz = 0; 17976831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 1798e4d965acSSatish Balay 1799e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 18004dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 1801b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 1802e4d965acSSatish Balay 
1803dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 1804e4d965acSSatish Balay for (j=0; j<n ; ++j){ 1805f1af5d2fSBarry Smith if(!PetscBTLookupSet(table,idx[j])) { nidx[isz++] = idx[j];} 18064dcbc457SBarry Smith } 180706763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 180806763907SSatish Balay ierr = ISDestroy(is[i]);CHKERRQ(ierr); 1809e4d965acSSatish Balay 181004a348a9SBarry Smith k = 0; 181104a348a9SBarry Smith for (j=0; j<ov; j++){ /* for each overlap */ 181204a348a9SBarry Smith n = isz; 181306763907SSatish Balay for (; k<n ; k++){ /* do only those rows in nidx[k], which are not done yet */ 1814e4d965acSSatish Balay row = nidx[k]; 1815e4d965acSSatish Balay start = ai[row]; 1816e4d965acSSatish Balay end = ai[row+1]; 181704a348a9SBarry Smith for (l = start; l<end ; l++){ 1818efb16452SHong Zhang val = aj[l] ; 1819f1af5d2fSBarry Smith if (!PetscBTLookupSet(table,val)) {nidx[isz++] = val;} 1820e4d965acSSatish Balay } 1821e4d965acSSatish Balay } 1822e4d965acSSatish Balay } 1823029af93fSBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,(is+i));CHKERRQ(ierr); 1824e4d965acSSatish Balay } 18256831982aSBarry Smith ierr = PetscBTDestroy(table);CHKERRQ(ierr); 1826606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 18273a40ed3dSBarry Smith PetscFunctionReturn(0); 18284dcbc457SBarry Smith } 182917ab2063SBarry Smith 18300513a670SBarry Smith /* -------------------------------------------------------------- */ 18314a2ae208SSatish Balay #undef __FUNCT__ 18324a2ae208SSatish Balay #define __FUNCT__ "MatPermute_SeqAIJ" 1833dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 18340513a670SBarry Smith { 18350513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 18366849ba73SBarry Smith PetscErrorCode ierr; 183797f1f81fSBarry Smith PetscInt i,nz,m = A->m,n = A->n,*col; 183897f1f81fSBarry Smith PetscInt *row,*cnew,j,*lens; 183956cd22aeSBarry 
Smith IS icolp,irowp; 184097f1f81fSBarry Smith PetscInt *cwork; 184132ec9ce4SBarry Smith PetscScalar *vwork; 18420513a670SBarry Smith 18433a40ed3dSBarry Smith PetscFunctionBegin; 18444c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 184556cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 18464c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 184756cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 18480513a670SBarry Smith 18490513a670SBarry Smith /* determine lengths of permuted rows */ 185097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 18510513a670SBarry Smith for (i=0; i<m; i++) { 18520513a670SBarry Smith lens[row[i]] = a->i[i+1] - a->i[i]; 18530513a670SBarry Smith } 1854f204ca49SKris Buschelman ierr = MatCreate(A->comm,m,n,m,n,B);CHKERRQ(ierr); 1855f204ca49SKris Buschelman ierr = MatSetType(*B,A->type_name);CHKERRQ(ierr); 1856*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 1857606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 18580513a670SBarry Smith 185997f1f81fSBarry Smith ierr = PetscMalloc(n*sizeof(PetscInt),&cnew);CHKERRQ(ierr); 18600513a670SBarry Smith for (i=0; i<m; i++) { 186132ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 18620513a670SBarry Smith for (j=0; j<nz; j++) { cnew[j] = col[cwork[j]];} 1863cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 186432ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 18650513a670SBarry Smith } 1866606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 18673c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 18680513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18690513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 187056cd22aeSBarry 
Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 187156cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 187256cd22aeSBarry Smith ierr = ISDestroy(irowp);CHKERRQ(ierr); 187356cd22aeSBarry Smith ierr = ISDestroy(icolp);CHKERRQ(ierr); 18743a40ed3dSBarry Smith PetscFunctionReturn(0); 18750513a670SBarry Smith } 18760513a670SBarry Smith 18774a2ae208SSatish Balay #undef __FUNCT__ 18784a2ae208SSatish Balay #define __FUNCT__ "MatPrintHelp_SeqAIJ" 1879dfbe8321SBarry Smith PetscErrorCode MatPrintHelp_SeqAIJ(Mat A) 1880682d7d0cSBarry Smith { 1881c38d4ed2SBarry Smith static PetscTruth called = PETSC_FALSE; 1882682d7d0cSBarry Smith MPI_Comm comm = A->comm; 1883dfbe8321SBarry Smith PetscErrorCode ierr; 1884682d7d0cSBarry Smith 18853a40ed3dSBarry Smith PetscFunctionBegin; 18864846f1f5SKris Buschelman ierr = MatPrintHelp_Inode(A);CHKERRQ(ierr); 1887c38d4ed2SBarry Smith if (called) {PetscFunctionReturn(0);} else called = PETSC_TRUE; 1888d132466eSBarry Smith ierr = (*PetscHelpPrintf)(comm," Options for MATSEQAIJ and MATMPIAIJ matrix formats (the defaults):\n");CHKERRQ(ierr); 1889d132466eSBarry Smith ierr = (*PetscHelpPrintf)(comm," -mat_lu_pivotthreshold <threshold>: Set pivoting threshold\n");CHKERRQ(ierr); 1890d132466eSBarry Smith ierr = (*PetscHelpPrintf)(comm," -mat_aij_oneindex: internal indices begin at 1 instead of the default 0.\n");CHKERRQ(ierr); 189173e7a558SHong Zhang ierr = (*PetscHelpPrintf)(comm," -mat_no_compressedrow: Do not use compressedrow\n");CHKERRQ(ierr); 18923a40ed3dSBarry Smith PetscFunctionReturn(0); 1893682d7d0cSBarry Smith } 189497304618SKris Buschelman 18954a2ae208SSatish Balay #undef __FUNCT__ 18964a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqAIJ" 1897dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 1898cb5b572fSBarry Smith { 1899dfbe8321SBarry Smith PetscErrorCode ierr; 1900cb5b572fSBarry Smith 1901cb5b572fSBarry Smith PetscFunctionBegin; 190233f4a19fSKris Buschelman /* If the two 
matrices have the same copy implementation, use fast copy. */ 190333f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 1904be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1905be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 1906be6bf707SBarry Smith 1907bfeeae90SHong Zhang if (a->i[A->m] != b->i[B->m]) { 1908634064b4SBarry Smith SETERRQ(PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 1909cb5b572fSBarry Smith } 1910bfeeae90SHong Zhang ierr = PetscMemcpy(b->a,a->a,(a->i[A->m])*sizeof(PetscScalar));CHKERRQ(ierr); 1911cb5b572fSBarry Smith } else { 1912cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 1913cb5b572fSBarry Smith } 1914cb5b572fSBarry Smith PetscFunctionReturn(0); 1915cb5b572fSBarry Smith } 1916cb5b572fSBarry Smith 19174a2ae208SSatish Balay #undef __FUNCT__ 19184a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqAIJ" 1919dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqAIJ(Mat A) 1920273d9f13SBarry Smith { 1921dfbe8321SBarry Smith PetscErrorCode ierr; 1922273d9f13SBarry Smith 1923273d9f13SBarry Smith PetscFunctionBegin; 1924*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 1925273d9f13SBarry Smith PetscFunctionReturn(0); 1926273d9f13SBarry Smith } 1927273d9f13SBarry Smith 19284a2ae208SSatish Balay #undef __FUNCT__ 19294a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqAIJ" 1930dfbe8321SBarry Smith PetscErrorCode MatGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 19316c0721eeSBarry Smith { 19326c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 19336c0721eeSBarry Smith PetscFunctionBegin; 19346c0721eeSBarry Smith *array = a->a; 19356c0721eeSBarry Smith PetscFunctionReturn(0); 19366c0721eeSBarry Smith } 19376c0721eeSBarry Smith 19384a2ae208SSatish Balay #undef __FUNCT__ 19394a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqAIJ" 1940dfbe8321SBarry Smith PetscErrorCode 
MatRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 19416c0721eeSBarry Smith { 19426c0721eeSBarry Smith PetscFunctionBegin; 19436c0721eeSBarry Smith PetscFunctionReturn(0); 19446c0721eeSBarry Smith } 1945273d9f13SBarry Smith 1946ee4f033dSBarry Smith #undef __FUNCT__ 1947ee4f033dSBarry Smith #define __FUNCT__ "MatFDColoringApply_SeqAIJ" 1948dfbe8321SBarry Smith PetscErrorCode MatFDColoringApply_SeqAIJ(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx) 1949ee4f033dSBarry Smith { 19506849ba73SBarry Smith PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void *))coloring->f; 19516849ba73SBarry Smith PetscErrorCode ierr; 195297f1f81fSBarry Smith PetscInt k,N,start,end,l,row,col,srow,**vscaleforrow,m1,m2; 195387828ca2SBarry Smith PetscScalar dx,mone = -1.0,*y,*xx,*w3_array; 195487828ca2SBarry Smith PetscScalar *vscale_array; 1955ee4f033dSBarry Smith PetscReal epsilon = coloring->error_rel,umin = coloring->umin; 1956ee4f033dSBarry Smith Vec w1,w2,w3; 1957ee4f033dSBarry Smith void *fctx = coloring->fctx; 1958ee4f033dSBarry Smith PetscTruth flg; 1959ee4f033dSBarry Smith 1960ee4f033dSBarry Smith PetscFunctionBegin; 1961ee4f033dSBarry Smith if (!coloring->w1) { 1962ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w1);CHKERRQ(ierr); 196352e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w1);CHKERRQ(ierr); 1964ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w2);CHKERRQ(ierr); 196552e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w2);CHKERRQ(ierr); 1966ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr); 196752e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w3);CHKERRQ(ierr); 1968ee4f033dSBarry Smith } 1969ee4f033dSBarry Smith w1 = coloring->w1; w2 = coloring->w2; w3 = coloring->w3; 1970ee4f033dSBarry Smith 1971ee4f033dSBarry Smith ierr = MatSetUnfactored(J);CHKERRQ(ierr); 1972e82a3eeeSBarry Smith ierr = 
PetscOptionsHasName(coloring->prefix,"-mat_fd_coloring_dont_rezero",&flg);CHKERRQ(ierr); 1973ee4f033dSBarry Smith if (flg) { 197463ba0a88SBarry Smith ierr = PetscLogInfo((coloring,"MatFDColoringApply_SeqAIJ: Not calling MatZeroEntries()\n"));CHKERRQ(ierr); 1975ee4f033dSBarry Smith } else { 19760b9b6f31SBarry Smith PetscTruth assembled; 19770b9b6f31SBarry Smith ierr = MatAssembled(J,&assembled);CHKERRQ(ierr); 19780b9b6f31SBarry Smith if (assembled) { 1979ee4f033dSBarry Smith ierr = MatZeroEntries(J);CHKERRQ(ierr); 1980ee4f033dSBarry Smith } 19810b9b6f31SBarry Smith } 1982ee4f033dSBarry Smith 1983ee4f033dSBarry Smith ierr = VecGetOwnershipRange(x1,&start,&end);CHKERRQ(ierr); 1984ee4f033dSBarry Smith ierr = VecGetSize(x1,&N);CHKERRQ(ierr); 1985ee4f033dSBarry Smith 1986ee4f033dSBarry Smith /* 1987ee4f033dSBarry Smith This is a horrible, horrible, hack. See DMMGComputeJacobian_Multigrid() it inproperly sets 1988ee4f033dSBarry Smith coloring->F for the coarser grids from the finest 1989ee4f033dSBarry Smith */ 1990ee4f033dSBarry Smith if (coloring->F) { 1991ee4f033dSBarry Smith ierr = VecGetLocalSize(coloring->F,&m1);CHKERRQ(ierr); 1992ee4f033dSBarry Smith ierr = VecGetLocalSize(w1,&m2);CHKERRQ(ierr); 1993ee4f033dSBarry Smith if (m1 != m2) { 1994ee4f033dSBarry Smith coloring->F = 0; 1995ee4f033dSBarry Smith } 1996ee4f033dSBarry Smith } 1997ee4f033dSBarry Smith 1998ee4f033dSBarry Smith if (coloring->F) { 1999ee4f033dSBarry Smith w1 = coloring->F; 2000ee4f033dSBarry Smith coloring->F = 0; 2001ee4f033dSBarry Smith } else { 200266f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2003ee4f033dSBarry Smith ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr); 200466f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2005ee4f033dSBarry Smith } 2006ee4f033dSBarry Smith 2007ee4f033dSBarry Smith /* 2008ee4f033dSBarry Smith Compute all the scale factors and share with other processors 2009ee4f033dSBarry Smith */ 
20101ebc52fbSHong Zhang ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);xx = xx - start; 20111ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr);vscale_array = vscale_array - start; 2012ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 2013ee4f033dSBarry Smith /* 2014ee4f033dSBarry Smith Loop over each column associated with color adding the 2015ee4f033dSBarry Smith perturbation to the vector w3. 2016ee4f033dSBarry Smith */ 2017ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2018ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2019ee4f033dSBarry Smith dx = xx[col]; 2020ee4f033dSBarry Smith if (dx == 0.0) dx = 1.0; 2021ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2022ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2023ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2024ee4f033dSBarry Smith #else 2025ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2026ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2027ee4f033dSBarry Smith #endif 2028ee4f033dSBarry Smith dx *= epsilon; 2029ee4f033dSBarry Smith vscale_array[col] = 1.0/dx; 2030ee4f033dSBarry Smith } 2031ee4f033dSBarry Smith } 20321ebc52fbSHong Zhang vscale_array = vscale_array + start;ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2033ee4f033dSBarry Smith ierr = VecGhostUpdateBegin(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2034ee4f033dSBarry Smith ierr = VecGhostUpdateEnd(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2035ee4f033dSBarry Smith 2036ee4f033dSBarry Smith /* ierr = VecView(coloring->vscale,PETSC_VIEWER_STDOUT_WORLD); 2037ee4f033dSBarry Smith ierr = VecView(x1,PETSC_VIEWER_STDOUT_WORLD);*/ 2038ee4f033dSBarry Smith 2039ee4f033dSBarry Smith if (coloring->vscaleforrow) vscaleforrow = coloring->vscaleforrow; 2040ee4f033dSBarry 
Smith else vscaleforrow = coloring->columnsforrow; 2041ee4f033dSBarry Smith 20421ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2043ee4f033dSBarry Smith /* 2044ee4f033dSBarry Smith Loop over each color 2045ee4f033dSBarry Smith */ 2046ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 204749b058dcSBarry Smith coloring->currentcolor = k; 2048ee4f033dSBarry Smith ierr = VecCopy(x1,w3);CHKERRQ(ierr); 20491ebc52fbSHong Zhang ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);w3_array = w3_array - start; 2050ee4f033dSBarry Smith /* 2051ee4f033dSBarry Smith Loop over each column associated with color adding the 2052ee4f033dSBarry Smith perturbation to the vector w3. 2053ee4f033dSBarry Smith */ 2054ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2055ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2056ee4f033dSBarry Smith dx = xx[col]; 20575b8514ebSBarry Smith if (dx == 0.0) dx = 1.0; 2058ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2059ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2060ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2061ee4f033dSBarry Smith #else 2062ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2063ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2064ee4f033dSBarry Smith #endif 2065ee4f033dSBarry Smith dx *= epsilon; 2066634064b4SBarry Smith if (!PetscAbsScalar(dx)) SETERRQ(PETSC_ERR_PLIB,"Computed 0 differencing parameter"); 2067ee4f033dSBarry Smith w3_array[col] += dx; 2068ee4f033dSBarry Smith } 20691ebc52fbSHong Zhang w3_array = w3_array + start; ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr); 2070ee4f033dSBarry Smith 2071ee4f033dSBarry Smith /* 2072ee4f033dSBarry Smith Evaluate function at x1 + dx (here dx is a vector of perturbations) 2073ee4f033dSBarry Smith */ 2074ee4f033dSBarry Smith 207566f9b7ceSBarry Smith 
ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2076ee4f033dSBarry Smith ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr); 207766f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2078ee4f033dSBarry Smith ierr = VecAXPY(&mone,w1,w2);CHKERRQ(ierr); 2079ee4f033dSBarry Smith 2080ee4f033dSBarry Smith /* 2081ee4f033dSBarry Smith Loop over rows of vector, putting results into Jacobian matrix 2082ee4f033dSBarry Smith */ 20831ebc52fbSHong Zhang ierr = VecGetArray(w2,&y);CHKERRQ(ierr); 2084ee4f033dSBarry Smith for (l=0; l<coloring->nrows[k]; l++) { 2085ee4f033dSBarry Smith row = coloring->rows[k][l]; 2086ee4f033dSBarry Smith col = coloring->columnsforrow[k][l]; 2087ee4f033dSBarry Smith y[row] *= vscale_array[vscaleforrow[k][l]]; 2088ee4f033dSBarry Smith srow = row + start; 2089ee4f033dSBarry Smith ierr = MatSetValues_SeqAIJ(J,1,&srow,1,&col,y+row,INSERT_VALUES);CHKERRQ(ierr); 2090ee4f033dSBarry Smith } 20911ebc52fbSHong Zhang ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr); 2092ee4f033dSBarry Smith } 209349b058dcSBarry Smith coloring->currentcolor = k; 20941ebc52fbSHong Zhang ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 20951ebc52fbSHong Zhang xx = xx + start; ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr); 2096ee4f033dSBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2097ee4f033dSBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2098ee4f033dSBarry Smith PetscFunctionReturn(0); 2099ee4f033dSBarry Smith } 2100ee4f033dSBarry Smith 2101ac90fabeSBarry Smith #include "petscblaslapack.h" 2102ac90fabeSBarry Smith #undef __FUNCT__ 2103ac90fabeSBarry Smith #define __FUNCT__ "MatAXPY_SeqAIJ" 2104dfbe8321SBarry Smith PetscErrorCode MatAXPY_SeqAIJ(const PetscScalar a[],Mat X,Mat Y,MatStructure str) 2105ac90fabeSBarry Smith { 2106dfbe8321SBarry Smith PetscErrorCode ierr; 210797f1f81fSBarry Smith PetscInt i; 2108ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ 
*)X->data,*y = (Mat_SeqAIJ *)Y->data; 21094ce68768SBarry Smith PetscBLASInt one=1,bnz = (PetscBLASInt)x->nz; 2110ac90fabeSBarry Smith 2111ac90fabeSBarry Smith PetscFunctionBegin; 2112ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 211371044d3cSBarry Smith BLASaxpy_(&bnz,(PetscScalar*)a,x->a,&one,y->a,&one); 2114c537a176SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2115a30b2313SHong Zhang if (y->xtoy && y->XtoY != X) { 2116a30b2313SHong Zhang ierr = PetscFree(y->xtoy);CHKERRQ(ierr); 2117a30b2313SHong Zhang ierr = MatDestroy(y->XtoY);CHKERRQ(ierr); 2118a30b2313SHong Zhang } 2119a30b2313SHong Zhang if (!y->xtoy) { /* get xtoy */ 212024f910e3SHong Zhang ierr = MatAXPYGetxtoy_Private(X->m,x->i,x->j,PETSC_NULL, y->i,y->j,PETSC_NULL, &y->xtoy);CHKERRQ(ierr); 2121a30b2313SHong Zhang y->XtoY = X; 2122c537a176SHong Zhang } 2123a30b2313SHong Zhang for (i=0; i<x->nz; i++) y->a[y->xtoy[i]] += (*a)*(x->a[i]); 212463ba0a88SBarry Smith ierr = PetscLogInfo((0,"MatAXPY_SeqAIJ: ratio of nnz(X)/nnz(Y): %d/%d = %g\n",x->nz,y->nz,(PetscReal)(x->nz)/y->nz));CHKERRQ(ierr); 2125ac90fabeSBarry Smith } else { 2126ac90fabeSBarry Smith ierr = MatAXPY_Basic(a,X,Y,str);CHKERRQ(ierr); 2127ac90fabeSBarry Smith } 2128ac90fabeSBarry Smith PetscFunctionReturn(0); 2129ac90fabeSBarry Smith } 2130ac90fabeSBarry Smith 2131521d7252SBarry Smith #undef __FUNCT__ 2132521d7252SBarry Smith #define __FUNCT__ "MatSetBlockSize_SeqAIJ" 2133521d7252SBarry Smith PetscErrorCode MatSetBlockSize_SeqAIJ(Mat A,PetscInt bs) 2134521d7252SBarry Smith { 2135521d7252SBarry Smith PetscFunctionBegin; 2136521d7252SBarry Smith PetscFunctionReturn(0); 2137521d7252SBarry Smith } 2138521d7252SBarry Smith 2139682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 21400a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 2141cb5b572fSBarry Smith MatGetRow_SeqAIJ, 2142cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 
2143cb5b572fSBarry Smith MatMult_SeqAIJ, 214497304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 21457c922b88SBarry Smith MatMultTranspose_SeqAIJ, 21467c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 2147cb5b572fSBarry Smith MatSolve_SeqAIJ, 2148cb5b572fSBarry Smith MatSolveAdd_SeqAIJ, 21497c922b88SBarry Smith MatSolveTranspose_SeqAIJ, 215097304618SKris Buschelman /*10*/ MatSolveTransposeAdd_SeqAIJ, 2151cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 2152cb5b572fSBarry Smith 0, 215317ab2063SBarry Smith MatRelax_SeqAIJ, 215417ab2063SBarry Smith MatTranspose_SeqAIJ, 215597304618SKris Buschelman /*15*/ MatGetInfo_SeqAIJ, 2156cb5b572fSBarry Smith MatEqual_SeqAIJ, 2157cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 2158cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 2159cb5b572fSBarry Smith MatNorm_SeqAIJ, 216097304618SKris Buschelman /*20*/ 0, 2161cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 216217ab2063SBarry Smith MatCompress_SeqAIJ, 2163cb5b572fSBarry Smith MatSetOption_SeqAIJ, 2164cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 216597304618SKris Buschelman /*25*/ MatZeroRows_SeqAIJ, 2166cb5b572fSBarry Smith MatLUFactorSymbolic_SeqAIJ, 2167cb5b572fSBarry Smith MatLUFactorNumeric_SeqAIJ, 2168f76d2b81SHong Zhang MatCholeskyFactorSymbolic_SeqAIJ, 2169a6175056SHong Zhang MatCholeskyFactorNumeric_SeqAIJ, 217097304618SKris Buschelman /*30*/ MatSetUpPreallocation_SeqAIJ, 2171cb5b572fSBarry Smith MatILUFactorSymbolic_SeqAIJ, 2172861ba921SHong Zhang MatICCFactorSymbolic_SeqAIJ, 21736c0721eeSBarry Smith MatGetArray_SeqAIJ, 21746c0721eeSBarry Smith MatRestoreArray_SeqAIJ, 217597304618SKris Buschelman /*35*/ MatDuplicate_SeqAIJ, 2176cb5b572fSBarry Smith 0, 2177cb5b572fSBarry Smith 0, 2178cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 2179cb5b572fSBarry Smith 0, 218097304618SKris Buschelman /*40*/ MatAXPY_SeqAIJ, 2181cb5b572fSBarry Smith MatGetSubMatrices_SeqAIJ, 2182cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 2183cb5b572fSBarry Smith MatGetValues_SeqAIJ, 2184cb5b572fSBarry Smith MatCopy_SeqAIJ, 
218597304618SKris Buschelman /*45*/ MatPrintHelp_SeqAIJ, 2186cb5b572fSBarry Smith MatScale_SeqAIJ, 2187cb5b572fSBarry Smith 0, 2188cb5b572fSBarry Smith 0, 21896945ee14SBarry Smith MatILUDTFactor_SeqAIJ, 2190521d7252SBarry Smith /*50*/ MatSetBlockSize_SeqAIJ, 21913b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 21923b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 21933b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 2194a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 219597304618SKris Buschelman /*55*/ MatFDColoringCreate_SeqAIJ, 2196b9617806SBarry Smith 0, 21970513a670SBarry Smith 0, 2198cda55fadSBarry Smith MatPermute_SeqAIJ, 2199cda55fadSBarry Smith 0, 220097304618SKris Buschelman /*60*/ 0, 2201b9b97703SBarry Smith MatDestroy_SeqAIJ, 2202b9b97703SBarry Smith MatView_SeqAIJ, 22038a124369SBarry Smith MatGetPetscMaps_Petsc, 2204ee4f033dSBarry Smith 0, 220597304618SKris Buschelman /*65*/ 0, 2206ee4f033dSBarry Smith 0, 2207ee4f033dSBarry Smith 0, 2208ee4f033dSBarry Smith 0, 2209ee4f033dSBarry Smith 0, 221097304618SKris Buschelman /*70*/ 0, 2211ee4f033dSBarry Smith 0, 2212ee4f033dSBarry Smith MatSetColoring_SeqAIJ, 2213dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 2214ee4f033dSBarry Smith MatSetValuesAdic_SeqAIJ, 2215dcf5cc72SBarry Smith #else 2216dcf5cc72SBarry Smith 0, 2217dcf5cc72SBarry Smith #endif 2218ee4f033dSBarry Smith MatSetValuesAdifor_SeqAIJ, 221997304618SKris Buschelman /*75*/ MatFDColoringApply_SeqAIJ, 222097304618SKris Buschelman 0, 222197304618SKris Buschelman 0, 222297304618SKris Buschelman 0, 222397304618SKris Buschelman 0, 222497304618SKris Buschelman /*80*/ 0, 222597304618SKris Buschelman 0, 222697304618SKris Buschelman 0, 222797304618SKris Buschelman 0, 2228bc011b1eSHong Zhang MatLoad_SeqAIJ, 2229bc011b1eSHong Zhang /*85*/ MatIsSymmetric_SeqAIJ, 22306284ec50SHong Zhang 0, 22316284ec50SHong Zhang 0, 22326284ec50SHong Zhang 0, 2233bc011b1eSHong Zhang 0, 2234bc011b1eSHong Zhang /*90*/ MatMatMult_SeqAIJ_SeqAIJ, 223526be0446SHong Zhang 
MatMatMultSymbolic_SeqAIJ_SeqAIJ, 223626be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 2237d439da42SKris Buschelman MatPtAP_Basic, 22387ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ, 22397ba1a0bfSKris Buschelman /*95*/ MatPtAPNumeric_SeqAIJ, 2240bc011b1eSHong Zhang MatMatMultTranspose_SeqAIJ_SeqAIJ, 2241bc011b1eSHong Zhang MatMatMultTransposeSymbolic_SeqAIJ_SeqAIJ, 2242bc011b1eSHong Zhang MatMatMultTransposeNumeric_SeqAIJ_SeqAIJ, 22437ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ_SeqAIJ, 22447ba1a0bfSKris Buschelman /*100*/MatPtAPNumeric_SeqAIJ_SeqAIJ, 2245609c6c4dSKris Buschelman 0, 2246609c6c4dSKris Buschelman 0, 22479e29f15eSvictorle }; 224817ab2063SBarry Smith 2249fb2e594dSBarry Smith EXTERN_C_BEGIN 22504a2ae208SSatish Balay #undef __FUNCT__ 22514a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices_SeqAIJ" 2252be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 2253bef8e0ddSBarry Smith { 2254bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 225597f1f81fSBarry Smith PetscInt i,nz,n; 2256bef8e0ddSBarry Smith 2257bef8e0ddSBarry Smith PetscFunctionBegin; 2258bef8e0ddSBarry Smith 2259bef8e0ddSBarry Smith nz = aij->maxnz; 2260273d9f13SBarry Smith n = mat->n; 2261bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 2262bef8e0ddSBarry Smith aij->j[i] = indices[i]; 2263bef8e0ddSBarry Smith } 2264bef8e0ddSBarry Smith aij->nz = nz; 2265bef8e0ddSBarry Smith for (i=0; i<n; i++) { 2266bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 2267bef8e0ddSBarry Smith } 2268bef8e0ddSBarry Smith 2269bef8e0ddSBarry Smith PetscFunctionReturn(0); 2270bef8e0ddSBarry Smith } 2271fb2e594dSBarry Smith EXTERN_C_END 2272bef8e0ddSBarry Smith 22734a2ae208SSatish Balay #undef __FUNCT__ 22744a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices" 2275bef8e0ddSBarry Smith /*@ 2276bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 2277bef8e0ddSBarry Smith in the 
matrix. 2278bef8e0ddSBarry Smith 2279bef8e0ddSBarry Smith Input Parameters: 2280bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 2281bef8e0ddSBarry Smith - indices - the column indices 2282bef8e0ddSBarry Smith 228315091d37SBarry Smith Level: advanced 228415091d37SBarry Smith 2285bef8e0ddSBarry Smith Notes: 2286bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 2287bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 2288bef8e0ddSBarry Smith of the MatSetValues() operation. 2289bef8e0ddSBarry Smith 2290bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 2291d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 2292bef8e0ddSBarry Smith 2293bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 2294bef8e0ddSBarry Smith 2295b9617806SBarry Smith The indices should start with zero, not one. 2296b9617806SBarry Smith 2297bef8e0ddSBarry Smith @*/ 2298be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 2299bef8e0ddSBarry Smith { 230097f1f81fSBarry Smith PetscErrorCode ierr,(*f)(Mat,PetscInt *); 2301bef8e0ddSBarry Smith 2302bef8e0ddSBarry Smith PetscFunctionBegin; 23034482741eSBarry Smith PetscValidHeaderSpecific(mat,MAT_COOKIE,1); 23044482741eSBarry Smith PetscValidPointer(indices,2); 2305c134de8dSSatish Balay ierr = PetscObjectQueryFunction((PetscObject)mat,"MatSeqAIJSetColumnIndices_C",(void (**)(void))&f);CHKERRQ(ierr); 2306bef8e0ddSBarry Smith if (f) { 2307bef8e0ddSBarry Smith ierr = (*f)(mat,indices);CHKERRQ(ierr); 2308bef8e0ddSBarry Smith } else { 2309634064b4SBarry Smith SETERRQ(PETSC_ERR_SUP,"Wrong type of matrix to set column indices"); 2310bef8e0ddSBarry Smith } 2311bef8e0ddSBarry Smith PetscFunctionReturn(0); 2312bef8e0ddSBarry Smith } 2313bef8e0ddSBarry Smith 2314be6bf707SBarry Smith /* 
----------------------------------------------------------------------------------------*/ 2315be6bf707SBarry Smith 2316fb2e594dSBarry Smith EXTERN_C_BEGIN 23174a2ae208SSatish Balay #undef __FUNCT__ 23184a2ae208SSatish Balay #define __FUNCT__ "MatStoreValues_SeqAIJ" 2319be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatStoreValues_SeqAIJ(Mat mat) 2320be6bf707SBarry Smith { 2321be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 23226849ba73SBarry Smith PetscErrorCode ierr; 23236849ba73SBarry Smith size_t nz = aij->i[mat->m]; 2324be6bf707SBarry Smith 2325be6bf707SBarry Smith PetscFunctionBegin; 2326be6bf707SBarry Smith if (aij->nonew != 1) { 2327634064b4SBarry Smith SETERRQ(PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NO_NEW_NONZERO_LOCATIONS);first"); 2328be6bf707SBarry Smith } 2329be6bf707SBarry Smith 2330be6bf707SBarry Smith /* allocate space for values if not already there */ 2331be6bf707SBarry Smith if (!aij->saved_values) { 233287828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&aij->saved_values);CHKERRQ(ierr); 2333be6bf707SBarry Smith } 2334be6bf707SBarry Smith 2335be6bf707SBarry Smith /* copy values over */ 233687828ca2SBarry Smith ierr = PetscMemcpy(aij->saved_values,aij->a,nz*sizeof(PetscScalar));CHKERRQ(ierr); 2337be6bf707SBarry Smith PetscFunctionReturn(0); 2338be6bf707SBarry Smith } 2339fb2e594dSBarry Smith EXTERN_C_END 2340be6bf707SBarry Smith 23414a2ae208SSatish Balay #undef __FUNCT__ 2342b9617806SBarry Smith #define __FUNCT__ "MatStoreValues" 2343be6bf707SBarry Smith /*@ 2344be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 2345be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 2346be6bf707SBarry Smith nonlinear portion. 2347be6bf707SBarry Smith 2348be6bf707SBarry Smith Collect on Mat 2349be6bf707SBarry Smith 2350be6bf707SBarry Smith Input Parameters: 23510e609b76SBarry Smith . 
mat - the matrix (currently only AIJ matrices support this option) 2352be6bf707SBarry Smith 235315091d37SBarry Smith Level: advanced 235415091d37SBarry Smith 2355be6bf707SBarry Smith Common Usage, with SNESSolve(): 2356be6bf707SBarry Smith $ Create Jacobian matrix 2357be6bf707SBarry Smith $ Set linear terms into matrix 2358be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 2359be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 2360be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure) 2361be6bf707SBarry Smith $ ierr = MatSetOption(mat,MAT_NO_NEW_NONZERO_LOCATIONS); 2362be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 2363be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 2364be6bf707SBarry Smith $ In your Jacobian routine 2365be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 2366be6bf707SBarry Smith $ Set nonlinear terms in matrix 2367be6bf707SBarry Smith 2368be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 2369be6bf707SBarry Smith $ // build linear portion of Jacobian 2370be6bf707SBarry Smith $ ierr = MatSetOption(mat,MAT_NO_NEW_NONZERO_LOCATIONS); 2371be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 2372be6bf707SBarry Smith $ loop over nonlinear iterations 2373be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 2374be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 2375be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 2376be6bf707SBarry Smith $ Solve linear system with Jacobian 2377be6bf707SBarry Smith $ endloop 2378be6bf707SBarry Smith 2379be6bf707SBarry Smith Notes: 2380be6bf707SBarry Smith Matrix must already be assembled before calling this routine 2381be6bf707SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NO_NEW_NONZERO_LOCATIONS); before 2382be6bf707SBarry Smith calling this routine. 
2383be6bf707SBarry Smith 2384be6bf707SBarry Smith .seealso: MatRetrieveValues() 2385be6bf707SBarry Smith 2386be6bf707SBarry Smith @*/ 2387be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatStoreValues(Mat mat) 2388be6bf707SBarry Smith { 2389dfbe8321SBarry Smith PetscErrorCode ierr,(*f)(Mat); 2390be6bf707SBarry Smith 2391be6bf707SBarry Smith PetscFunctionBegin; 23924482741eSBarry Smith PetscValidHeaderSpecific(mat,MAT_COOKIE,1); 239329bbc08cSBarry Smith if (!mat->assembled) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 239429bbc08cSBarry Smith if (mat->factor) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2395be6bf707SBarry Smith 2396c134de8dSSatish Balay ierr = PetscObjectQueryFunction((PetscObject)mat,"MatStoreValues_C",(void (**)(void))&f);CHKERRQ(ierr); 2397be6bf707SBarry Smith if (f) { 2398be6bf707SBarry Smith ierr = (*f)(mat);CHKERRQ(ierr); 2399be6bf707SBarry Smith } else { 2400634064b4SBarry Smith SETERRQ(PETSC_ERR_SUP,"Wrong type of matrix to store values"); 2401be6bf707SBarry Smith } 2402be6bf707SBarry Smith PetscFunctionReturn(0); 2403be6bf707SBarry Smith } 2404be6bf707SBarry Smith 2405fb2e594dSBarry Smith EXTERN_C_BEGIN 24064a2ae208SSatish Balay #undef __FUNCT__ 24074a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues_SeqAIJ" 2408be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatRetrieveValues_SeqAIJ(Mat mat) 2409be6bf707SBarry Smith { 2410be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 24116849ba73SBarry Smith PetscErrorCode ierr; 241297f1f81fSBarry Smith PetscInt nz = aij->i[mat->m]; 2413be6bf707SBarry Smith 2414be6bf707SBarry Smith PetscFunctionBegin; 2415be6bf707SBarry Smith if (aij->nonew != 1) { 2416634064b4SBarry Smith SETERRQ(PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NO_NEW_NONZERO_LOCATIONS);first"); 2417be6bf707SBarry Smith } 2418be6bf707SBarry Smith if (!aij->saved_values) { 2419634064b4SBarry Smith SETERRQ(PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 
2420be6bf707SBarry Smith } 2421be6bf707SBarry Smith /* copy values over */ 242287828ca2SBarry Smith ierr = PetscMemcpy(aij->a,aij->saved_values,nz*sizeof(PetscScalar));CHKERRQ(ierr); 2423be6bf707SBarry Smith PetscFunctionReturn(0); 2424be6bf707SBarry Smith } 2425fb2e594dSBarry Smith EXTERN_C_END 2426be6bf707SBarry Smith 24274a2ae208SSatish Balay #undef __FUNCT__ 24284a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues" 2429be6bf707SBarry Smith /*@ 2430be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 2431be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 2432be6bf707SBarry Smith nonlinear portion. 2433be6bf707SBarry Smith 2434be6bf707SBarry Smith Collect on Mat 2435be6bf707SBarry Smith 2436be6bf707SBarry Smith Input Parameters: 2437be6bf707SBarry Smith . mat - the matrix (currently on AIJ matrices support this option) 2438be6bf707SBarry Smith 243915091d37SBarry Smith Level: advanced 244015091d37SBarry Smith 2441be6bf707SBarry Smith .seealso: MatStoreValues() 2442be6bf707SBarry Smith 2443be6bf707SBarry Smith @*/ 2444be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatRetrieveValues(Mat mat) 2445be6bf707SBarry Smith { 2446dfbe8321SBarry Smith PetscErrorCode ierr,(*f)(Mat); 2447be6bf707SBarry Smith 2448be6bf707SBarry Smith PetscFunctionBegin; 24494482741eSBarry Smith PetscValidHeaderSpecific(mat,MAT_COOKIE,1); 245029bbc08cSBarry Smith if (!mat->assembled) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 245129bbc08cSBarry Smith if (mat->factor) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2452be6bf707SBarry Smith 2453c134de8dSSatish Balay ierr = PetscObjectQueryFunction((PetscObject)mat,"MatRetrieveValues_C",(void (**)(void))&f);CHKERRQ(ierr); 2454be6bf707SBarry Smith if (f) { 2455be6bf707SBarry Smith ierr = (*f)(mat);CHKERRQ(ierr); 2456be6bf707SBarry Smith } else { 2457634064b4SBarry Smith SETERRQ(PETSC_ERR_SUP,"Wrong type of matrix 
to retrieve values"); 2458be6bf707SBarry Smith } 2459be6bf707SBarry Smith PetscFunctionReturn(0); 2460be6bf707SBarry Smith } 2461be6bf707SBarry Smith 2462f83d6046SBarry Smith 2463be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 24644a2ae208SSatish Balay #undef __FUNCT__ 24654a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJ" 246617ab2063SBarry Smith /*@C 2467682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 24680d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 24696e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 247051c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 24712bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 247217ab2063SBarry Smith 2473db81eaa0SLois Curfman McInnes Collective on MPI_Comm 2474db81eaa0SLois Curfman McInnes 247517ab2063SBarry Smith Input Parameters: 2476db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 247717ab2063SBarry Smith . m - number of rows 247817ab2063SBarry Smith . n - number of columns 247917ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 248051c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 24812bd5e0b2SLois Curfman McInnes (possibly different for each row) or PETSC_NULL 248217ab2063SBarry Smith 248317ab2063SBarry Smith Output Parameter: 2484416022c9SBarry Smith . 
A - the matrix 248517ab2063SBarry Smith 2486b259b22eSLois Curfman McInnes Notes: 248749a6f317SBarry Smith If nnz is given then nz is ignored 248849a6f317SBarry Smith 248917ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 249017ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 24910002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 249244cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 249317ab2063SBarry Smith 249417ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 2495a40aa06bSLois Curfman McInnes Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 24963d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 24976da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 249817ab2063SBarry Smith 2499682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 25004fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 2501682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 25026c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 25036c7ebb05SLois Curfman McInnes 25046c7ebb05SLois Curfman McInnes Options Database Keys: 2505698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 2506698d4c6aSKris Buschelman . -mat_inode_limit <limit> - Sets inode limit (max limit=5) 2507db81eaa0SLois Curfman McInnes - -mat_aij_oneindex - Internally use indexing starting at 1 2508db81eaa0SLois Curfman McInnes rather than 0. Note that when calling MatSetValues(), 2509db81eaa0SLois Curfman McInnes the user still MUST index entries starting at 0! 
251017ab2063SBarry Smith 2511027ccd11SLois Curfman McInnes Level: intermediate 2512027ccd11SLois Curfman McInnes 251336db0b34SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 251436db0b34SBarry Smith 251517ab2063SBarry Smith @*/ 2516be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 251717ab2063SBarry Smith { 2518dfbe8321SBarry Smith PetscErrorCode ierr; 25196945ee14SBarry Smith 25203a40ed3dSBarry Smith PetscFunctionBegin; 2521273d9f13SBarry Smith ierr = MatCreate(comm,m,n,m,n,A);CHKERRQ(ierr); 2522273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 2523*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,(PetscInt*)nnz);CHKERRQ(ierr); 2524273d9f13SBarry Smith PetscFunctionReturn(0); 2525273d9f13SBarry Smith } 2526273d9f13SBarry Smith 25274a2ae208SSatish Balay #undef __FUNCT__ 25284a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetPreallocation" 2529273d9f13SBarry Smith /*@C 2530273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 2531273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 2532273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 2533273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 2534273d9f13SBarry Smith 2535273d9f13SBarry Smith Collective on MPI_Comm 2536273d9f13SBarry Smith 2537273d9f13SBarry Smith Input Parameters: 253845bfc511SMatthew Knepley + B - The matrix 2539273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 2540273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 2541273d9f13SBarry Smith (possibly different for each row) or PETSC_NULL 2542273d9f13SBarry Smith 2543273d9f13SBarry Smith Notes: 254449a6f317SBarry Smith If nnz is given then nz is ignored 254549a6f317SBarry Smith 2546273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 2547273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 2548273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 2549273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 2550273d9f13SBarry Smith 2551273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 2552273d9f13SBarry Smith Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 2553273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 2554273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 2555273d9f13SBarry Smith 2556a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 2557a96a251dSBarry Smith entries or columns indices 2558a96a251dSBarry Smith 2559273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 2560273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 2561273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 2562273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 2563273d9f13SBarry Smith 2564273d9f13SBarry Smith Options Database Keys: 2565698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 2566698d4c6aSKris Buschelman . 
-mat_inode_limit <limit> - Sets inode limit (max limit=5) 2567273d9f13SBarry Smith - -mat_aij_oneindex - Internally use indexing starting at 1 2568273d9f13SBarry Smith rather than 0. Note that when calling MatSetValues(), 2569273d9f13SBarry Smith the user still MUST index entries starting at 0! 2570273d9f13SBarry Smith 2571273d9f13SBarry Smith Level: intermediate 2572273d9f13SBarry Smith 2573273d9f13SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 2574273d9f13SBarry Smith 2575273d9f13SBarry Smith @*/ 2576be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 2577273d9f13SBarry Smith { 257897f1f81fSBarry Smith PetscErrorCode ierr,(*f)(Mat,PetscInt,const PetscInt[]); 2579a23d5eceSKris Buschelman 2580a23d5eceSKris Buschelman PetscFunctionBegin; 2581a23d5eceSKris Buschelman ierr = PetscObjectQueryFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",(void (**)(void))&f);CHKERRQ(ierr); 2582a23d5eceSKris Buschelman if (f) { 2583a23d5eceSKris Buschelman ierr = (*f)(B,nz,nnz);CHKERRQ(ierr); 2584a23d5eceSKris Buschelman } 2585a23d5eceSKris Buschelman PetscFunctionReturn(0); 2586a23d5eceSKris Buschelman } 2587a23d5eceSKris Buschelman 2588a23d5eceSKris Buschelman EXTERN_C_BEGIN 2589a23d5eceSKris Buschelman #undef __FUNCT__ 2590a23d5eceSKris Buschelman #define __FUNCT__ "MatSeqAIJSetPreallocation_SeqAIJ" 2591be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,PetscInt *nnz) 2592a23d5eceSKris Buschelman { 2593273d9f13SBarry Smith Mat_SeqAIJ *b; 2594a43ee2ecSKris Buschelman PetscTruth skipallocation = PETSC_FALSE; 25956849ba73SBarry Smith PetscErrorCode ierr; 259697f1f81fSBarry Smith PetscInt i; 2597273d9f13SBarry Smith 2598273d9f13SBarry Smith PetscFunctionBegin; 2599d5d45c9bSBarry Smith 2600a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 2601c461c341SBarry Smith 
skipallocation = PETSC_TRUE; 2602c461c341SBarry Smith nz = 0; 2603c461c341SBarry Smith } 2604c461c341SBarry Smith 2605435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 2606435da068SBarry Smith if (nz < 0) SETERRQ1(PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %d",nz); 2607b73539f3SBarry Smith if (nnz) { 2608273d9f13SBarry Smith for (i=0; i<B->m; i++) { 260929bbc08cSBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %d value %d",i,nnz[i]); 26103a7fca6bSBarry Smith if (nnz[i] > B->n) SETERRQ3(PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %d value %d rowlength %d",i,nnz[i],B->n); 2611b73539f3SBarry Smith } 2612b73539f3SBarry Smith } 2613b73539f3SBarry Smith 2614273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 2615273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 2616273d9f13SBarry Smith 2617*ab93d7beSBarry Smith if (!skipallocation) { 2618*ab93d7beSBarry Smith ierr = PetscMalloc2(B->m,PetscInt,&b->imax,B->m,PetscInt,&b->ilen);CHKERRQ(ierr); 2619273d9f13SBarry Smith if (!nnz) { 2620435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 2621273d9f13SBarry Smith else if (nz <= 0) nz = 1; 2622273d9f13SBarry Smith for (i=0; i<B->m; i++) b->imax[i] = nz; 2623273d9f13SBarry Smith nz = nz*B->m; 2624273d9f13SBarry Smith } else { 2625273d9f13SBarry Smith nz = 0; 2626273d9f13SBarry Smith for (i=0; i<B->m; i++) {b->imax[i] = nnz[i]; nz += nnz[i];} 2627273d9f13SBarry Smith } 2628273d9f13SBarry Smith 2629*ab93d7beSBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 2630*ab93d7beSBarry Smith for (i=0; i<B->m; i++) { b->ilen[i] = 0;} 2631*ab93d7beSBarry Smith 2632273d9f13SBarry Smith /* allocate the matrix space */ 2633a96a251dSBarry Smith ierr = PetscMalloc3(nz,PetscScalar,&b->a,nz,PetscInt,&b->j,B->m+1,PetscInt,&b->i);CHKERRQ(ierr); 263497f1f81fSBarry Smith ierr = PetscMemzero(b->j,nz*sizeof(PetscInt));CHKERRQ(ierr); 2635bfeeae90SHong Zhang b->i[0] = 0; 26365da197adSKris Buschelman for (i=1; i<B->m+1; i++) { 26375da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 26385da197adSKris Buschelman } 2639273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 2640273d9f13SBarry Smith b->freedata = PETSC_TRUE; 2641c461c341SBarry Smith } else { 2642c461c341SBarry Smith b->freedata = PETSC_FALSE; 2643c461c341SBarry Smith } 2644273d9f13SBarry Smith 2645273d9f13SBarry Smith b->nz = 0; 2646273d9f13SBarry Smith b->maxnz = nz; 2647273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 2648273d9f13SBarry Smith PetscFunctionReturn(0); 2649273d9f13SBarry Smith } 2650a23d5eceSKris Buschelman EXTERN_C_END 2651273d9f13SBarry Smith 26520bad9183SKris Buschelman /*MC 2653fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 26540bad9183SKris Buschelman based on compressed sparse row format. 26550bad9183SKris Buschelman 26560bad9183SKris Buschelman Options Database Keys: 26570bad9183SKris Buschelman . 
-mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 26580bad9183SKris Buschelman 26590bad9183SKris Buschelman Level: beginner 26600bad9183SKris Buschelman 2661f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType 26620bad9183SKris Buschelman M*/ 26630bad9183SKris Buschelman 2664a6175056SHong Zhang EXTERN_C_BEGIN 26654a2ae208SSatish Balay #undef __FUNCT__ 26664a2ae208SSatish Balay #define __FUNCT__ "MatCreate_SeqAIJ" 2667be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreate_SeqAIJ(Mat B) 2668273d9f13SBarry Smith { 2669273d9f13SBarry Smith Mat_SeqAIJ *b; 2670dfbe8321SBarry Smith PetscErrorCode ierr; 267138baddfdSBarry Smith PetscMPIInt size; 2672273d9f13SBarry Smith 2673273d9f13SBarry Smith PetscFunctionBegin; 2674273d9f13SBarry Smith ierr = MPI_Comm_size(B->comm,&size);CHKERRQ(ierr); 2675273d9f13SBarry Smith if (size > 1) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 2676273d9f13SBarry Smith 2677273d9f13SBarry Smith B->m = B->M = PetscMax(B->m,B->M); 2678273d9f13SBarry Smith B->n = B->N = PetscMax(B->n,B->N); 2679273d9f13SBarry Smith 2680b0a32e0cSBarry Smith ierr = PetscNew(Mat_SeqAIJ,&b);CHKERRQ(ierr); 2681b0a32e0cSBarry Smith B->data = (void*)b; 2682549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 2683416022c9SBarry Smith B->factor = 0; 268490f02eecSBarry Smith B->mapping = 0; 2685416022c9SBarry Smith b->row = 0; 2686416022c9SBarry Smith b->col = 0; 268782bf6240SBarry Smith b->icol = 0; 2688b810aeb4SBarry Smith b->reallocs = 0; 268917ab2063SBarry Smith 26908a124369SBarry Smith ierr = PetscMapCreateMPI(B->comm,B->m,B->m,&B->rmap);CHKERRQ(ierr); 26918a124369SBarry Smith ierr = PetscMapCreateMPI(B->comm,B->n,B->n,&B->cmap);CHKERRQ(ierr); 2692a5ae1ecdSBarry Smith 2693f1e2ffcdSBarry Smith b->sorted = PETSC_FALSE; 269436db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 2695f1e2ffcdSBarry Smith 
b->roworiented = PETSC_TRUE; 2696416022c9SBarry Smith b->nonew = 0; 2697416022c9SBarry Smith b->diag = 0; 2698416022c9SBarry Smith b->solve_work = 0; 26992a1b7f2aSHong Zhang B->spptr = 0; 2700be6bf707SBarry Smith b->saved_values = 0; 2701d7f994e1SBarry Smith b->idiag = 0; 2702d7f994e1SBarry Smith b->ssor = 0; 2703f1e2ffcdSBarry Smith b->keepzeroedrows = PETSC_FALSE; 2704a30b2313SHong Zhang b->xtoy = 0; 2705a30b2313SHong Zhang b->XtoY = 0; 270673e7a558SHong Zhang b->compressedrow.use = PETSC_FALSE; 2707d487561eSHong Zhang b->compressedrow.nrows = B->m; 2708d487561eSHong Zhang b->compressedrow.i = PETSC_NULL; 2709d487561eSHong Zhang b->compressedrow.rindex = PETSC_NULL; 2710d487561eSHong Zhang b->compressedrow.checked = PETSC_FALSE; 271188e51ccdSHong Zhang B->same_nonzero = PETSC_FALSE; 271217ab2063SBarry Smith 271335d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 271435d8aa7fSBarry Smith 2715f1af5d2fSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetColumnIndices_C", 2716bef8e0ddSBarry Smith "MatSeqAIJSetColumnIndices_SeqAIJ", 2717bc4b532fSSatish Balay MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 2718f1af5d2fSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatStoreValues_C", 2719be6bf707SBarry Smith "MatStoreValues_SeqAIJ", 2720bc4b532fSSatish Balay MatStoreValues_SeqAIJ);CHKERRQ(ierr); 2721f1af5d2fSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatRetrieveValues_C", 2722be6bf707SBarry Smith "MatRetrieveValues_SeqAIJ", 2723bc4b532fSSatish Balay MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 2724b24ad042SBarry Smith #if !defined(PETSC_USE_64BIT_INT) 2725a6175056SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqsbaij_C", 2726a6175056SHong Zhang "MatConvert_SeqAIJ_SeqSBAIJ", 2727a6175056SHong Zhang MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 2728b24ad042SBarry Smith #endif 272985fc7724SBarry Smith ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqbaij_C", 273085fc7724SBarry Smith "MatConvert_SeqAIJ_SeqBAIJ", 273185fc7724SBarry Smith MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 27325fbd3699SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsTranspose_C", 27335fbd3699SBarry Smith "MatIsTranspose_SeqAIJ", 27345fbd3699SBarry Smith MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 2735a23d5eceSKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocation_C", 2736a23d5eceSKris Buschelman "MatSeqAIJSetPreallocation_SeqAIJ", 2737a23d5eceSKris Buschelman MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 273805b94e36SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatReorderForNonzeroDiagonal_C", 273905b94e36SKris Buschelman "MatReorderForNonzeroDiagonal_SeqAIJ", 274005b94e36SKris Buschelman MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 27414846f1f5SKris Buschelman ierr = MatCreate_Inode(B);CHKERRQ(ierr); 27423a40ed3dSBarry Smith PetscFunctionReturn(0); 274317ab2063SBarry Smith } 2744273d9f13SBarry Smith EXTERN_C_END 274517ab2063SBarry Smith 27464a2ae208SSatish Balay #undef __FUNCT__ 27474a2ae208SSatish Balay #define __FUNCT__ "MatDuplicate_SeqAIJ" 2748dfbe8321SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 274917ab2063SBarry Smith { 2750416022c9SBarry Smith Mat C; 2751416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 27526849ba73SBarry Smith PetscErrorCode ierr; 275397f1f81fSBarry Smith PetscInt i,m = A->m; 275417ab2063SBarry Smith 27553a40ed3dSBarry Smith PetscFunctionBegin; 27564043dd9cSLois Curfman McInnes *B = 0; 2757273d9f13SBarry Smith ierr = MatCreate(A->comm,A->m,A->n,A->m,A->n,&C);CHKERRQ(ierr); 2758be5d1d56SKris Buschelman ierr = MatSetType(C,A->type_name);CHKERRQ(ierr); 27591d5dac46SHong Zhang ierr = PetscMemcpy(C->ops,A->ops,sizeof(struct _MatOps));CHKERRQ(ierr); 27601d5dac46SHong Zhang 2761273d9f13SBarry 
Smith c = (Mat_SeqAIJ*)C->data; 2762273d9f13SBarry Smith 2763416022c9SBarry Smith C->factor = A->factor; 27646ad4291fSHong Zhang 2765416022c9SBarry Smith c->row = 0; 2766416022c9SBarry Smith c->col = 0; 276782bf6240SBarry Smith c->icol = 0; 27686ad4291fSHong Zhang c->reallocs = 0; 276917ab2063SBarry Smith 27706ad4291fSHong Zhang C->assembled = PETSC_TRUE; 277117ab2063SBarry Smith 277297f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&c->imax);CHKERRQ(ierr); 277397f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&c->ilen);CHKERRQ(ierr); 277417ab2063SBarry Smith for (i=0; i<m; i++) { 2775416022c9SBarry Smith c->imax[i] = a->imax[i]; 2776416022c9SBarry Smith c->ilen[i] = a->ilen[i]; 277717ab2063SBarry Smith } 277817ab2063SBarry Smith 277917ab2063SBarry Smith /* allocate the matrix space */ 2780a96a251dSBarry Smith ierr = PetscMalloc3(a->i[m],PetscScalar,&c->a,a->i[m],PetscInt,&c->j,m+1,PetscInt,&c->i);CHKERRQ(ierr); 2781f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 278297f1f81fSBarry Smith ierr = PetscMemcpy(c->i,a->i,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 278317ab2063SBarry Smith if (m > 0) { 278497f1f81fSBarry Smith ierr = PetscMemcpy(c->j,a->j,(a->i[m])*sizeof(PetscInt));CHKERRQ(ierr); 2785be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 2786bfeeae90SHong Zhang ierr = PetscMemcpy(c->a,a->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 2787be6bf707SBarry Smith } else { 2788bfeeae90SHong Zhang ierr = PetscMemzero(c->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 278917ab2063SBarry Smith } 279008480c60SBarry Smith } 279117ab2063SBarry Smith 2792416022c9SBarry Smith c->sorted = a->sorted; 27936ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 2794416022c9SBarry Smith c->roworiented = a->roworiented; 2795416022c9SBarry Smith c->nonew = a->nonew; 2796416022c9SBarry Smith if (a->diag) { 279797f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&c->diag);CHKERRQ(ierr); 279852e6d16bSBarry Smith ierr = 
PetscLogObjectMemory(C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 279917ab2063SBarry Smith for (i=0; i<m; i++) { 2800416022c9SBarry Smith c->diag[i] = a->diag[i]; 280117ab2063SBarry Smith } 28023a40ed3dSBarry Smith } else c->diag = 0; 28036ad4291fSHong Zhang c->solve_work = 0; 28046ad4291fSHong Zhang c->saved_values = 0; 28056ad4291fSHong Zhang c->idiag = 0; 28066ad4291fSHong Zhang c->ssor = 0; 28076ad4291fSHong Zhang c->keepzeroedrows = a->keepzeroedrows; 28086ad4291fSHong Zhang c->freedata = PETSC_TRUE; 28096ad4291fSHong Zhang c->xtoy = 0; 28106ad4291fSHong Zhang c->XtoY = 0; 28116ad4291fSHong Zhang 2812416022c9SBarry Smith c->nz = a->nz; 2813416022c9SBarry Smith c->maxnz = a->maxnz; 2814273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2815754ec7b1SSatish Balay 28166ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 28176ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 28186ad4291fSHong Zhang c->compressedrow.checked = a->compressedrow.checked; 28196ad4291fSHong Zhang if ( a->compressedrow.checked && a->compressedrow.use){ 28206ad4291fSHong Zhang i = a->compressedrow.nrows; 28216ad4291fSHong Zhang ierr = PetscMalloc((2*i+1)*sizeof(PetscInt),&c->compressedrow.i);CHKERRQ(ierr); 28226ad4291fSHong Zhang c->compressedrow.rindex = c->compressedrow.i + i + 1; 28236ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.i,a->compressedrow.i,(i+1)*sizeof(PetscInt));CHKERRQ(ierr); 28246ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.rindex,a->compressedrow.rindex,i*sizeof(PetscInt));CHKERRQ(ierr); 282527ea64f8SHong Zhang } else { 282627ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 282727ea64f8SHong Zhang c->compressedrow.i = PETSC_NULL; 282827ea64f8SHong Zhang c->compressedrow.rindex = PETSC_NULL; 28296ad4291fSHong Zhang } 283088e51ccdSHong Zhang C->same_nonzero = A->same_nonzero; 28316ad4291fSHong Zhang 28324846f1f5SKris Buschelman ierr = MatDuplicate_Inode(A,cpvalues,&C);CHKERRQ(ierr); 28334846f1f5SKris Buschelman 
2834416022c9SBarry Smith *B = C; 2835b0a32e0cSBarry Smith ierr = PetscFListDuplicate(A->qlist,&C->qlist);CHKERRQ(ierr); 28363a40ed3dSBarry Smith PetscFunctionReturn(0); 283717ab2063SBarry Smith } 283817ab2063SBarry Smith 28394a2ae208SSatish Balay #undef __FUNCT__ 28404a2ae208SSatish Balay #define __FUNCT__ "MatLoad_SeqAIJ" 2841dfbe8321SBarry Smith PetscErrorCode MatLoad_SeqAIJ(PetscViewer viewer,const MatType type,Mat *A) 284217ab2063SBarry Smith { 2843416022c9SBarry Smith Mat_SeqAIJ *a; 2844416022c9SBarry Smith Mat B; 28456849ba73SBarry Smith PetscErrorCode ierr; 28463c601197SSatish Balay PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N; 284738baddfdSBarry Smith int fd; 284838baddfdSBarry Smith PetscMPIInt size; 2849bcd2baecSBarry Smith MPI_Comm comm; 285017ab2063SBarry Smith 28513a40ed3dSBarry Smith PetscFunctionBegin; 2852e864ced6SBarry Smith ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 2853d132466eSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 285429bbc08cSBarry Smith if (size > 1) SETERRQ(PETSC_ERR_ARG_SIZ,"view must have one processor"); 2855b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 28560752156aSBarry Smith ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 2857552e946dSBarry Smith if (header[0] != MAT_FILE_COOKIE) SETERRQ(PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 285817ab2063SBarry Smith M = header[1]; N = header[2]; nz = header[3]; 285917ab2063SBarry Smith 2860d64ed03dSBarry Smith if (nz < 0) { 286129bbc08cSBarry Smith SETERRQ(PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 2862d64ed03dSBarry Smith } 2863d64ed03dSBarry Smith 286417ab2063SBarry Smith /* read in row lengths */ 286597f1f81fSBarry Smith ierr = PetscMalloc(M*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 28660752156aSBarry Smith ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 286717ab2063SBarry Smith 28683c601197SSatish Balay /* check 
if sum of rowlengths is same as nz */ 28693c601197SSatish Balay for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 28703c601197SSatish Balay if (sum != nz) SETERRQ2(PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. no-nonzeros = %d, sum-row-lengths = %d\n",nz,sum); 28713c601197SSatish Balay 287217ab2063SBarry Smith /* create our matrix */ 2873b3a1e11cSKris Buschelman ierr = MatCreate(comm,PETSC_DECIDE,PETSC_DECIDE,M,N,&B);CHKERRQ(ierr); 2874b3a1e11cSKris Buschelman ierr = MatSetType(B,type);CHKERRQ(ierr); 2875*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(B,0,rowlengths);CHKERRQ(ierr); 2876416022c9SBarry Smith a = (Mat_SeqAIJ*)B->data; 287717ab2063SBarry Smith 287817ab2063SBarry Smith /* read in column indices and adjust for Fortran indexing*/ 28790752156aSBarry Smith ierr = PetscBinaryRead(fd,a->j,nz,PETSC_INT);CHKERRQ(ierr); 288017ab2063SBarry Smith 288117ab2063SBarry Smith /* read in nonzero values */ 28820752156aSBarry Smith ierr = PetscBinaryRead(fd,a->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 288317ab2063SBarry Smith 288417ab2063SBarry Smith /* set matrix "i" values */ 2885efb16452SHong Zhang a->i[0] = 0; 288617ab2063SBarry Smith for (i=1; i<= M; i++) { 2887416022c9SBarry Smith a->i[i] = a->i[i-1] + rowlengths[i-1]; 2888416022c9SBarry Smith a->ilen[i-1] = rowlengths[i-1]; 288917ab2063SBarry Smith } 2890606d414cSSatish Balay ierr = PetscFree(rowlengths);CHKERRQ(ierr); 289117ab2063SBarry Smith 28926d4a8577SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28936d4a8577SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2894b3a1e11cSKris Buschelman *A = B; 28953a40ed3dSBarry Smith PetscFunctionReturn(0); 289617ab2063SBarry Smith } 289717ab2063SBarry Smith 28984a2ae208SSatish Balay #undef __FUNCT__ 2899b9617806SBarry Smith #define __FUNCT__ "MatEqual_SeqAIJ" 2900dfbe8321SBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscTruth* flg) 29017264ac53SSatish Balay { 29027264ac53SSatish Balay Mat_SeqAIJ *a = 
(Mat_SeqAIJ *)A->data,*b = (Mat_SeqAIJ *)B->data; 2903dfbe8321SBarry Smith PetscErrorCode ierr; 29047264ac53SSatish Balay 29053a40ed3dSBarry Smith PetscFunctionBegin; 2906bfeeae90SHong Zhang /* If the matrix dimensions or the number of nonzeros differ, the matrices are not equal */ 2907bfeeae90SHong Zhang if ((A->m != B->m) || (A->n != B->n) ||(a->nz != b->nz)) { 2908ca44d042SBarry Smith *flg = PETSC_FALSE; 2909ca44d042SBarry Smith PetscFunctionReturn(0); 2910bcd2baecSBarry Smith } 29117264ac53SSatish Balay 29127264ac53SSatish Balay /* if the a->i are the same */ 291397f1f81fSBarry Smith ierr = PetscMemcmp(a->i,b->i,(A->m+1)*sizeof(PetscInt),flg);CHKERRQ(ierr); 2914abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 29157264ac53SSatish Balay 29167264ac53SSatish Balay /* if a->j are the same */ 291797f1f81fSBarry Smith ierr = PetscMemcmp(a->j,b->j,(a->nz)*sizeof(PetscInt),flg);CHKERRQ(ierr); 2918abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 2919bcd2baecSBarry Smith 2920bcd2baecSBarry Smith /* if a->a are the same */ 292187828ca2SBarry Smith ierr = PetscMemcmp(a->a,b->a,(a->nz)*sizeof(PetscScalar),flg);CHKERRQ(ierr); 29220f5bd95cSBarry Smith 29233a40ed3dSBarry Smith PetscFunctionReturn(0); 29247264ac53SSatish Balay 29257264ac53SSatish Balay } 292636db0b34SBarry Smith 29274a2ae208SSatish Balay #undef __FUNCT__ 29284a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJWithArrays" 292936db0b34SBarry Smith /*@C 293036db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates a sequential AIJ matrix using matrix elements (in CSR format) 293136db0b34SBarry Smith provided by the user. 293236db0b34SBarry Smith 293336db0b34SBarry Smith Collective on MPI_Comm 293436db0b34SBarry Smith 293536db0b34SBarry Smith Input Parameters: 293636db0b34SBarry Smith + comm - must be an MPI communicator of size 1 293736db0b34SBarry Smith . m - number of rows 293836db0b34SBarry Smith . n - number of columns 293936db0b34SBarry Smith . i - row indices 294036db0b34SBarry Smith . 
j - column indices 294136db0b34SBarry Smith - a - matrix values 294236db0b34SBarry Smith 294336db0b34SBarry Smith Output Parameter: 294436db0b34SBarry Smith . mat - the matrix 294536db0b34SBarry Smith 294636db0b34SBarry Smith Level: intermediate 294736db0b34SBarry Smith 294836db0b34SBarry Smith Notes: 29490551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 295036db0b34SBarry Smith once the matrix is destroyed 295136db0b34SBarry Smith 295236db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 295336db0b34SBarry Smith 2954bfeeae90SHong Zhang The i and j indices are 0 based 295536db0b34SBarry Smith 295636db0b34SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatCreateSeqAIJ() 295736db0b34SBarry Smith 295836db0b34SBarry Smith @*/ 2959be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt* i,PetscInt*j,PetscScalar *a,Mat *mat) 296036db0b34SBarry Smith { 2961dfbe8321SBarry Smith PetscErrorCode ierr; 296297f1f81fSBarry Smith PetscInt ii; 296336db0b34SBarry Smith Mat_SeqAIJ *aij; 296436db0b34SBarry Smith 296536db0b34SBarry Smith PetscFunctionBegin; 2966a96a251dSBarry Smith if (i[0]) { 2967634064b4SBarry Smith SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 296836db0b34SBarry Smith } 2969*ab93d7beSBarry Smith ierr = MatCreate(comm,m,n,m,n,mat);CHKERRQ(ierr); 2970*ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 2971*ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 2972*ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 2973*ab93d7beSBarry Smith ierr = PetscMalloc2(m,PetscInt,&aij->imax,m,PetscInt,&aij->ilen);CHKERRQ(ierr); 2974*ab93d7beSBarry Smith 297536db0b34SBarry Smith aij->i = i; 297636db0b34SBarry Smith aij->j = j; 297736db0b34SBarry Smith aij->a = a; 297836db0b34SBarry Smith 
aij->singlemalloc = PETSC_FALSE; 297936db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 298036db0b34SBarry Smith aij->freedata = PETSC_FALSE; 298136db0b34SBarry Smith 298236db0b34SBarry Smith for (ii=0; ii<m; ii++) { 298336db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 29842515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 298579a5c55eSBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %d length = %d",ii,i[ii+1] - i[ii]); 298636db0b34SBarry Smith #endif 298736db0b34SBarry Smith } 29882515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 298936db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 299079a5c55eSBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %d index = %d",ii,j[ii]); 299179a5c55eSBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %d index = %d",ii,j[ii]); 299236db0b34SBarry Smith } 299336db0b34SBarry Smith #endif 299436db0b34SBarry Smith 2995b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2996b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 299736db0b34SBarry Smith PetscFunctionReturn(0); 299836db0b34SBarry Smith } 299936db0b34SBarry Smith 3000cc8ba8e1SBarry Smith #undef __FUNCT__ 3001ee4f033dSBarry Smith #define __FUNCT__ "MatSetColoring_SeqAIJ" 3002dfbe8321SBarry Smith PetscErrorCode MatSetColoring_SeqAIJ(Mat A,ISColoring coloring) 3003cc8ba8e1SBarry Smith { 3004dfbe8321SBarry Smith PetscErrorCode ierr; 3005cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 300636db0b34SBarry Smith 3007cc8ba8e1SBarry Smith PetscFunctionBegin; 300812c595b3SBarry Smith if (coloring->ctype == IS_COLORING_LOCAL) { 3009cc8ba8e1SBarry Smith ierr = ISColoringReference(coloring);CHKERRQ(ierr); 3010cc8ba8e1SBarry Smith a->coloring = 
coloring; 301112c595b3SBarry Smith } else if (coloring->ctype == IS_COLORING_GHOSTED) { 301297f1f81fSBarry Smith PetscInt i,*larray; 301312c595b3SBarry Smith ISColoring ocoloring; 301408b6dcc0SBarry Smith ISColoringValue *colors; 301512c595b3SBarry Smith 301612c595b3SBarry Smith /* set coloring for diagonal portion */ 301797f1f81fSBarry Smith ierr = PetscMalloc((A->n+1)*sizeof(PetscInt),&larray);CHKERRQ(ierr); 301812c595b3SBarry Smith for (i=0; i<A->n; i++) { 301912c595b3SBarry Smith larray[i] = i; 302012c595b3SBarry Smith } 302112c595b3SBarry Smith ierr = ISGlobalToLocalMappingApply(A->mapping,IS_GTOLM_MASK,A->n,larray,PETSC_NULL,larray);CHKERRQ(ierr); 302208b6dcc0SBarry Smith ierr = PetscMalloc((A->n+1)*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 302312c595b3SBarry Smith for (i=0; i<A->n; i++) { 302412c595b3SBarry Smith colors[i] = coloring->colors[larray[i]]; 302512c595b3SBarry Smith } 302612c595b3SBarry Smith ierr = PetscFree(larray);CHKERRQ(ierr); 302712c595b3SBarry Smith ierr = ISColoringCreate(PETSC_COMM_SELF,A->n,colors,&ocoloring);CHKERRQ(ierr); 302812c595b3SBarry Smith a->coloring = ocoloring; 302912c595b3SBarry Smith } 3030cc8ba8e1SBarry Smith PetscFunctionReturn(0); 3031cc8ba8e1SBarry Smith } 3032cc8ba8e1SBarry Smith 3033dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 3034ee4f033dSBarry Smith EXTERN_C_BEGIN 303529c1e371SBarry Smith #include "adic/ad_utils.h" 3036ee4f033dSBarry Smith EXTERN_C_END 3037cc8ba8e1SBarry Smith 3038cc8ba8e1SBarry Smith #undef __FUNCT__ 3039ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdic_SeqAIJ" 3040dfbe8321SBarry Smith PetscErrorCode MatSetValuesAdic_SeqAIJ(Mat A,void *advalues) 3041cc8ba8e1SBarry Smith { 3042cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 304397f1f81fSBarry Smith PetscInt m = A->m,*ii = a->i,*jj = a->j,nz,i,j,nlen; 30444440f671SBarry Smith PetscScalar *v = a->a,*values = ((PetscScalar*)advalues)+1; 304508b6dcc0SBarry Smith ISColoringValue *color; 3046cc8ba8e1SBarry Smith 
3047cc8ba8e1SBarry Smith PetscFunctionBegin; 3048e005ede5SBarry Smith if (!a->coloring) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 30494440f671SBarry Smith nlen = PetscADGetDerivTypeSize()/sizeof(PetscScalar); 3050cc8ba8e1SBarry Smith color = a->coloring->colors; 3051cc8ba8e1SBarry Smith /* loop over rows */ 3052cc8ba8e1SBarry Smith for (i=0; i<m; i++) { 3053cc8ba8e1SBarry Smith nz = ii[i+1] - ii[i]; 3054cc8ba8e1SBarry Smith /* loop over columns putting computed value into matrix */ 3055cc8ba8e1SBarry Smith for (j=0; j<nz; j++) { 3056cc8ba8e1SBarry Smith *v++ = values[color[*jj++]]; 3057cc8ba8e1SBarry Smith } 30584440f671SBarry Smith values += nlen; /* jump to next row of derivatives */ 3059ee4f033dSBarry Smith } 3060ee4f033dSBarry Smith PetscFunctionReturn(0); 3061ee4f033dSBarry Smith } 3062ee4f033dSBarry Smith #endif 3063ee4f033dSBarry Smith 3064ee4f033dSBarry Smith #undef __FUNCT__ 3065ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdifor_SeqAIJ" 306697f1f81fSBarry Smith PetscErrorCode MatSetValuesAdifor_SeqAIJ(Mat A,PetscInt nl,void *advalues) 3067ee4f033dSBarry Smith { 3068ee4f033dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 306997f1f81fSBarry Smith PetscInt m = A->m,*ii = a->i,*jj = a->j,nz,i,j; 307087828ca2SBarry Smith PetscScalar *v = a->a,*values = (PetscScalar *)advalues; 307108b6dcc0SBarry Smith ISColoringValue *color; 3072ee4f033dSBarry Smith 3073ee4f033dSBarry Smith PetscFunctionBegin; 3074e005ede5SBarry Smith if (!a->coloring) SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 3075ee4f033dSBarry Smith color = a->coloring->colors; 3076ee4f033dSBarry Smith /* loop over rows */ 3077ee4f033dSBarry Smith for (i=0; i<m; i++) { 3078ee4f033dSBarry Smith nz = ii[i+1] - ii[i]; 3079ee4f033dSBarry Smith /* loop over columns putting computed value into matrix */ 3080ee4f033dSBarry Smith for (j=0; j<nz; j++) { 3081ee4f033dSBarry Smith *v++ = values[color[*jj++]]; 3082ee4f033dSBarry Smith } 3083ee4f033dSBarry Smith 
values += nl; /* jump to next row of derivatives */ 3084cc8ba8e1SBarry Smith } 3085cc8ba8e1SBarry Smith PetscFunctionReturn(0); 3086cc8ba8e1SBarry Smith } 308736db0b34SBarry Smith 3088