1b377110cSBarry Smith 2d5d45c9bSBarry Smith /* 33369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 4d5d45c9bSBarry Smith matrix storage format. 5d5d45c9bSBarry Smith */ 63369ce9aSBarry Smith 77c4f633dSBarry Smith 8c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 9c6db04a5SJed Brown #include <petscblaslapack.h> 10c6db04a5SJed Brown #include <petscbt.h> 1117ab2063SBarry Smith 120716a85fSBarry Smith 130716a85fSBarry Smith #undef __FUNCT__ 140716a85fSBarry Smith #define __FUNCT__ "MatGetColumnNorms_SeqAIJ" 150716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 160716a85fSBarry Smith { 170716a85fSBarry Smith PetscErrorCode ierr; 180716a85fSBarry Smith PetscInt i,m,n; 190716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 200716a85fSBarry Smith 210716a85fSBarry Smith PetscFunctionBegin; 220716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 230716a85fSBarry Smith ierr = PetscMemzero(norms,n*sizeof(PetscReal));CHKERRQ(ierr); 240716a85fSBarry Smith if (type == NORM_2) { 250716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 260716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 270716a85fSBarry Smith } 280716a85fSBarry Smith } else if (type == NORM_1) { 290716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 300716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 310716a85fSBarry Smith } 320716a85fSBarry Smith } else if (type == NORM_INFINITY) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 340716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 370716a85fSBarry Smith 380716a85fSBarry Smith if (type == NORM_2) { 398f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith 
PetscFunctionReturn(0); 420716a85fSBarry Smith } 430716a85fSBarry Smith 444a2ae208SSatish Balay #undef __FUNCT__ 456ce1633cSBarry Smith #define __FUNCT__ "MatFindZeroDiagonals_SeqAIJ" 466ce1633cSBarry Smith PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 476ce1633cSBarry Smith { 486ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 496ce1633cSBarry Smith const MatScalar *aa = a->a; 506ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 516ce1633cSBarry Smith const PetscInt *jj = a->j,*diag; 526ce1633cSBarry Smith PetscInt *rows; 536ce1633cSBarry Smith PetscErrorCode ierr; 546ce1633cSBarry Smith 556ce1633cSBarry Smith PetscFunctionBegin; 566ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 576ce1633cSBarry Smith diag = a->diag; 586ce1633cSBarry Smith for (i=0; i<m; i++) { 596ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 606ce1633cSBarry Smith cnt++; 616ce1633cSBarry Smith } 626ce1633cSBarry Smith } 636ce1633cSBarry Smith ierr = PetscMalloc(cnt*sizeof(PetscInt),&rows);CHKERRQ(ierr); 646ce1633cSBarry Smith cnt = 0; 656ce1633cSBarry Smith for (i=0; i<m; i++) { 666ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 676ce1633cSBarry Smith rows[cnt++] = i; 686ce1633cSBarry Smith } 696ce1633cSBarry Smith } 706ce1633cSBarry Smith ierr = ISCreateGeneral(((PetscObject)A)->comm,cnt,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 716ce1633cSBarry Smith PetscFunctionReturn(0); 726ce1633cSBarry Smith } 736ce1633cSBarry Smith 746ce1633cSBarry Smith #undef __FUNCT__ 75b3a44c85SBarry Smith #define __FUNCT__ "MatFindNonzeroRows_SeqAIJ" 76b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 77b3a44c85SBarry Smith { 78b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 79b3a44c85SBarry Smith const MatScalar *aa; 80b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 81b3a44c85SBarry Smith const PetscInt *ii; 82b3a44c85SBarry Smith PetscInt n,i,j,*rows; 83b3a44c85SBarry Smith 
PetscErrorCode ierr; 84b3a44c85SBarry Smith 85b3a44c85SBarry Smith PetscFunctionBegin; 86b3a44c85SBarry Smith *keptrows = 0; 87b3a44c85SBarry Smith ii = a->i; 88b3a44c85SBarry Smith for (i=0; i<m; i++) { 89b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 90b3a44c85SBarry Smith if (!n) { 91b3a44c85SBarry Smith cnt++; 92b3a44c85SBarry Smith goto ok1; 93b3a44c85SBarry Smith } 94b3a44c85SBarry Smith aa = a->a + ii[i]; 95b3a44c85SBarry Smith for (j=0; j<n; j++) { 96b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 97b3a44c85SBarry Smith } 98b3a44c85SBarry Smith cnt++; 99b3a44c85SBarry Smith ok1:; 100b3a44c85SBarry Smith } 101b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 102b3a44c85SBarry Smith ierr = PetscMalloc((A->rmap->n-cnt)*sizeof(PetscInt),&rows);CHKERRQ(ierr); 103b3a44c85SBarry Smith cnt = 0; 104b3a44c85SBarry Smith for (i=0; i<m; i++) { 105b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 106b3a44c85SBarry Smith if (!n) continue; 107b3a44c85SBarry Smith aa = a->a + ii[i]; 108b3a44c85SBarry Smith for (j=0; j<n; j++) { 109b3a44c85SBarry Smith if (aa[j] != 0.0) { 110b3a44c85SBarry Smith rows[cnt++] = i; 111b3a44c85SBarry Smith break; 112b3a44c85SBarry Smith } 113b3a44c85SBarry Smith } 114b3a44c85SBarry Smith } 115b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 116b3a44c85SBarry Smith PetscFunctionReturn(0); 117b3a44c85SBarry Smith } 118b3a44c85SBarry Smith 119b3a44c85SBarry Smith #undef __FUNCT__ 12079299369SBarry Smith #define __FUNCT__ "MatDiagonalSet_SeqAIJ" 1217087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 12279299369SBarry Smith { 12379299369SBarry Smith PetscErrorCode ierr; 12479299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 125d0f46423SBarry Smith PetscInt i,*diag, m = Y->rmap->n; 12654f21887SBarry Smith MatScalar *aa = aij->a; 12754f21887SBarry Smith PetscScalar *v; 128ace3abfcSBarry Smith PetscBool missing; 12979299369SBarry Smith 13079299369SBarry 
Smith PetscFunctionBegin; 13109f38230SBarry Smith if (Y->assembled) { 13209f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,PETSC_NULL);CHKERRQ(ierr); 13309f38230SBarry Smith if (!missing) { 13479299369SBarry Smith diag = aij->diag; 13579299369SBarry Smith ierr = VecGetArray(D,&v);CHKERRQ(ierr); 13679299369SBarry Smith if (is == INSERT_VALUES) { 13779299369SBarry Smith for (i=0; i<m; i++) { 13879299369SBarry Smith aa[diag[i]] = v[i]; 13979299369SBarry Smith } 14079299369SBarry Smith } else { 14179299369SBarry Smith for (i=0; i<m; i++) { 14279299369SBarry Smith aa[diag[i]] += v[i]; 14379299369SBarry Smith } 14479299369SBarry Smith } 14579299369SBarry Smith ierr = VecRestoreArray(D,&v);CHKERRQ(ierr); 14679299369SBarry Smith PetscFunctionReturn(0); 14779299369SBarry Smith } 14809f38230SBarry Smith } 14909f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 15009f38230SBarry Smith PetscFunctionReturn(0); 15109f38230SBarry Smith } 15279299369SBarry Smith 15379299369SBarry Smith #undef __FUNCT__ 1544a2ae208SSatish Balay #define __FUNCT__ "MatGetRowIJ_SeqAIJ" 155ace3abfcSBarry Smith PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 15617ab2063SBarry Smith { 157416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 158dfbe8321SBarry Smith PetscErrorCode ierr; 15997f1f81fSBarry Smith PetscInt i,ishift; 16017ab2063SBarry Smith 1613a40ed3dSBarry Smith PetscFunctionBegin; 162d0f46423SBarry Smith *m = A->rmap->n; 1633a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 164bfeeae90SHong Zhang ishift = 0; 16553e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 166d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,ishift,oshift,ia,ja);CHKERRQ(ierr); 167bfeeae90SHong Zhang } else if (oshift == 1) { 168d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 1693b2fbd54SBarry Smith /* malloc space and add 
1 to i and j indices */ 170d0f46423SBarry Smith ierr = PetscMalloc((A->rmap->n+1)*sizeof(PetscInt),ia);CHKERRQ(ierr); 171d0f46423SBarry Smith for (i=0; i<A->rmap->n+1; i++) (*ia)[i] = a->i[i] + 1; 172ecc77c7aSBarry Smith if (ja) { 17397f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),ja);CHKERRQ(ierr); 1743b2fbd54SBarry Smith for (i=0; i<nz; i++) (*ja)[i] = a->j[i] + 1; 175ecc77c7aSBarry Smith } 1766945ee14SBarry Smith } else { 177ecc77c7aSBarry Smith *ia = a->i; 178ecc77c7aSBarry Smith if (ja) *ja = a->j; 179a2ce50c7SBarry Smith } 1803a40ed3dSBarry Smith PetscFunctionReturn(0); 181a2744918SBarry Smith } 182a2744918SBarry Smith 1834a2ae208SSatish Balay #undef __FUNCT__ 1844a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRowIJ_SeqAIJ" 185ace3abfcSBarry Smith PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 1866945ee14SBarry Smith { 187dfbe8321SBarry Smith PetscErrorCode ierr; 1886945ee14SBarry Smith 1893a40ed3dSBarry Smith PetscFunctionBegin; 1903a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 191bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 192606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 193ecc77c7aSBarry Smith if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 194bcd2baecSBarry Smith } 1953a40ed3dSBarry Smith PetscFunctionReturn(0); 19617ab2063SBarry Smith } 19717ab2063SBarry Smith 1984a2ae208SSatish Balay #undef __FUNCT__ 1994a2ae208SSatish Balay #define __FUNCT__ "MatGetColumnIJ_SeqAIJ" 200ace3abfcSBarry Smith PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2013b2fbd54SBarry Smith { 2023b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 203dfbe8321SBarry Smith PetscErrorCode ierr; 204d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = 
A->rmap->n; 20597f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2063b2fbd54SBarry Smith 2073a40ed3dSBarry Smith PetscFunctionBegin; 208899cda47SBarry Smith *nn = n; 2093a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2103b2fbd54SBarry Smith if (symmetric) { 211d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,0,oshift,ia,ja);CHKERRQ(ierr); 2123b2fbd54SBarry Smith } else { 21397f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&collengths);CHKERRQ(ierr); 21497f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 21597f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&cia);CHKERRQ(ierr); 21697f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),&cja);CHKERRQ(ierr); 2173b2fbd54SBarry Smith jj = a->j; 2183b2fbd54SBarry Smith for (i=0; i<nz; i++) { 219bfeeae90SHong Zhang collengths[jj[i]]++; 2203b2fbd54SBarry Smith } 2213b2fbd54SBarry Smith cia[0] = oshift; 2223b2fbd54SBarry Smith for (i=0; i<n; i++) { 2233b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2243b2fbd54SBarry Smith } 22597f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 2263b2fbd54SBarry Smith jj = a->j; 227a93ec695SBarry Smith for (row=0; row<m; row++) { 228a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 229a93ec695SBarry Smith for (i=0; i<mr; i++) { 230bfeeae90SHong Zhang col = *jj++; 2313b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2323b2fbd54SBarry Smith } 2333b2fbd54SBarry Smith } 234606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 2353b2fbd54SBarry Smith *ia = cia; *ja = cja; 2363b2fbd54SBarry Smith } 2373a40ed3dSBarry Smith PetscFunctionReturn(0); 2383b2fbd54SBarry Smith } 2393b2fbd54SBarry Smith 2404a2ae208SSatish Balay #undef __FUNCT__ 2414a2ae208SSatish Balay #define __FUNCT__ "MatRestoreColumnIJ_SeqAIJ" 242ace3abfcSBarry Smith PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool 
symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2433b2fbd54SBarry Smith { 244dfbe8321SBarry Smith PetscErrorCode ierr; 245606d414cSSatish Balay 2463a40ed3dSBarry Smith PetscFunctionBegin; 2473a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2483b2fbd54SBarry Smith 249606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 250606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 2513b2fbd54SBarry Smith 2523a40ed3dSBarry Smith PetscFunctionReturn(0); 2533b2fbd54SBarry Smith } 2543b2fbd54SBarry Smith 25587d4246cSBarry Smith #undef __FUNCT__ 25687d4246cSBarry Smith #define __FUNCT__ "MatSetValuesRow_SeqAIJ" 25787d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 25887d4246cSBarry Smith { 25987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 26087d4246cSBarry Smith PetscInt *ai = a->i; 26187d4246cSBarry Smith PetscErrorCode ierr; 26287d4246cSBarry Smith 26387d4246cSBarry Smith PetscFunctionBegin; 26487d4246cSBarry Smith ierr = PetscMemcpy(a->a+ai[row],v,(ai[row+1]-ai[row])*sizeof(PetscScalar));CHKERRQ(ierr); 26587d4246cSBarry Smith PetscFunctionReturn(0); 26687d4246cSBarry Smith } 26787d4246cSBarry Smith 2684a2ae208SSatish Balay #undef __FUNCT__ 2694a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqAIJ" 27097f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 27117ab2063SBarry Smith { 272416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 273e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 27497f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 2756849ba73SBarry Smith PetscErrorCode ierr; 276e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 27754f21887SBarry Smith MatScalar *ap,value,*aa = a->a; 278ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 
279ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 28017ab2063SBarry Smith 2813a40ed3dSBarry Smith PetscFunctionBegin; 28271fd2e92SBarry Smith if (v) PetscValidScalarPointer(v,6); 28317ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 284416022c9SBarry Smith row = im[k]; 2855ef9f2a5SBarry Smith if (row < 0) continue; 2862515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 287e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 2883b2fbd54SBarry Smith #endif 289bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 29017ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 291416022c9SBarry Smith low = 0; 292c71e6ed7SBarry Smith high = nrow; 29317ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 2945ef9f2a5SBarry Smith if (in[l] < 0) continue; 2952515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 296e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 2973b2fbd54SBarry Smith #endif 298bfeeae90SHong Zhang col = in[l]; 29916371a99SBarry Smith if (v) { 3004b0e389bSBarry Smith if (roworiented) { 3015ef9f2a5SBarry Smith value = v[l + k*n]; 302bef8e0ddSBarry Smith } else { 3034b0e389bSBarry Smith value = v[k + l*m]; 3044b0e389bSBarry Smith } 30516371a99SBarry Smith } else { 30675567043SBarry Smith value = 0.; 30716371a99SBarry Smith } 308abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 30936db0b34SBarry Smith 3107cd84e04SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 311e2ee6c50SBarry Smith lastcol = col; 312416022c9SBarry Smith while (high-low > 5) { 313416022c9SBarry Smith t = (low+high)/2; 314416022c9SBarry Smith if (rp[t] > col) high = t; 315416022c9SBarry Smith else low = t; 31617ab2063SBarry Smith } 317416022c9SBarry Smith for (i=low; i<high; i++) { 31817ab2063SBarry Smith 
if (rp[i] > col) break; 31917ab2063SBarry Smith if (rp[i] == col) { 320416022c9SBarry Smith if (is == ADD_VALUES) ap[i] += value; 32117ab2063SBarry Smith else ap[i] = value; 322e44c0bd4SBarry Smith low = i + 1; 32317ab2063SBarry Smith goto noinsert; 32417ab2063SBarry Smith } 32517ab2063SBarry Smith } 326abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 327c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 328e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 329fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 330c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 331416022c9SBarry Smith /* shift up all the later entries in this row */ 332416022c9SBarry Smith for (ii=N; ii>=i; ii--) { 33317ab2063SBarry Smith rp[ii+1] = rp[ii]; 33417ab2063SBarry Smith ap[ii+1] = ap[ii]; 33517ab2063SBarry Smith } 33617ab2063SBarry Smith rp[i] = col; 33717ab2063SBarry Smith ap[i] = value; 338416022c9SBarry Smith low = i + 1; 339e44c0bd4SBarry Smith noinsert:; 34017ab2063SBarry Smith } 34117ab2063SBarry Smith ailen[row] = nrow; 34217ab2063SBarry Smith } 34388e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 3443a40ed3dSBarry Smith PetscFunctionReturn(0); 34517ab2063SBarry Smith } 34617ab2063SBarry Smith 34781824310SBarry Smith 3484a2ae208SSatish Balay #undef __FUNCT__ 3494a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqAIJ" 350a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 3517eb43aa7SLois Curfman McInnes { 3527eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35397f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 35497f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 35554f21887SBarry Smith MatScalar *ap,*aa = a->a; 3567eb43aa7SLois Curfman 
McInnes 3573a40ed3dSBarry Smith PetscFunctionBegin; 3587eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 3597eb43aa7SLois Curfman McInnes row = im[k]; 360e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 361e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 362bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 3637eb43aa7SLois Curfman McInnes nrow = ailen[row]; 3647eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 365e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 366e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 367bfeeae90SHong Zhang col = in[l] ; 3687eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 3697eb43aa7SLois Curfman McInnes while (high-low > 5) { 3707eb43aa7SLois Curfman McInnes t = (low+high)/2; 3717eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 3727eb43aa7SLois Curfman McInnes else low = t; 3737eb43aa7SLois Curfman McInnes } 3747eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 3757eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 3767eb43aa7SLois Curfman McInnes if (rp[i] == col) { 377b49de8d1SLois Curfman McInnes *v++ = ap[i]; 3787eb43aa7SLois Curfman McInnes goto finished; 3797eb43aa7SLois Curfman McInnes } 3807eb43aa7SLois Curfman McInnes } 38197e567efSBarry Smith *v++ = 0.0; 3827eb43aa7SLois Curfman McInnes finished:; 3837eb43aa7SLois Curfman McInnes } 3847eb43aa7SLois Curfman McInnes } 3853a40ed3dSBarry Smith PetscFunctionReturn(0); 3867eb43aa7SLois Curfman McInnes } 3877eb43aa7SLois Curfman McInnes 38817ab2063SBarry Smith 3894a2ae208SSatish Balay #undef __FUNCT__ 3904a2ae208SSatish 
Balay #define __FUNCT__ "MatView_SeqAIJ_Binary" 391dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer) 39217ab2063SBarry Smith { 393416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3946849ba73SBarry Smith PetscErrorCode ierr; 3956f69ff64SBarry Smith PetscInt i,*col_lens; 3966f69ff64SBarry Smith int fd; 39717ab2063SBarry Smith 3983a40ed3dSBarry Smith PetscFunctionBegin; 399b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 400d0f46423SBarry Smith ierr = PetscMalloc((4+A->rmap->n)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 4010700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 402d0f46423SBarry Smith col_lens[1] = A->rmap->n; 403d0f46423SBarry Smith col_lens[2] = A->cmap->n; 404416022c9SBarry Smith col_lens[3] = a->nz; 405416022c9SBarry Smith 406416022c9SBarry Smith /* store lengths of each row and write (including header) to file */ 407d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 408416022c9SBarry Smith col_lens[4+i] = a->i[i+1] - a->i[i]; 40917ab2063SBarry Smith } 410d0f46423SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+A->rmap->n,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 411606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 412416022c9SBarry Smith 413416022c9SBarry Smith /* store column indices (zero start index) */ 4146f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 415416022c9SBarry Smith 416416022c9SBarry Smith /* store nonzero values */ 4176f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 4183a40ed3dSBarry Smith PetscFunctionReturn(0); 41917ab2063SBarry Smith } 420416022c9SBarry Smith 42109573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 422cd155464SBarry Smith 4234a2ae208SSatish Balay #undef __FUNCT__ 4244a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_ASCII" 425dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat 
A,PetscViewer viewer) 426416022c9SBarry Smith { 427416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 428dfbe8321SBarry Smith PetscErrorCode ierr; 429d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,shift=0; 430e060cb09SBarry Smith const char *name; 431f3ef73ceSBarry Smith PetscViewerFormat format; 43217ab2063SBarry Smith 4333a40ed3dSBarry Smith PetscFunctionBegin; 434b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 43571c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 43697f1f81fSBarry Smith PetscInt nofinalvalue = 0; 437d0f46423SBarry Smith if ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-!shift)) { 438d00d2cf4SBarry Smith nofinalvalue = 1; 439d00d2cf4SBarry Smith } 440d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 441d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 44277431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 44377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 444b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 44517ab2063SBarry Smith 44617ab2063SBarry Smith for (i=0; i<m; i++) { 447416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 448aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 44977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e + %18.16ei \n",i+1,a->j[j]+!shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 45017ab2063SBarry Smith #else 45177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+!shift,a->a[j]);CHKERRQ(ierr); 45217ab2063SBarry Smith #endif 45317ab2063SBarry Smith } 45417ab2063SBarry Smith } 455d00d2cf4SBarry Smith if (nofinalvalue) { 456d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D 
%18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 457d00d2cf4SBarry Smith } 458317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 459fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 460d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 46168369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 462cd155464SBarry Smith PetscFunctionReturn(0); 463fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 464d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4657566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 46644cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 46777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 46844cd7ae7SLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 469aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 47036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 471a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 473a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47436db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 475a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 4766831982aSBarry Smith } 47744cd7ae7SLois Curfman McInnes #else 478a83599f4SBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) 
",a->j[j]+shift,a->a[j]);CHKERRQ(ierr);} 47944cd7ae7SLois Curfman McInnes #endif 48044cd7ae7SLois Curfman McInnes } 481b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 48244cd7ae7SLois Curfman McInnes } 483d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 484fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 48597f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 486d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4877566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 48897f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&sptr);CHKERRQ(ierr); 489496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 490496be53dSLois Curfman McInnes sptr[i] = nzd+1; 491496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 492496be53dSLois Curfman McInnes if (a->j[j] >= i) { 493aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 49436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 495496be53dSLois Curfman McInnes #else 496496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 497496be53dSLois Curfman McInnes #endif 498496be53dSLois Curfman McInnes } 499496be53dSLois Curfman McInnes } 500496be53dSLois Curfman McInnes } 5012e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 50277431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 5032e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 50477431f27SBarry Smith if (i+4<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr);} 50577431f27SBarry Smith else if (i+3<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr);} 50677431f27SBarry Smith else if (i+2<m) {ierr = 
PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr);} 50777431f27SBarry Smith else if (i+1<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr);} 50877431f27SBarry Smith else if (i<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr);} 50977431f27SBarry Smith else {ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr);} 510496be53dSLois Curfman McInnes } 511b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 512606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 513496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 514496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 51577431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 516496be53dSLois Curfman McInnes } 517b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 518496be53dSLois Curfman McInnes } 519b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 520496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 521496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 522496be53dSLois Curfman McInnes if (a->j[j] >= i) { 523aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 52436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 525b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5266831982aSBarry Smith } 527496be53dSLois Curfman McInnes #else 528b0a32e0cSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",a->a[j]);CHKERRQ(ierr);} 529496be53dSLois Curfman McInnes #endif 530496be53dSLois Curfman McInnes } 531496be53dSLois Curfman McInnes } 532b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 
533496be53dSLois Curfman McInnes } 534d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 535fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 53697f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 53787828ca2SBarry Smith PetscScalar value; 53802594712SBarry Smith 539d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5407566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 54102594712SBarry Smith for (i=0; i<m; i++) { 54202594712SBarry Smith jcnt = 0; 543d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 544e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 54502594712SBarry Smith value = a->a[cnt++]; 546e24b481bSBarry Smith jcnt++; 54702594712SBarry Smith } else { 54802594712SBarry Smith value = 0.0; 54902594712SBarry Smith } 550aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 551b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",PetscRealPart(value),PetscImaginaryPart(value));CHKERRQ(ierr); 55202594712SBarry Smith #else 553b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",value);CHKERRQ(ierr); 55402594712SBarry Smith #endif 55502594712SBarry Smith } 556b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 55702594712SBarry Smith } 558d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5593c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 560d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5617566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 5623c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5633c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%%matrix complex general\n");CHKERRQ(ierr); 5643c215bfdSMatthew Knepley #else 
5653c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%%matrix real general\n");CHKERRQ(ierr); 5663c215bfdSMatthew Knepley #endif 567d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 5683c215bfdSMatthew Knepley for (i=0; i<m; i++) { 5693c215bfdSMatthew Knepley for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 5703c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5713c215bfdSMatthew Knepley if (PetscImaginaryPart(a->a[j]) > 0.0) { 5723c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5733c215bfdSMatthew Knepley } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 5743c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G -%G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5753c215bfdSMatthew Knepley } else { 5763c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 5773c215bfdSMatthew Knepley } 5783c215bfdSMatthew Knepley #else 5793c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %G\n", i+shift, a->j[j]+shift, a->a[j]);CHKERRQ(ierr); 5803c215bfdSMatthew Knepley #endif 5813c215bfdSMatthew Knepley } 5823c215bfdSMatthew Knepley } 583d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5843a40ed3dSBarry Smith } else { 585d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5867566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 587d5f3da31SBarry Smith if (A->factortype){ 58816cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 58916cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 59016cd7e1dSShri Abhyankar /* L part */ 59116cd7e1dSShri Abhyankar for 
(j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 59216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 59316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 59416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 59616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59716cd7e1dSShri Abhyankar } else { 59816cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 59916cd7e1dSShri Abhyankar } 60016cd7e1dSShri Abhyankar #else 60116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 60216cd7e1dSShri Abhyankar #endif 60316cd7e1dSShri Abhyankar } 60416cd7e1dSShri Abhyankar /* diagonal */ 60516cd7e1dSShri Abhyankar j = a->diag[i]; 60616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 60716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 6082c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 60916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 6102c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),-PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 61116cd7e1dSShri Abhyankar } else { 6122c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 61316cd7e1dSShri Abhyankar } 61416cd7e1dSShri Abhyankar #else 6152c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,1.0/a->a[j]);CHKERRQ(ierr); 61616cd7e1dSShri Abhyankar #endif 61716cd7e1dSShri 
Abhyankar 61816cd7e1dSShri Abhyankar /* U part */ 61916cd7e1dSShri Abhyankar for (j=a->diag[i+1]+1+shift; j<a->diag[i]+shift; j++) { 62016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 62116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 62216cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 62416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62516cd7e1dSShri Abhyankar } else { 62616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 62716cd7e1dSShri Abhyankar } 62816cd7e1dSShri Abhyankar #else 62916cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 63016cd7e1dSShri Abhyankar #endif 63116cd7e1dSShri Abhyankar } 63216cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 63316cd7e1dSShri Abhyankar } 63416cd7e1dSShri Abhyankar } else { 63517ab2063SBarry Smith for (i=0; i<m; i++) { 63677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 637416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 638aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 63936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 640a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 64136db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 642a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 6433a40ed3dSBarry Smith } else { 644a83599f4SBarry Smith 
ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 64517ab2063SBarry Smith } 64617ab2063SBarry Smith #else 647a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 64817ab2063SBarry Smith #endif 64917ab2063SBarry Smith } 650b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 65117ab2063SBarry Smith } 65216cd7e1dSShri Abhyankar } 653d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 65417ab2063SBarry Smith } 655b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 6563a40ed3dSBarry Smith PetscFunctionReturn(0); 657416022c9SBarry Smith } 658416022c9SBarry Smith 6594a2ae208SSatish Balay #undef __FUNCT__ 6604a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw_Zoom" 661dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 662416022c9SBarry Smith { 663480ef9eaSBarry Smith Mat A = (Mat) Aa; 664416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 665dfbe8321SBarry Smith PetscErrorCode ierr; 666d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,color; 66736db0b34SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,maxv = 0.0; 668b0a32e0cSBarry Smith PetscViewer viewer; 669f3ef73ceSBarry Smith PetscViewerFormat format; 670cddf8d76SBarry Smith 6713a40ed3dSBarry Smith PetscFunctionBegin; 672480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 673b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 67419bcc07fSBarry Smith 675b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 676416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 6770513a670SBarry Smith 678fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 6790513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 680b0a32e0cSBarry 
Smith color = PETSC_DRAW_BLUE; 681416022c9SBarry Smith for (i=0; i<m; i++) { 682cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 683bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 684bfeeae90SHong Zhang x_l = a->j[j] ; x_r = x_l + 1.0; 685aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 68636db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 687cddf8d76SBarry Smith #else 688cddf8d76SBarry Smith if (a->a[j] >= 0.) continue; 689cddf8d76SBarry Smith #endif 690b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 691cddf8d76SBarry Smith } 692cddf8d76SBarry Smith } 693b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 694cddf8d76SBarry Smith for (i=0; i<m; i++) { 695cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 696bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 697bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 698cddf8d76SBarry Smith if (a->a[j] != 0.) continue; 699b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 700cddf8d76SBarry Smith } 701cddf8d76SBarry Smith } 702b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 703cddf8d76SBarry Smith for (i=0; i<m; i++) { 704cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 705bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 706bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 707aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 70836db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 709cddf8d76SBarry Smith #else 710cddf8d76SBarry Smith if (a->a[j] <= 0.) 
continue; 711cddf8d76SBarry Smith #endif 712b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 713416022c9SBarry Smith } 714416022c9SBarry Smith } 7150513a670SBarry Smith } else { 7160513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 7170513a670SBarry Smith /* first determine max of all nonzero values */ 71897f1f81fSBarry Smith PetscInt nz = a->nz,count; 719b0a32e0cSBarry Smith PetscDraw popup; 72036db0b34SBarry Smith PetscReal scale; 7210513a670SBarry Smith 7220513a670SBarry Smith for (i=0; i<nz; i++) { 7230513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 7240513a670SBarry Smith } 725b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 726b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 727b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 7280513a670SBarry Smith count = 0; 7290513a670SBarry Smith for (i=0; i<m; i++) { 7300513a670SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 731bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 732bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 73397f1f81fSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (PetscInt)(scale*PetscAbsScalar(a->a[count])); 734b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 7350513a670SBarry Smith count++; 7360513a670SBarry Smith } 7370513a670SBarry Smith } 7380513a670SBarry Smith } 739480ef9eaSBarry Smith PetscFunctionReturn(0); 740480ef9eaSBarry Smith } 741cddf8d76SBarry Smith 7424a2ae208SSatish Balay #undef __FUNCT__ 7434a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw" 744dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 745480ef9eaSBarry Smith { 746dfbe8321SBarry Smith PetscErrorCode ierr; 747b0a32e0cSBarry Smith PetscDraw draw; 74836db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 
749ace3abfcSBarry Smith PetscBool isnull; 750480ef9eaSBarry Smith 751480ef9eaSBarry Smith PetscFunctionBegin; 752b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 753b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 754480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 755480ef9eaSBarry Smith 756480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 757d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 758480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 759b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 760b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 761480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 7623a40ed3dSBarry Smith PetscFunctionReturn(0); 763416022c9SBarry Smith } 764416022c9SBarry Smith 7654a2ae208SSatish Balay #undef __FUNCT__ 7664a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ" 767dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 768416022c9SBarry Smith { 769dfbe8321SBarry Smith PetscErrorCode ierr; 770ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 771416022c9SBarry Smith 7723a40ed3dSBarry Smith PetscFunctionBegin; 7732692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 7742692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 7752692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 776c45a1595SBarry Smith if (iascii) { 7773a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 7780f5bd95cSBarry Smith } else if (isbinary) { 7793a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 7800f5bd95cSBarry Smith } else if (isdraw) { 
7813a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 782*913ac41fSBarry Smith } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Viewer type %s not supported by SeqAIJ matrices",((PetscObject)viewer)->type_name); 7834108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 7843a40ed3dSBarry Smith PetscFunctionReturn(0); 78517ab2063SBarry Smith } 78619bcc07fSBarry Smith 7874a2ae208SSatish Balay #undef __FUNCT__ 7884a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyEnd_SeqAIJ" 789dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 79017ab2063SBarry Smith { 791416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7926849ba73SBarry Smith PetscErrorCode ierr; 79397f1f81fSBarry Smith PetscInt fshift = 0,i,j,*ai = a->i,*aj = a->j,*imax = a->imax; 794d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 79554f21887SBarry Smith MatScalar *aa = a->a,*ap; 7963447b6efSHong Zhang PetscReal ratio=0.6; 79717ab2063SBarry Smith 7983a40ed3dSBarry Smith PetscFunctionBegin; 7993a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 80017ab2063SBarry Smith 80143ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 80217ab2063SBarry Smith for (i=1; i<m; i++) { 803416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 80417ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 80594a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 80617ab2063SBarry Smith if (fshift) { 807bfeeae90SHong Zhang ip = aj + ai[i] ; 808bfeeae90SHong Zhang ap = aa + ai[i] ; 80917ab2063SBarry Smith N = ailen[i]; 81017ab2063SBarry Smith for (j=0; j<N; j++) { 81117ab2063SBarry Smith ip[j-fshift] = ip[j]; 81217ab2063SBarry Smith ap[j-fshift] = ap[j]; 81317ab2063SBarry Smith } 81417ab2063SBarry Smith } 81517ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 81617ab2063SBarry Smith } 81717ab2063SBarry Smith if (m) { 81817ab2063SBarry Smith 
fshift += imax[m-1] - ailen[m-1]; 81917ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 82017ab2063SBarry Smith } 82117ab2063SBarry Smith /* reset ilen and imax for each row */ 82217ab2063SBarry Smith for (i=0; i<m; i++) { 82317ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 82417ab2063SBarry Smith } 825bfeeae90SHong Zhang a->nz = ai[m]; 82665e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 82717ab2063SBarry Smith 82809f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 829d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 830ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 831ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 8328e58a170SBarry Smith A->info.mallocs += a->reallocs; 833dd5f02e7SSatish Balay a->reallocs = 0; 8344e220ebcSLois Curfman McInnes A->info.nz_unneeded = (double)fshift; 83536db0b34SBarry Smith a->rmax = rmax; 8364e220ebcSLois Curfman McInnes 837cd6b891eSBarry Smith ierr = MatCheckCompressedRow(A,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 83888e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 83971c2f376SKris Buschelman 8404108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 84171f1c65dSBarry Smith 84271f1c65dSBarry Smith a->idiagvalid = PETSC_FALSE; 843bbead8a2SBarry Smith a->ibdiagvalid = PETSC_FALSE; 8443a40ed3dSBarry Smith PetscFunctionReturn(0); 84517ab2063SBarry Smith } 84617ab2063SBarry Smith 8474a2ae208SSatish Balay #undef __FUNCT__ 84899cafbc1SBarry Smith #define __FUNCT__ "MatRealPart_SeqAIJ" 84999cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 85099cafbc1SBarry Smith { 85199cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 
85299cafbc1SBarry Smith PetscInt i,nz = a->nz; 85354f21887SBarry Smith MatScalar *aa = a->a; 85499cafbc1SBarry Smith 85599cafbc1SBarry Smith PetscFunctionBegin; 85699cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 85799cafbc1SBarry Smith PetscFunctionReturn(0); 85899cafbc1SBarry Smith } 85999cafbc1SBarry Smith 86099cafbc1SBarry Smith #undef __FUNCT__ 86199cafbc1SBarry Smith #define __FUNCT__ "MatImaginaryPart_SeqAIJ" 86299cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 86399cafbc1SBarry Smith { 86499cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 86599cafbc1SBarry Smith PetscInt i,nz = a->nz; 86654f21887SBarry Smith MatScalar *aa = a->a; 86799cafbc1SBarry Smith 86899cafbc1SBarry Smith PetscFunctionBegin; 86999cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 87099cafbc1SBarry Smith PetscFunctionReturn(0); 87199cafbc1SBarry Smith } 87299cafbc1SBarry Smith 87399cafbc1SBarry Smith #undef __FUNCT__ 8744a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqAIJ" 875dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 87617ab2063SBarry Smith { 877416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 878dfbe8321SBarry Smith PetscErrorCode ierr; 8793a40ed3dSBarry Smith 8803a40ed3dSBarry Smith PetscFunctionBegin; 881d0f46423SBarry Smith ierr = PetscMemzero(a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 8823a40ed3dSBarry Smith PetscFunctionReturn(0); 88317ab2063SBarry Smith } 884416022c9SBarry Smith 8854a2ae208SSatish Balay #undef __FUNCT__ 8864a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_SeqAIJ" 887dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 88817ab2063SBarry Smith { 889416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 890dfbe8321SBarry Smith PetscErrorCode ierr; 891d5d45c9bSBarry Smith 8923a40ed3dSBarry Smith PetscFunctionBegin; 893aa482453SBarry Smith #if defined(PETSC_USE_LOG) 894d0f46423SBarry Smith 
PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 89517ab2063SBarry Smith #endif 896e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 8976bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 8986bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 89905b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 900d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 90105b42c5fSBarry Smith ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr); 90271f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 90305b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 9046bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 90505b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 9066bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 90705b42c5fSBarry Smith ierr = PetscFree(a->xtoy);CHKERRQ(ierr); 9086bf464f9SBarry Smith ierr = MatDestroy(&a->XtoY);CHKERRQ(ierr); 909cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 910a30b2313SHong Zhang 9114108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 912bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 913901853e0SKris Buschelman 914dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 915901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetColumnIndices_C","",PETSC_NULL);CHKERRQ(ierr); 916901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatStoreValues_C","",PETSC_NULL);CHKERRQ(ierr); 917901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatRetrieveValues_C","",PETSC_NULL);CHKERRQ(ierr); 918901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqsbaij_C","",PETSC_NULL);CHKERRQ(ierr); 
919901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqbaij_C","",PETSC_NULL);CHKERRQ(ierr); 9205a11e1b2SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqaijperm_C","",PETSC_NULL);CHKERRQ(ierr); 921901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatIsTranspose_C","",PETSC_NULL);CHKERRQ(ierr); 922901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 923a1661176SMatthew Knepley ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C","",PETSC_NULL);CHKERRQ(ierr); 924901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatReorderForNonzeroDiagonal_C","",PETSC_NULL);CHKERRQ(ierr); 9253a40ed3dSBarry Smith PetscFunctionReturn(0); 92617ab2063SBarry Smith } 92717ab2063SBarry Smith 9284a2ae208SSatish Balay #undef __FUNCT__ 9294a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqAIJ" 930ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 93117ab2063SBarry Smith { 932416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 9334846f1f5SKris Buschelman PetscErrorCode ierr; 9343a40ed3dSBarry Smith 9353a40ed3dSBarry Smith PetscFunctionBegin; 936a65d3064SKris Buschelman switch (op) { 937a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 9384e0d8c25SBarry Smith a->roworiented = flg; 939a65d3064SKris Buschelman break; 940a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 941a9817697SBarry Smith a->keepnonzeropattern = flg; 942a65d3064SKris Buschelman break; 943512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 944512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 945a65d3064SKris Buschelman break; 946a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 9474e0d8c25SBarry Smith a->nonew = (flg ? 
-1 : 0); 948a65d3064SKris Buschelman break; 949a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 9504e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 951a65d3064SKris Buschelman break; 95228b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 95328b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 95428b2fa4aSMatthew Knepley break; 955a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 9564e0d8c25SBarry Smith a->ignorezeroentries = flg; 9570df259c2SBarry Smith break; 958cd6b891eSBarry Smith case MAT_CHECK_COMPRESSED_ROW: 959cd6b891eSBarry Smith a->compressedrow.check = flg; 960d487561eSHong Zhang break; 9613d472b54SHong Zhang case MAT_SPD: 9623d472b54SHong Zhang A->spd_set = PETSC_TRUE; 9633d472b54SHong Zhang A->spd = flg; 9643d472b54SHong Zhang if (flg) { 9653d472b54SHong Zhang A->symmetric = PETSC_TRUE; 9663d472b54SHong Zhang A->structurally_symmetric = PETSC_TRUE; 9673d472b54SHong Zhang A->symmetric_set = PETSC_TRUE; 9683d472b54SHong Zhang A->structurally_symmetric_set = PETSC_TRUE; 9693d472b54SHong Zhang } 9703d472b54SHong Zhang break; 971b1646e73SJed Brown case MAT_SYMMETRIC: 972b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 973b1646e73SJed Brown case MAT_HERMITIAN: 974b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 9754e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 976a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 977a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 978290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 979a65d3064SKris Buschelman break; 980b87ac2d8SJed Brown case MAT_USE_INODES: 981b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 982b87ac2d8SJed Brown break; 983a65d3064SKris Buschelman default: 984e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 985a65d3064SKris Buschelman } 9864108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 9873a40ed3dSBarry Smith 
PetscFunctionReturn(0); 98817ab2063SBarry Smith } 98917ab2063SBarry Smith 9904a2ae208SSatish Balay #undef __FUNCT__ 9914a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqAIJ" 992dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 99317ab2063SBarry Smith { 994416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 9956849ba73SBarry Smith PetscErrorCode ierr; 996d3e70bfaSHong Zhang PetscInt i,j,n,*ai=a->i,*aj=a->j,nz; 99735e7444dSHong Zhang PetscScalar *aa=a->a,*x,zero=0.0; 99817ab2063SBarry Smith 9993a40ed3dSBarry Smith PetscFunctionBegin; 1000d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1001e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 100235e7444dSHong Zhang 1003d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU){ 1004d3e70bfaSHong Zhang PetscInt *diag=a->diag; 100535e7444dSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 10062c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 100735e7444dSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 100835e7444dSHong Zhang PetscFunctionReturn(0); 100935e7444dSHong Zhang } 101035e7444dSHong Zhang 10112dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 10121ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 101335e7444dSHong Zhang for (i=0; i<n; i++) { 101435e7444dSHong Zhang nz = ai[i+1] - ai[i]; 10152f5a7c2eSBarry Smith if (!nz) x[i] = 0.0; 101635e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++){ 101735e7444dSHong Zhang if (aj[j] == i) { 101835e7444dSHong Zhang x[i] = aa[j]; 101917ab2063SBarry Smith break; 102017ab2063SBarry Smith } 102117ab2063SBarry Smith } 102217ab2063SBarry Smith } 10231ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 10243a40ed3dSBarry Smith PetscFunctionReturn(0); 102517ab2063SBarry Smith } 102617ab2063SBarry Smith 1027c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 
10284a2ae208SSatish Balay #undef __FUNCT__ 10294a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqAIJ" 1030dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 103117ab2063SBarry Smith { 1032416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10335c897100SBarry Smith PetscScalar *x,*y; 1034dfbe8321SBarry Smith PetscErrorCode ierr; 1035d0f46423SBarry Smith PetscInt m = A->rmap->n; 10365c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1037a77337e4SBarry Smith MatScalar *v; 1038a77337e4SBarry Smith PetscScalar alpha; 103904fbf559SBarry Smith PetscInt n,i,j,*idx,*ii,*ridx=PETSC_NULL; 10403447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1041ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 10425c897100SBarry Smith #endif 104317ab2063SBarry Smith 10443a40ed3dSBarry Smith PetscFunctionBegin; 10452e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 10461ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 10471ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 10485c897100SBarry Smith 10495c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1050bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 10515c897100SBarry Smith #else 10523447b6efSHong Zhang if (usecprow){ 10533447b6efSHong Zhang m = cprow.nrows; 10543447b6efSHong Zhang ii = cprow.i; 10557b2bb3b9SHong Zhang ridx = cprow.rindex; 10563447b6efSHong Zhang } else { 10573447b6efSHong Zhang ii = a->i; 10583447b6efSHong Zhang } 105917ab2063SBarry Smith for (i=0; i<m; i++) { 10603447b6efSHong Zhang idx = a->j + ii[i] ; 10613447b6efSHong Zhang v = a->a + ii[i] ; 10623447b6efSHong Zhang n = ii[i+1] - ii[i]; 10633447b6efSHong Zhang if (usecprow){ 10647b2bb3b9SHong Zhang alpha = x[ridx[i]]; 10653447b6efSHong Zhang } else { 106617ab2063SBarry Smith alpha = x[i]; 10673447b6efSHong Zhang } 106804fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += 
alpha*v[j]; 106917ab2063SBarry Smith } 10705c897100SBarry Smith #endif 1071dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 10721ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 10731ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 10743a40ed3dSBarry Smith PetscFunctionReturn(0); 107517ab2063SBarry Smith } 107617ab2063SBarry Smith 10774a2ae208SSatish Balay #undef __FUNCT__ 10785c897100SBarry Smith #define __FUNCT__ "MatMultTranspose_SeqAIJ" 1079dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 10805c897100SBarry Smith { 1081dfbe8321SBarry Smith PetscErrorCode ierr; 10825c897100SBarry Smith 10835c897100SBarry Smith PetscFunctionBegin; 1084170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 10855c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 10865c897100SBarry Smith PetscFunctionReturn(0); 10875c897100SBarry Smith } 10885c897100SBarry Smith 1089c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 10905c897100SBarry Smith #undef __FUNCT__ 10914a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqAIJ" 1092dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 109317ab2063SBarry Smith { 1094416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1095d9fead3dSBarry Smith PetscScalar *y; 109654f21887SBarry Smith const PetscScalar *x; 109754f21887SBarry Smith const MatScalar *aa; 1098dfbe8321SBarry Smith PetscErrorCode ierr; 1099003131ecSBarry Smith PetscInt m=A->rmap->n; 1100003131ecSBarry Smith const PetscInt *aj,*ii,*ridx=PETSC_NULL; 11018aee2decSHong Zhang PetscInt n,i,nonzerorow=0; 1102362ced78SSatish Balay PetscScalar sum; 1103ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 110417ab2063SBarry Smith 1105b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 110697952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1107fee21e36SBarry Smith #endif 1108fee21e36SBarry Smith 11093a40ed3dSBarry Smith 
PetscFunctionBegin; 11103649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 11111ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 111297952fefSHong Zhang aj = a->j; 111397952fefSHong Zhang aa = a->a; 1114416022c9SBarry Smith ii = a->i; 11154eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 111697952fefSHong Zhang m = a->compressedrow.nrows; 111797952fefSHong Zhang ii = a->compressedrow.i; 111897952fefSHong Zhang ridx = a->compressedrow.rindex; 111997952fefSHong Zhang for (i=0; i<m; i++){ 112097952fefSHong Zhang n = ii[i+1] - ii[i]; 112197952fefSHong Zhang aj = a->j + ii[i]; 112297952fefSHong Zhang aa = a->a + ii[i]; 112397952fefSHong Zhang sum = 0.0; 1124a46b3154SVictor Eijkhout nonzerorow += (n>0); 1125003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1126003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 112797952fefSHong Zhang y[*ridx++] = sum; 112897952fefSHong Zhang } 112997952fefSHong Zhang } else { /* do not use compressed row format */ 1130b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 1131b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1132b05257ddSBarry Smith #else 113317ab2063SBarry Smith for (i=0; i<m; i++) { 1134003131ecSBarry Smith n = ii[i+1] - ii[i]; 1135003131ecSBarry Smith aj = a->j + ii[i]; 1136003131ecSBarry Smith aa = a->a + ii[i]; 113717ab2063SBarry Smith sum = 0.0; 1138a46b3154SVictor Eijkhout nonzerorow += (n>0); 1139003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 114017ab2063SBarry Smith y[i] = sum; 114117ab2063SBarry Smith } 11428d195f9aSBarry Smith #endif 1143b05257ddSBarry Smith } 1144dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 11453649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 11461ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 11473a40ed3dSBarry Smith PetscFunctionReturn(0); 114817ab2063SBarry Smith } 114917ab2063SBarry Smith 115063db405bSBarry 
Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 115163db405bSBarry Smith 11520ca81413SKerry Stevens //******************* 1153700485ddSSatish Balay #if defined(PETSC_HAVE_PTHREADCLASSES) 1154cfcfc605SKerry Stevens extern PetscBool PetscUseThreadPool; 1155cfcfc605SKerry Stevens void* DoCoreAffinity(void); 1156cfcfc605SKerry Stevens 11570ca81413SKerry Stevens typedef struct { 11580ca81413SKerry Stevens const MatScalar* matdata; 11590ca81413SKerry Stevens const PetscScalar* vecdata; 11600ca81413SKerry Stevens PetscScalar* vecout; 11610ca81413SKerry Stevens const PetscInt* colindnz; 11620ca81413SKerry Stevens const PetscInt* rownumnz; 11630ca81413SKerry Stevens PetscInt numrows; 11640ca81413SKerry Stevens const PetscInt* specidx; 11650ca81413SKerry Stevens PetscInt nzr; 11660ca81413SKerry Stevens } MatMult_KernelData; 11670ca81413SKerry Stevens 11680ca81413SKerry Stevens void* MatMult_Kernel(void *arg) 11690ca81413SKerry Stevens { 1170cfcfc605SKerry Stevens if(PetscUseThreadPool==PETSC_FALSE) { 1171cfcfc605SKerry Stevens DoCoreAffinity(); 1172cfcfc605SKerry Stevens } 11730ca81413SKerry Stevens MatMult_KernelData *data = (MatMult_KernelData*)arg; 11740ca81413SKerry Stevens PetscScalar sum; 11750ca81413SKerry Stevens const MatScalar *aabase = data->matdata,*aa; 11760ca81413SKerry Stevens const PetscScalar *x = data->vecdata; 11770ca81413SKerry Stevens PetscScalar *y = data->vecout; 11780ca81413SKerry Stevens const PetscInt *ajbase = data->colindnz,*aj; 11790ca81413SKerry Stevens const PetscInt *ii = data->rownumnz; 11800ca81413SKerry Stevens PetscInt m = data->numrows; 11810ca81413SKerry Stevens const PetscInt *ridx = data->specidx; 11820ca81413SKerry Stevens PetscInt i,n,nonzerorow = 0; 11830ca81413SKerry Stevens 11840ca81413SKerry Stevens if(ridx!=NULL) { 11850ca81413SKerry Stevens for (i=0; i<m; i++){ 11860ca81413SKerry Stevens n = ii[i+1] - ii[i]; 11870ca81413SKerry Stevens aj = ajbase + ii[i]; 11880ca81413SKerry Stevens aa = aabase + ii[i]; 11890ca81413SKerry Stevens 
sum = 0.0; 1190cfcfc605SKerry Stevens if(n>0) { 119151d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 119251d315f7SKerry Stevens nonzerorow++; 1193cfcfc605SKerry Stevens } 11940ca81413SKerry Stevens y[*ridx++] = sum; 11950ca81413SKerry Stevens } 11960ca81413SKerry Stevens } 11970ca81413SKerry Stevens else { 119851d315f7SKerry Stevens PetscInt ibase = data->nzr; 11990ca81413SKerry Stevens for (i=0; i<m; i++) { 12000ca81413SKerry Stevens n = ii[i+1] - ii[i]; 12010ca81413SKerry Stevens aj = ajbase + ii[i]; 12020ca81413SKerry Stevens aa = aabase + ii[i]; 12030ca81413SKerry Stevens sum = 0.0; 1204cfcfc605SKerry Stevens if(n>0) { 120551d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 120651d315f7SKerry Stevens nonzerorow++; 1207cfcfc605SKerry Stevens } 120851d315f7SKerry Stevens y[i+ibase] = sum; 12090ca81413SKerry Stevens } 12100ca81413SKerry Stevens } 12110ca81413SKerry Stevens data->nzr = nonzerorow; 12120ca81413SKerry Stevens return NULL; 12130ca81413SKerry Stevens } 1214700485ddSSatish Balay #endif 12150ca81413SKerry Stevens 12160ca81413SKerry Stevens extern PetscMPIInt PetscMaxThreads; 12174b83fb64SBarry Smith extern PetscErrorCode (*MainJob)(void* (*pFunc)(void*),void**,PetscInt); 121851d315f7SKerry Stevens 12190ca81413SKerry Stevens #undef __FUNCT__ 12207d6a0e61SBarry Smith #define __FUNCT__ "MatMult_SeqAIJPThread" 12217d6a0e61SBarry Smith PetscErrorCode MatMult_SeqAIJPThread(Mat A,Vec xx,Vec yy) 12220ca81413SKerry Stevens { 12230ca81413SKerry Stevens Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12240ca81413SKerry Stevens PetscScalar *y; 12250ca81413SKerry Stevens const PetscScalar *x; 12260ca81413SKerry Stevens PetscErrorCode ierr; 12270ca81413SKerry Stevens PetscInt m=A->rmap->n,nonzerorow=0; 12280ca81413SKerry Stevens PetscBool usecprow=a->compressedrow.use; 12290ca81413SKerry Stevens 12300ca81413SKerry Stevens #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 12310ca81413SKerry Stevens #pragma disjoint(*x,*y,*aa) 12320ca81413SKerry Stevens #endif 
12330ca81413SKerry Stevens 12340ca81413SKerry Stevens PetscFunctionBegin; 12350ca81413SKerry Stevens ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 12360ca81413SKerry Stevens ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 12370ca81413SKerry Stevens 12380ca81413SKerry Stevens if(usecprow) { 12390ca81413SKerry Stevens PetscInt NumPerThread,iindex; 12400ca81413SKerry Stevens const MatScalar *aa = a->a; 12410ca81413SKerry Stevens const PetscInt *aj = a->j,*ii = a->compressedrow.i,*ridx=a->compressedrow.rindex; 12420ca81413SKerry Stevens PetscInt i,iStartVal,iEndVal,iStartIndex,iEndIndex; 12430ca81413SKerry Stevens const PetscInt iNumThreads = PetscMaxThreads; //this number could be different 1244cfcfc605SKerry Stevens MatMult_KernelData* kerneldatap = (MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 1245cfcfc605SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 12460ca81413SKerry Stevens 12470ca81413SKerry Stevens m = a->compressedrow.nrows; 12480ca81413SKerry Stevens NumPerThread = ii[m]/iNumThreads; 12490ca81413SKerry Stevens iindex = 0; 12500ca81413SKerry Stevens for(i=0; i<iNumThreads;i++) { 12510ca81413SKerry Stevens iStartIndex = iindex; 12520ca81413SKerry Stevens iStartVal = ii[iStartIndex]; 12530ca81413SKerry Stevens iEndVal = iStartVal; 12540ca81413SKerry Stevens //determine number of rows to process 12550ca81413SKerry Stevens while(iEndVal-iStartVal<NumPerThread) { 12560ca81413SKerry Stevens iindex++; 12570ca81413SKerry Stevens iEndVal = ii[iindex]; 12580ca81413SKerry Stevens } 12590ca81413SKerry Stevens //determine whether to go back 1 12600ca81413SKerry Stevens if(iEndVal-iStartVal-NumPerThread>NumPerThread-(ii[iindex-1]-iStartVal)) { 12610ca81413SKerry Stevens iindex--; 12620ca81413SKerry Stevens iEndVal = ii[iindex]; 12630ca81413SKerry Stevens } 12640ca81413SKerry Stevens iEndIndex = iindex; 1265cfcfc605SKerry Stevens kerneldatap[i].matdata = aa; 12660ca81413SKerry Stevens 
kerneldatap[i].vecdata = x; 12670ca81413SKerry Stevens kerneldatap[i].vecout = y; 12680ca81413SKerry Stevens kerneldatap[i].colindnz = aj; 12690ca81413SKerry Stevens kerneldatap[i].rownumnz = ii + iStartIndex; 12700ca81413SKerry Stevens kerneldatap[i].numrows = iEndIndex - iStartIndex + 1; 12710ca81413SKerry Stevens kerneldatap[i].specidx = ridx + iStartVal; 12720ca81413SKerry Stevens kerneldatap[i].nzr = 0; 1273cfcfc605SKerry Stevens pdata[i] = &kerneldatap[i]; 12740ca81413SKerry Stevens iindex++; 12750ca81413SKerry Stevens } 1276cfcfc605SKerry Stevens ierr = MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 1277cfcfc605SKerry Stevens /* collect results */ 127851d315f7SKerry Stevens for(i=0; i<iNumThreads; i++) { 1279cfcfc605SKerry Stevens nonzerorow += kerneldatap[i].nzr; 128051d315f7SKerry Stevens } 1281cfcfc605SKerry Stevens free(kerneldatap); 1282cfcfc605SKerry Stevens free(pdata); 128351d315f7SKerry Stevens } 128451d315f7SKerry Stevens else { 128551d315f7SKerry Stevens #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 128651d315f7SKerry Stevens fortranmultaij_(&m,x,a->i,a->j,a->a,y); 128751d315f7SKerry Stevens #else 128851d315f7SKerry Stevens PetscInt i,iindex; 128951d315f7SKerry Stevens const MatScalar *aa = a->a; 129051d315f7SKerry Stevens const PetscInt *aj = a->j,*ii = a->i; 129151d315f7SKerry Stevens const PetscInt iNumThreads = PetscMaxThreads; //this number could be different 129251d315f7SKerry Stevens PetscInt Q = m/iNumThreads; 129351d315f7SKerry Stevens PetscInt R = m-Q*iNumThreads; 129451d315f7SKerry Stevens PetscBool S; 129551d315f7SKerry Stevens 129651d315f7SKerry Stevens MatMult_KernelData* kerneldatap = (MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 129751d315f7SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 129851d315f7SKerry Stevens 129951d315f7SKerry Stevens iindex = 0; 130051d315f7SKerry Stevens for(i=0; i<iNumThreads;i++) { 1301b50af74fSBarry Smith S = 
(PetscBool)(i<R); 130251d315f7SKerry Stevens kerneldatap[i].matdata = aa; 130351d315f7SKerry Stevens kerneldatap[i].vecdata = x; 130451d315f7SKerry Stevens kerneldatap[i].vecout = y; 130551d315f7SKerry Stevens kerneldatap[i].colindnz = aj; 130651d315f7SKerry Stevens kerneldatap[i].rownumnz = ii + iindex; 130751d315f7SKerry Stevens kerneldatap[i].numrows = S?Q+1:Q; 130851d315f7SKerry Stevens kerneldatap[i].specidx = PETSC_NULL; 130951d315f7SKerry Stevens kerneldatap[i].nzr = iindex; //serves as the 'base' row (needed to access correctly into output vector y) 131051d315f7SKerry Stevens pdata[i] = &kerneldatap[i]; 131151d315f7SKerry Stevens iindex += kerneldatap[i].numrows; 131251d315f7SKerry Stevens } 13130ca81413SKerry Stevens MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 13140ca81413SKerry Stevens //collect results 13150ca81413SKerry Stevens for(i=0; i<iNumThreads; i++) { 13160ca81413SKerry Stevens nonzerorow += kerneldatap[i].nzr; 13170ca81413SKerry Stevens } 131851d315f7SKerry Stevens free(kerneldatap); 131951d315f7SKerry Stevens free(pdata); 13200ca81413SKerry Stevens #endif 13210ca81413SKerry Stevens } 13220ca81413SKerry Stevens 13230ca81413SKerry Stevens ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 13240ca81413SKerry Stevens ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13250ca81413SKerry Stevens ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13260ca81413SKerry Stevens PetscFunctionReturn(0); 13270ca81413SKerry Stevens } 13280ca81413SKerry Stevens //******************* 1329ba61063dSBarry Smith #endif 13300ca81413SKerry Stevens 1331c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 13324a2ae208SSatish Balay #undef __FUNCT__ 13334a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqAIJ" 1334dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 133517ab2063SBarry Smith { 1336416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1337f15663dcSBarry Smith PetscScalar *y,*z; 
1338f15663dcSBarry Smith const PetscScalar *x; 133954f21887SBarry Smith const MatScalar *aa; 1340dfbe8321SBarry Smith PetscErrorCode ierr; 1341d0f46423SBarry Smith PetscInt m = A->rmap->n,*aj,*ii; 1342f15663dcSBarry Smith PetscInt n,i,*ridx=PETSC_NULL; 1343362ced78SSatish Balay PetscScalar sum; 1344ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 13459ea0dfa2SSatish Balay 13463a40ed3dSBarry Smith PetscFunctionBegin; 1347f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13481ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13492e8a6d31SBarry Smith if (zz != yy) { 13501ebc52fbSHong Zhang ierr = VecGetArray(zz,&z);CHKERRQ(ierr); 13512e8a6d31SBarry Smith } else { 13522e8a6d31SBarry Smith z = y; 13532e8a6d31SBarry Smith } 1354bfeeae90SHong Zhang 135597952fefSHong Zhang aj = a->j; 135697952fefSHong Zhang aa = a->a; 1357cddf8d76SBarry Smith ii = a->i; 13584eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 13594eb6d288SHong Zhang if (zz != yy){ 13604eb6d288SHong Zhang ierr = PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 13614eb6d288SHong Zhang } 136297952fefSHong Zhang m = a->compressedrow.nrows; 136397952fefSHong Zhang ii = a->compressedrow.i; 136497952fefSHong Zhang ridx = a->compressedrow.rindex; 136597952fefSHong Zhang for (i=0; i<m; i++){ 136697952fefSHong Zhang n = ii[i+1] - ii[i]; 136797952fefSHong Zhang aj = a->j + ii[i]; 136897952fefSHong Zhang aa = a->a + ii[i]; 136997952fefSHong Zhang sum = y[*ridx]; 1370f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 137197952fefSHong Zhang z[*ridx++] = sum; 137297952fefSHong Zhang } 137397952fefSHong Zhang } else { /* do not use compressed row format */ 1374f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 1375f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1376f15663dcSBarry Smith #else 137717ab2063SBarry Smith for (i=0; i<m; i++) { 1378f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1379f15663dcSBarry Smith aj = a->j + 
ii[i]; 1380f15663dcSBarry Smith aa = a->a + ii[i]; 138117ab2063SBarry Smith sum = y[i]; 1382f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 138317ab2063SBarry Smith z[i] = sum; 138417ab2063SBarry Smith } 138502ab625aSSatish Balay #endif 1386f15663dcSBarry Smith } 1387dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1388f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13891ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13902e8a6d31SBarry Smith if (zz != yy) { 13911ebc52fbSHong Zhang ierr = VecRestoreArray(zz,&z);CHKERRQ(ierr); 13922e8a6d31SBarry Smith } 13938154be41SBarry Smith #if defined(PETSC_HAVE_CUSP) 13946b375ea7SVictor Minden /* 1395918e98c3SVictor Minden ierr = VecView(xx,0);CHKERRQ(ierr); 1396918e98c3SVictor Minden ierr = VecView(zz,0);CHKERRQ(ierr); 1397918e98c3SVictor Minden ierr = MatView(A,0);CHKERRQ(ierr); 13986b375ea7SVictor Minden */ 1399918e98c3SVictor Minden #endif 14003a40ed3dSBarry Smith PetscFunctionReturn(0); 140117ab2063SBarry Smith } 140217ab2063SBarry Smith 140317ab2063SBarry Smith /* 140417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
140517ab2063SBarry Smith */ 14064a2ae208SSatish Balay #undef __FUNCT__ 14074a2ae208SSatish Balay #define __FUNCT__ "MatMarkDiagonal_SeqAIJ" 1408dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 140917ab2063SBarry Smith { 1410416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14116849ba73SBarry Smith PetscErrorCode ierr; 1412d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 141317ab2063SBarry Smith 14143a40ed3dSBarry Smith PetscFunctionBegin; 141509f38230SBarry Smith if (!a->diag) { 141609f38230SBarry Smith ierr = PetscMalloc(m*sizeof(PetscInt),&a->diag);CHKERRQ(ierr); 14179518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(A, m*sizeof(PetscInt));CHKERRQ(ierr); 141809f38230SBarry Smith } 1419d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 142009f38230SBarry Smith a->diag[i] = a->i[i+1]; 1421bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1422bfeeae90SHong Zhang if (a->j[j] == i) { 142309f38230SBarry Smith a->diag[i] = j; 142417ab2063SBarry Smith break; 142517ab2063SBarry Smith } 142617ab2063SBarry Smith } 142717ab2063SBarry Smith } 14283a40ed3dSBarry Smith PetscFunctionReturn(0); 142917ab2063SBarry Smith } 143017ab2063SBarry Smith 1431be5855fcSBarry Smith /* 1432be5855fcSBarry Smith Checks for missing diagonals 1433be5855fcSBarry Smith */ 14344a2ae208SSatish Balay #undef __FUNCT__ 14354a2ae208SSatish Balay #define __FUNCT__ "MatMissingDiagonal_SeqAIJ" 1436ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1437be5855fcSBarry Smith { 1438be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 143997f1f81fSBarry Smith PetscInt *diag,*jj = a->j,i; 1440be5855fcSBarry Smith 1441be5855fcSBarry Smith PetscFunctionBegin; 144209f38230SBarry Smith *missing = PETSC_FALSE; 1443d0f46423SBarry Smith if (A->rmap->n > 0 && !jj) { 144409f38230SBarry Smith *missing = PETSC_TRUE; 144509f38230SBarry Smith if (d) *d = 0; 144609f38230SBarry Smith PetscInfo(A,"Matrix has no entries therefor is missing 
diagonal"); 144709f38230SBarry Smith } else { 1448f1e2ffcdSBarry Smith diag = a->diag; 1449d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1450bfeeae90SHong Zhang if (jj[diag[i]] != i) { 145109f38230SBarry Smith *missing = PETSC_TRUE; 145209f38230SBarry Smith if (d) *d = i; 145309f38230SBarry Smith PetscInfo1(A,"Matrix is missing diagonal number %D",i); 145409f38230SBarry Smith } 1455be5855fcSBarry Smith } 1456be5855fcSBarry Smith } 1457be5855fcSBarry Smith PetscFunctionReturn(0); 1458be5855fcSBarry Smith } 1459be5855fcSBarry Smith 146071f1c65dSBarry Smith EXTERN_C_BEGIN 146171f1c65dSBarry Smith #undef __FUNCT__ 146271f1c65dSBarry Smith #define __FUNCT__ "MatInvertDiagonal_SeqAIJ" 14637087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 146471f1c65dSBarry Smith { 146571f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 146671f1c65dSBarry Smith PetscErrorCode ierr; 1467d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 146854f21887SBarry Smith MatScalar *v = a->a; 146954f21887SBarry Smith PetscScalar *idiag,*mdiag; 147071f1c65dSBarry Smith 147171f1c65dSBarry Smith PetscFunctionBegin; 147271f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 147371f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 147471f1c65dSBarry Smith diag = a->diag; 147571f1c65dSBarry Smith if (!a->idiag) { 147671f1c65dSBarry Smith ierr = PetscMalloc3(m,PetscScalar,&a->idiag,m,PetscScalar,&a->mdiag,m,PetscScalar,&a->ssor_work);CHKERRQ(ierr); 147771f1c65dSBarry Smith ierr = PetscLogObjectMemory(A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 147871f1c65dSBarry Smith v = a->a; 147971f1c65dSBarry Smith } 148071f1c65dSBarry Smith mdiag = a->mdiag; 148171f1c65dSBarry Smith idiag = a->idiag; 148271f1c65dSBarry Smith 1483028cd4eaSSatish Balay if (omega == 1.0 && !PetscAbsScalar(fshift)) { 148471f1c65dSBarry Smith for (i=0; i<m; i++) { 148571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1486e32f2f54SBarry Smith if 
(!PetscAbsScalar(mdiag[i])) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 148771f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 148871f1c65dSBarry Smith } 148971f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 149071f1c65dSBarry Smith } else { 149171f1c65dSBarry Smith for (i=0; i<m; i++) { 149271f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 149371f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 149471f1c65dSBarry Smith } 1495dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*m);CHKERRQ(ierr); 149671f1c65dSBarry Smith } 149771f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 149871f1c65dSBarry Smith PetscFunctionReturn(0); 149971f1c65dSBarry Smith } 15005a9745a3SMatthew Knepley EXTERN_C_END 150171f1c65dSBarry Smith 1502c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 15034a2ae208SSatish Balay #undef __FUNCT__ 150441f059aeSBarry Smith #define __FUNCT__ "MatSOR_SeqAIJ" 150541f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 150617ab2063SBarry Smith { 1507416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1508e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 1509e6d1f457SBarry Smith const MatScalar *v = a->a,*idiag=0,*mdiag; 151054f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1511dfbe8321SBarry Smith PetscErrorCode ierr; 1512d0f46423SBarry Smith PetscInt n = A->cmap->n,m = A->rmap->n,i; 151397f1f81fSBarry Smith const PetscInt *idx,*diag; 151417ab2063SBarry Smith 15153a40ed3dSBarry Smith PetscFunctionBegin; 1516b965ef7fSBarry Smith its = its*lits; 151791723122SBarry Smith 151871f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 151971f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 152071f1c65dSBarry Smith a->fshift = fshift; 152171f1c65dSBarry Smith a->omega = omega; 
1522ed480e8bSBarry Smith 152371f1c65dSBarry Smith diag = a->diag; 152471f1c65dSBarry Smith t = a->ssor_work; 1525ed480e8bSBarry Smith idiag = a->idiag; 152671f1c65dSBarry Smith mdiag = a->mdiag; 1527ed480e8bSBarry Smith 15281ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 15293649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 153071f1c65dSBarry Smith CHKMEMQ; 1531ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 153217ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 153317ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1534ed480e8bSBarry Smith bs = b; 153517ab2063SBarry Smith for (i=0; i<m; i++) { 153671f1c65dSBarry Smith d = fshift + mdiag[i]; 1537416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1538ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1539ed480e8bSBarry Smith v = a->a + diag[i] + 1; 154017ab2063SBarry Smith sum = b[i]*d/omega; 1541003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 154217ab2063SBarry Smith x[i] = sum; 154317ab2063SBarry Smith } 15441ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 15453649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1546efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 15473a40ed3dSBarry Smith PetscFunctionReturn(0); 154817ab2063SBarry Smith } 1549c783ea89SBarry Smith 155048af12d7SBarry Smith if (flag == SOR_APPLY_LOWER) { 1551e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 15523a40ed3dSBarry Smith } else if (flag & SOR_EISENSTAT) { 155317ab2063SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 1554887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 155517ab2063SBarry Smith 155617ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 155717ab2063SBarry Smith 1558887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 
155917ab2063SBarry Smith */ 156017ab2063SBarry Smith scale = (2.0/omega) - 1.0; 156117ab2063SBarry Smith 156217ab2063SBarry Smith /* x = (E + U)^{-1} b */ 156317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1564416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1565ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1566ed480e8bSBarry Smith v = a->a + diag[i] + 1; 156717ab2063SBarry Smith sum = b[i]; 1568e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1569ed480e8bSBarry Smith x[i] = sum*idiag[i]; 157017ab2063SBarry Smith } 157117ab2063SBarry Smith 157217ab2063SBarry Smith /* t = b - (2*E - D)x */ 1573416022c9SBarry Smith v = a->a; 1574ed480e8bSBarry Smith for (i=0; i<m; i++) { t[i] = b[i] - scale*(v[*diag++])*x[i]; } 157517ab2063SBarry Smith 157617ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1577ed480e8bSBarry Smith ts = t; 1578416022c9SBarry Smith diag = a->diag; 157917ab2063SBarry Smith for (i=0; i<m; i++) { 1580416022c9SBarry Smith n = diag[i] - a->i[i]; 1581ed480e8bSBarry Smith idx = a->j + a->i[i]; 1582ed480e8bSBarry Smith v = a->a + a->i[i]; 158317ab2063SBarry Smith sum = t[i]; 1584003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1585ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1586733d66baSBarry Smith /* x = x + t */ 1587733d66baSBarry Smith x[i] += t[i]; 158817ab2063SBarry Smith } 158917ab2063SBarry Smith 1590dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 15911ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 15923649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 15933a40ed3dSBarry Smith PetscFunctionReturn(0); 159417ab2063SBarry Smith } 159517ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 159617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 159717ab2063SBarry Smith for (i=0; i<m; i++) { 1598416022c9SBarry Smith n = diag[i] - a->i[i]; 1599ed480e8bSBarry Smith idx = a->j + a->i[i]; 1600ed480e8bSBarry Smith v = a->a + a->i[i]; 
160117ab2063SBarry Smith sum = b[i]; 1602e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16035c99c7daSBarry Smith t[i] = sum; 1604ed480e8bSBarry Smith x[i] = sum*idiag[i]; 160517ab2063SBarry Smith } 16065c99c7daSBarry Smith xb = t; 1607efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 16083a40ed3dSBarry Smith } else xb = b; 160917ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 161017ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1611416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1612ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1613ed480e8bSBarry Smith v = a->a + diag[i] + 1; 161417ab2063SBarry Smith sum = xb[i]; 1615e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16165c99c7daSBarry Smith if (xb == b) { 1617ed480e8bSBarry Smith x[i] = sum*idiag[i]; 16185c99c7daSBarry Smith } else { 16195c99c7daSBarry Smith x[i] = (1-omega)*x[i] + sum*idiag[i]; 162017ab2063SBarry Smith } 16215c99c7daSBarry Smith } 1622efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 162317ab2063SBarry Smith } 162417ab2063SBarry Smith its--; 162517ab2063SBarry Smith } 162617ab2063SBarry Smith while (its--) { 162717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 162817ab2063SBarry Smith for (i=0; i<m; i++) { 1629416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1630ed480e8bSBarry Smith idx = a->j + a->i[i]; 1631ed480e8bSBarry Smith v = a->a + a->i[i]; 163217ab2063SBarry Smith sum = b[i]; 1633e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1634ed480e8bSBarry Smith x[i] = (1. 
- omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 163517ab2063SBarry Smith } 16369f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 163717ab2063SBarry Smith } 163817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 163917ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1640416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1641ed480e8bSBarry Smith idx = a->j + a->i[i]; 1642ed480e8bSBarry Smith v = a->a + a->i[i]; 164317ab2063SBarry Smith sum = b[i]; 1644e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1645ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 164617ab2063SBarry Smith } 16479f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 164817ab2063SBarry Smith } 164917ab2063SBarry Smith } 16501ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 16513649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 165271f1c65dSBarry Smith CHKMEMQ; PetscFunctionReturn(0); 165317ab2063SBarry Smith } 165417ab2063SBarry Smith 16552af78befSBarry Smith 16564a2ae208SSatish Balay #undef __FUNCT__ 16574a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqAIJ" 1658dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 165917ab2063SBarry Smith { 1660416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16614e220ebcSLois Curfman McInnes 16623a40ed3dSBarry Smith PetscFunctionBegin; 16634e220ebcSLois Curfman McInnes info->block_size = 1.0; 16644e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 16654e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 16664e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 16674e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 16688e58a170SBarry Smith info->mallocs = (double)A->info.mallocs; 16697adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 1670d5f3da31SBarry Smith if (A->factortype) { 16714e220ebcSLois 
Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 16724e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 16734e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 16744e220ebcSLois Curfman McInnes } else { 16754e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 16764e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 16774e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 16784e220ebcSLois Curfman McInnes } 16793a40ed3dSBarry Smith PetscFunctionReturn(0); 168017ab2063SBarry Smith } 168117ab2063SBarry Smith 16824a2ae208SSatish Balay #undef __FUNCT__ 16834a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqAIJ" 16842b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 168517ab2063SBarry Smith { 1686416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16873b98c0a2SBarry Smith PetscInt i,m = A->rmap->n - 1,d = 0; 16886849ba73SBarry Smith PetscErrorCode ierr; 168997b48c8fSBarry Smith const PetscScalar *xx; 169097b48c8fSBarry Smith PetscScalar *bb; 1691ace3abfcSBarry Smith PetscBool missing; 169217ab2063SBarry Smith 16933a40ed3dSBarry Smith PetscFunctionBegin; 169497b48c8fSBarry Smith if (x && b) { 169597b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 169697b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 169797b48c8fSBarry Smith for (i=0; i<N; i++) { 169897b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 169997b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 170097b48c8fSBarry Smith } 170197b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 170297b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 170397b48c8fSBarry Smith } 170497b48c8fSBarry Smith 1705a9817697SBarry Smith if (a->keepnonzeropattern) { 1706f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1707e32f2f54SBarry 
Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1708bfeeae90SHong Zhang ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 1709f1e2ffcdSBarry Smith } 1710f4df32b1SMatthew Knepley if (diag != 0.0) { 171109f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 1712e32f2f54SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 1713f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1714f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 1715f1e2ffcdSBarry Smith } 1716f1e2ffcdSBarry Smith } 171788e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 1718f1e2ffcdSBarry Smith } else { 1719f4df32b1SMatthew Knepley if (diag != 0.0) { 172017ab2063SBarry Smith for (i=0; i<N; i++) { 1721e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17227ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 1723416022c9SBarry Smith a->ilen[rows[i]] = 1; 1724f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 1725bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 17267ae801bdSBarry Smith } else { /* in case row was completely empty */ 1727f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 172817ab2063SBarry Smith } 172917ab2063SBarry Smith } 17303a40ed3dSBarry Smith } else { 173117ab2063SBarry Smith for (i=0; i<N; i++) { 1732e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1733416022c9SBarry Smith a->ilen[rows[i]] = 0; 173417ab2063SBarry Smith } 173517ab2063SBarry Smith } 173688e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 1737f1e2ffcdSBarry Smith } 173843a90d84SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17393a40ed3dSBarry Smith 
PetscFunctionReturn(0); 174017ab2063SBarry Smith } 174117ab2063SBarry Smith 17424a2ae208SSatish Balay #undef __FUNCT__ 17436e169961SBarry Smith #define __FUNCT__ "MatZeroRowsColumns_SeqAIJ" 17446e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17456e169961SBarry Smith { 17466e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17476e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 17486e169961SBarry Smith PetscErrorCode ierr; 17492b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 17506e169961SBarry Smith const PetscScalar *xx; 17516e169961SBarry Smith PetscScalar *bb; 17526e169961SBarry Smith 17536e169961SBarry Smith PetscFunctionBegin; 17546e169961SBarry Smith if (x && b) { 17556e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 17566e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17572b40b63fSBarry Smith vecs = PETSC_TRUE; 17586e169961SBarry Smith } 17596e169961SBarry Smith ierr = PetscMalloc(A->rmap->n*sizeof(PetscBool),&zeroed);CHKERRQ(ierr); 17606e169961SBarry Smith ierr = PetscMemzero(zeroed,A->rmap->n*sizeof(PetscBool));CHKERRQ(ierr); 17616e169961SBarry Smith for (i=0; i<N; i++) { 17626e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17636e169961SBarry Smith ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 17646e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 17656e169961SBarry Smith } 17666e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 17676e169961SBarry Smith if (!zeroed[i]) { 17686e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 17696e169961SBarry Smith if (zeroed[a->j[j]]) { 17702b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 17716e169961SBarry Smith a->a[j] = 0.0; 17726e169961SBarry Smith } 17736e169961SBarry Smith } 17742b40b63fSBarry Smith } else if (vecs) bb[i] 
= diag*xx[i]; 17756e169961SBarry Smith } 17766e169961SBarry Smith if (x && b) { 17776e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 17786e169961SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 17796e169961SBarry Smith } 17806e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 17816e169961SBarry Smith if (diag != 0.0) { 17826e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 17836e169961SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 17846e169961SBarry Smith for (i=0; i<N; i++) { 17856e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 17866e169961SBarry Smith } 17876e169961SBarry Smith } 17886e169961SBarry Smith A->same_nonzero = PETSC_TRUE; 17896e169961SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17906e169961SBarry Smith PetscFunctionReturn(0); 17916e169961SBarry Smith } 17926e169961SBarry Smith 17936e169961SBarry Smith #undef __FUNCT__ 17944a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqAIJ" 1795a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 179617ab2063SBarry Smith { 1797416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 179897f1f81fSBarry Smith PetscInt *itmp; 179917ab2063SBarry Smith 18003a40ed3dSBarry Smith PetscFunctionBegin; 1801e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 180217ab2063SBarry Smith 1803416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 1804bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 180517ab2063SBarry Smith if (idx) { 1806bfeeae90SHong Zhang itmp = a->j + a->i[row]; 1807bfeeae90SHong Zhang if (*nz) { 18084e093b46SBarry Smith *idx = itmp; 180917ab2063SBarry Smith } 181017ab2063SBarry Smith else *idx = 0; 181117ab2063SBarry Smith } 18123a40ed3dSBarry Smith PetscFunctionReturn(0); 
181317ab2063SBarry Smith } 181417ab2063SBarry Smith 1815bfeeae90SHong Zhang /* remove this function? */ 18164a2ae208SSatish Balay #undef __FUNCT__ 18174a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqAIJ" 1818a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 181917ab2063SBarry Smith { 18203a40ed3dSBarry Smith PetscFunctionBegin; 18213a40ed3dSBarry Smith PetscFunctionReturn(0); 182217ab2063SBarry Smith } 182317ab2063SBarry Smith 18244a2ae208SSatish Balay #undef __FUNCT__ 18254a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqAIJ" 1826dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 182717ab2063SBarry Smith { 1828416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 182954f21887SBarry Smith MatScalar *v = a->a; 183036db0b34SBarry Smith PetscReal sum = 0.0; 18316849ba73SBarry Smith PetscErrorCode ierr; 183297f1f81fSBarry Smith PetscInt i,j; 183317ab2063SBarry Smith 18343a40ed3dSBarry Smith PetscFunctionBegin; 183517ab2063SBarry Smith if (type == NORM_FROBENIUS) { 1836416022c9SBarry Smith for (i=0; i<a->nz; i++) { 1837aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 183836db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 183917ab2063SBarry Smith #else 184017ab2063SBarry Smith sum += (*v)*(*v); v++; 184117ab2063SBarry Smith #endif 184217ab2063SBarry Smith } 18438f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 18443a40ed3dSBarry Smith } else if (type == NORM_1) { 184536db0b34SBarry Smith PetscReal *tmp; 184697f1f81fSBarry Smith PetscInt *jj = a->j; 1847d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscReal),&tmp);CHKERRQ(ierr); 1848d0f46423SBarry Smith ierr = PetscMemzero(tmp,A->cmap->n*sizeof(PetscReal));CHKERRQ(ierr); 1849064f8208SBarry Smith *nrm = 0.0; 1850416022c9SBarry Smith for (j=0; j<a->nz; j++) { 1851bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 185217ab2063SBarry Smith } 1853d0f46423SBarry 
Smith for (j=0; j<A->cmap->n; j++) { 1854064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 185517ab2063SBarry Smith } 1856606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 18573a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1858064f8208SBarry Smith *nrm = 0.0; 1859d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1860bfeeae90SHong Zhang v = a->a + a->i[j]; 186117ab2063SBarry Smith sum = 0.0; 1862416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 1863cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 186417ab2063SBarry Smith } 1865064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 186617ab2063SBarry Smith } 18673a40ed3dSBarry Smith } else { 1868e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 186917ab2063SBarry Smith } 18703a40ed3dSBarry Smith PetscFunctionReturn(0); 187117ab2063SBarry Smith } 187217ab2063SBarry Smith 18734a2ae208SSatish Balay #undef __FUNCT__ 18744a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqAIJ" 1875fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqAIJ(Mat A,MatReuse reuse,Mat *B) 187617ab2063SBarry Smith { 1877416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1878416022c9SBarry Smith Mat C; 18796849ba73SBarry Smith PetscErrorCode ierr; 1880d0f46423SBarry Smith PetscInt i,*aj = a->j,*ai = a->i,m = A->rmap->n,len,*col; 188154f21887SBarry Smith MatScalar *array = a->a; 188217ab2063SBarry Smith 18833a40ed3dSBarry Smith PetscFunctionBegin; 1884e32f2f54SBarry Smith if (reuse == MAT_REUSE_MATRIX && A == *B && m != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Square matrix only for in-place"); 1885fc4dec0aSBarry Smith 1886fc4dec0aSBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B == A) { 1887d0f46423SBarry Smith ierr = PetscMalloc((1+A->cmap->n)*sizeof(PetscInt),&col);CHKERRQ(ierr); 1888d0f46423SBarry Smith ierr = PetscMemzero(col,(1+A->cmap->n)*sizeof(PetscInt));CHKERRQ(ierr); 1889bfeeae90SHong Zhang 1890bfeeae90SHong Zhang for (i=0; i<ai[m]; i++) 
col[aj[i]] += 1; 18917adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 1892d0f46423SBarry Smith ierr = MatSetSizes(C,A->cmap->n,m,A->cmap->n,m);CHKERRQ(ierr); 18937adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 1894ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,col);CHKERRQ(ierr); 1895606d414cSSatish Balay ierr = PetscFree(col);CHKERRQ(ierr); 1896a541d17aSBarry Smith } else { 1897a541d17aSBarry Smith C = *B; 1898a541d17aSBarry Smith } 1899a541d17aSBarry Smith 190017ab2063SBarry Smith for (i=0; i<m; i++) { 190117ab2063SBarry Smith len = ai[i+1]-ai[i]; 190287d4246cSBarry Smith ierr = MatSetValues_SeqAIJ(C,len,aj,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 1903b9b97703SBarry Smith array += len; 1904b9b97703SBarry Smith aj += len; 190517ab2063SBarry Smith } 19066d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19076d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 190817ab2063SBarry Smith 1909815cbec1SBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B != A) { 1910416022c9SBarry Smith *B = C; 191117ab2063SBarry Smith } else { 1912eb6b5d47SBarry Smith ierr = MatHeaderMerge(A,C);CHKERRQ(ierr); 191317ab2063SBarry Smith } 19143a40ed3dSBarry Smith PetscFunctionReturn(0); 191517ab2063SBarry Smith } 191617ab2063SBarry Smith 1917cd0d46ebSvictorle EXTERN_C_BEGIN 1918cd0d46ebSvictorle #undef __FUNCT__ 19195fbd3699SBarry Smith #define __FUNCT__ "MatIsTranspose_SeqAIJ" 19207087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 1921cd0d46ebSvictorle { 1922cd0d46ebSvictorle Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 192354f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 192454f21887SBarry Smith MatScalar *va,*vb; 19256849ba73SBarry Smith PetscErrorCode ierr; 192697f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 1927cd0d46ebSvictorle 1928cd0d46ebSvictorle 
PetscFunctionBegin; 1929cd0d46ebSvictorle bij = (Mat_SeqAIJ *) B->data; 1930cd0d46ebSvictorle 1931cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 1932cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 19335485867bSBarry Smith if (ma!=nb || na!=mb){ 19345485867bSBarry Smith *f = PETSC_FALSE; 19355485867bSBarry Smith PetscFunctionReturn(0); 19365485867bSBarry Smith } 1937cd0d46ebSvictorle aii = aij->i; bii = bij->i; 1938cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 1939cd0d46ebSvictorle va = aij->a; vb = bij->a; 194097f1f81fSBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 194197f1f81fSBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 1942cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 1943cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 1944cd0d46ebSvictorle 1945cd0d46ebSvictorle *f = PETSC_TRUE; 1946cd0d46ebSvictorle for (i=0; i<ma; i++) { 1947cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 194897f1f81fSBarry Smith PetscInt idc,idr; 19495485867bSBarry Smith PetscScalar vc,vr; 1950cd0d46ebSvictorle /* column/row index/value */ 19515485867bSBarry Smith idc = adx[aptr[i]]; 19525485867bSBarry Smith idr = bdx[bptr[idc]]; 19535485867bSBarry Smith vc = va[aptr[i]]; 19545485867bSBarry Smith vr = vb[bptr[idc]]; 19555485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 19565485867bSBarry Smith *f = PETSC_FALSE; 19575485867bSBarry Smith goto done; 1958cd0d46ebSvictorle } else { 19595485867bSBarry Smith aptr[i]++; 19605485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 1961cd0d46ebSvictorle } 1962cd0d46ebSvictorle } 1963cd0d46ebSvictorle } 1964cd0d46ebSvictorle done: 1965cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 19663aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 1967cd0d46ebSvictorle PetscFunctionReturn(0); 1968cd0d46ebSvictorle } 1969cd0d46ebSvictorle EXTERN_C_END 1970cd0d46ebSvictorle 19711cbb95d3SBarry Smith EXTERN_C_BEGIN 19721cbb95d3SBarry Smith #undef 
__FUNCT__ 19731cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitianTranspose_SeqAIJ" 19747087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 19751cbb95d3SBarry Smith { 19761cbb95d3SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 197754f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 197854f21887SBarry Smith MatScalar *va,*vb; 19791cbb95d3SBarry Smith PetscErrorCode ierr; 19801cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 19811cbb95d3SBarry Smith 19821cbb95d3SBarry Smith PetscFunctionBegin; 19831cbb95d3SBarry Smith bij = (Mat_SeqAIJ *) B->data; 19841cbb95d3SBarry Smith 19851cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 19861cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 19871cbb95d3SBarry Smith if (ma!=nb || na!=mb){ 19881cbb95d3SBarry Smith *f = PETSC_FALSE; 19891cbb95d3SBarry Smith PetscFunctionReturn(0); 19901cbb95d3SBarry Smith } 19911cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 19921cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 19931cbb95d3SBarry Smith va = aij->a; vb = bij->a; 19941cbb95d3SBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 19951cbb95d3SBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 19961cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 19971cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 19981cbb95d3SBarry Smith 19991cbb95d3SBarry Smith *f = PETSC_TRUE; 20001cbb95d3SBarry Smith for (i=0; i<ma; i++) { 20011cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 20021cbb95d3SBarry Smith PetscInt idc,idr; 20031cbb95d3SBarry Smith PetscScalar vc,vr; 20041cbb95d3SBarry Smith /* column/row index/value */ 20051cbb95d3SBarry Smith idc = adx[aptr[i]]; 20061cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 20071cbb95d3SBarry Smith vc = va[aptr[i]]; 20081cbb95d3SBarry Smith vr = vb[bptr[idc]]; 20091cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) 
> tol) { 20101cbb95d3SBarry Smith *f = PETSC_FALSE; 20111cbb95d3SBarry Smith goto done; 20121cbb95d3SBarry Smith } else { 20131cbb95d3SBarry Smith aptr[i]++; 20141cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 20151cbb95d3SBarry Smith } 20161cbb95d3SBarry Smith } 20171cbb95d3SBarry Smith } 20181cbb95d3SBarry Smith done: 20191cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 20201cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 20211cbb95d3SBarry Smith PetscFunctionReturn(0); 20221cbb95d3SBarry Smith } 20231cbb95d3SBarry Smith EXTERN_C_END 20241cbb95d3SBarry Smith 20259e29f15eSvictorle #undef __FUNCT__ 20269e29f15eSvictorle #define __FUNCT__ "MatIsSymmetric_SeqAIJ" 2027ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20289e29f15eSvictorle { 2029dfbe8321SBarry Smith PetscErrorCode ierr; 20309e29f15eSvictorle PetscFunctionBegin; 20315485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20329e29f15eSvictorle PetscFunctionReturn(0); 20339e29f15eSvictorle } 20349e29f15eSvictorle 20354a2ae208SSatish Balay #undef __FUNCT__ 20361cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitian_SeqAIJ" 2037ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20381cbb95d3SBarry Smith { 20391cbb95d3SBarry Smith PetscErrorCode ierr; 20401cbb95d3SBarry Smith PetscFunctionBegin; 20411cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20421cbb95d3SBarry Smith PetscFunctionReturn(0); 20431cbb95d3SBarry Smith } 20441cbb95d3SBarry Smith 20451cbb95d3SBarry Smith #undef __FUNCT__ 20464a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqAIJ" 2047dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 204817ab2063SBarry Smith { 2049416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 205054f21887SBarry Smith PetscScalar *l,*r,x; 205154f21887SBarry Smith MatScalar *v; 2052dfbe8321SBarry Smith PetscErrorCode 
ierr; 2053d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz,*jj; 205417ab2063SBarry Smith 20553a40ed3dSBarry Smith PetscFunctionBegin; 205617ab2063SBarry Smith if (ll) { 20573ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 20583ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2059e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2060e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 20611ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 2062416022c9SBarry Smith v = a->a; 206317ab2063SBarry Smith for (i=0; i<m; i++) { 206417ab2063SBarry Smith x = l[i]; 2065416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 206617ab2063SBarry Smith for (j=0; j<M; j++) { (*v++) *= x;} 206717ab2063SBarry Smith } 20681ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 2069efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 207017ab2063SBarry Smith } 207117ab2063SBarry Smith if (rr) { 2072e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2073e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 20741ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 2075416022c9SBarry Smith v = a->a; jj = a->j; 207617ab2063SBarry Smith for (i=0; i<nz; i++) { 2077bfeeae90SHong Zhang (*v++) *= r[*jj++]; 207817ab2063SBarry Smith } 20791ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 2080efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 208117ab2063SBarry Smith } 20823a40ed3dSBarry Smith PetscFunctionReturn(0); 208317ab2063SBarry Smith } 208417ab2063SBarry Smith 20854a2ae208SSatish Balay #undef __FUNCT__ 20864a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqAIJ" 208797f1f81fSBarry Smith PetscErrorCode MatGetSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 
208817ab2063SBarry Smith { 2089db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 20906849ba73SBarry Smith PetscErrorCode ierr; 2091d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 209297f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 20935d0c19d7SBarry Smith const PetscInt *irow,*icol; 20945d0c19d7SBarry Smith PetscInt nrows,ncols; 209597f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 209654f21887SBarry Smith MatScalar *a_new,*mat_a; 2097416022c9SBarry Smith Mat C; 2098ace3abfcSBarry Smith PetscBool stride,sorted; 209917ab2063SBarry Smith 21003a40ed3dSBarry Smith PetscFunctionBegin; 210114ca34e6SBarry Smith ierr = ISSorted(isrow,&sorted);CHKERRQ(ierr); 2102e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"ISrow is not sorted"); 210314ca34e6SBarry Smith ierr = ISSorted(iscol,&sorted);CHKERRQ(ierr); 2104e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"IScol is not sorted"); 210599141d43SSatish Balay 210617ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2107b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2108b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 210917ab2063SBarry Smith 2110fee21e36SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 21110dbe5b1eSSatish Balay ierr = PetscTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2112fee21e36SBarry Smith if (stride && step == 1) { 211302834360SBarry Smith /* special case of contiguous rows */ 21140e83c824SBarry Smith ierr = PetscMalloc2(nrows,PetscInt,&lens,nrows,PetscInt,&starts);CHKERRQ(ierr); 211502834360SBarry Smith /* loop over new rows determining lens and starting points */ 211602834360SBarry Smith for (i=0; i<nrows; i++) { 2117bfeeae90SHong Zhang kstart = ai[irow[i]]; 2118a2744918SBarry Smith kend = kstart + 
ailen[irow[i]]; 211902834360SBarry Smith for (k=kstart; k<kend; k++) { 2120bfeeae90SHong Zhang if (aj[k] >= first) { 212102834360SBarry Smith starts[i] = k; 212202834360SBarry Smith break; 212302834360SBarry Smith } 212402834360SBarry Smith } 2125a2744918SBarry Smith sum = 0; 212602834360SBarry Smith while (k < kend) { 2127bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2128a2744918SBarry Smith sum++; 212902834360SBarry Smith } 2130a2744918SBarry Smith lens[i] = sum; 213102834360SBarry Smith } 213202834360SBarry Smith /* create submatrix */ 2133cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 213497f1f81fSBarry Smith PetscInt n_cols,n_rows; 213508480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2136e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2137d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 213808480c60SBarry Smith C = *B; 21393a40ed3dSBarry Smith } else { 21407adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2141f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 21427adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2143ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 214408480c60SBarry Smith } 2145db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2146db02288aSLois Curfman McInnes 214702834360SBarry Smith /* loop over rows inserting into submatrix */ 2148db02288aSLois Curfman McInnes a_new = c->a; 2149db02288aSLois Curfman McInnes j_new = c->j; 2150db02288aSLois Curfman McInnes i_new = c->i; 2151bfeeae90SHong Zhang 215202834360SBarry Smith for (i=0; i<nrows; i++) { 2153a2744918SBarry Smith ii = starts[i]; 2154a2744918SBarry Smith lensi = lens[i]; 2155a2744918SBarry Smith for (k=0; k<lensi; k++) { 2156a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 
215702834360SBarry Smith } 215887828ca2SBarry Smith ierr = PetscMemcpy(a_new,a->a + starts[i],lensi*sizeof(PetscScalar));CHKERRQ(ierr); 2159a2744918SBarry Smith a_new += lensi; 2160a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2161a2744918SBarry Smith c->ilen[i] = lensi; 216202834360SBarry Smith } 21630e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 21643a40ed3dSBarry Smith } else { 216502834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 21660e83c824SBarry Smith ierr = PetscMalloc(oldcols*sizeof(PetscInt),&smap);CHKERRQ(ierr); 216797f1f81fSBarry Smith ierr = PetscMemzero(smap,oldcols*sizeof(PetscInt));CHKERRQ(ierr); 21680e83c824SBarry Smith ierr = PetscMalloc((1+nrows)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 21694dcab191SBarry Smith for (i=0; i<ncols; i++) { 21704dcab191SBarry Smith #if defined(PETSC_USE_DEBUG) 21714dcab191SBarry Smith if (icol[i] >= oldcols) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D <= A->cmap->n %D",i,icol[i],oldcols); 21724dcab191SBarry Smith #endif 21734dcab191SBarry Smith smap[icol[i]] = i+1; 21744dcab191SBarry Smith } 21754dcab191SBarry Smith 217602834360SBarry Smith /* determine lens of each row */ 217702834360SBarry Smith for (i=0; i<nrows; i++) { 2178bfeeae90SHong Zhang kstart = ai[irow[i]]; 217902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 218002834360SBarry Smith lens[i] = 0; 218102834360SBarry Smith for (k=kstart; k<kend; k++) { 2182bfeeae90SHong Zhang if (smap[aj[k]]) { 218302834360SBarry Smith lens[i]++; 218402834360SBarry Smith } 218502834360SBarry Smith } 218602834360SBarry Smith } 218717ab2063SBarry Smith /* Create and fill new matrix */ 2188a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2189ace3abfcSBarry Smith PetscBool equal; 21900f5bd95cSBarry Smith 219199141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2192e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2193d0f46423SBarry Smith ierr = PetscMemcmp(c->ilen,lens,(*B)->rmap->n*sizeof(PetscInt),&equal);CHKERRQ(ierr); 21940f5bd95cSBarry Smith if (!equal) { 2195e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 219699141d43SSatish Balay } 2197d0f46423SBarry Smith ierr = PetscMemzero(c->ilen,(*B)->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 219808480c60SBarry Smith C = *B; 21993a40ed3dSBarry Smith } else { 22007adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2201f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 22027adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2203ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 220408480c60SBarry Smith } 220599141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 220617ab2063SBarry Smith for (i=0; i<nrows; i++) { 220799141d43SSatish Balay row = irow[i]; 2208bfeeae90SHong Zhang kstart = ai[row]; 220999141d43SSatish Balay kend = kstart + a->ilen[row]; 2210bfeeae90SHong Zhang mat_i = c->i[i]; 221199141d43SSatish Balay mat_j = c->j + mat_i; 221299141d43SSatish Balay mat_a = c->a + mat_i; 221399141d43SSatish Balay mat_ilen = c->ilen + i; 221417ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2215bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2216ed480e8bSBarry Smith *mat_j++ = tcol - 1; 221799141d43SSatish Balay *mat_a++ = a->a[k]; 221899141d43SSatish Balay (*mat_ilen)++; 221999141d43SSatish Balay 222017ab2063SBarry Smith } 222117ab2063SBarry Smith } 222217ab2063SBarry Smith } 222302834360SBarry Smith /* Free work space */ 222402834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2225606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2226606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 222702834360SBarry Smith 
} 22286d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22296d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 223017ab2063SBarry Smith 223117ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2232416022c9SBarry Smith *B = C; 22333a40ed3dSBarry Smith PetscFunctionReturn(0); 223417ab2063SBarry Smith } 223517ab2063SBarry Smith 22361df811f5SHong Zhang #undef __FUNCT__ 223782d44351SHong Zhang #define __FUNCT__ "MatGetMultiProcBlock_SeqAIJ" 223882d44351SHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,Mat* subMat) 223982d44351SHong Zhang { 224082d44351SHong Zhang PetscErrorCode ierr; 224182d44351SHong Zhang Mat B; 224282d44351SHong Zhang 224382d44351SHong Zhang PetscFunctionBegin; 224482d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 224582d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 224682d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 224782d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 224882d44351SHong Zhang *subMat = B; 224982d44351SHong Zhang PetscFunctionReturn(0); 225082d44351SHong Zhang } 225182d44351SHong Zhang 225282d44351SHong Zhang #undef __FUNCT__ 22534a2ae208SSatish Balay #define __FUNCT__ "MatILUFactor_SeqAIJ" 22540481f469SBarry Smith PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2255a871dcd8SBarry Smith { 225663b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2257dfbe8321SBarry Smith PetscErrorCode ierr; 225863b91edcSBarry Smith Mat outA; 2259ace3abfcSBarry Smith PetscBool row_identity,col_identity; 226063b91edcSBarry Smith 22613a40ed3dSBarry Smith PetscFunctionBegin; 2262e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 22631df811f5SHong Zhang 2264b8a78c4aSBarry Smith ierr = 
ISIdentity(row,&row_identity);CHKERRQ(ierr); 2265b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2266a871dcd8SBarry Smith 226763b91edcSBarry Smith outA = inA; 2268d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2269c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 22706bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 2271c3122656SLisandro Dalcin a->row = row; 2272c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 22736bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 2274c3122656SLisandro Dalcin a->col = col; 227563b91edcSBarry Smith 227636db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 22776bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 22784c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 227952e6d16bSBarry Smith ierr = PetscLogObjectParent(inA,a->icol);CHKERRQ(ierr); 2280f0ec6fceSSatish Balay 228194a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2282d0f46423SBarry Smith ierr = PetscMalloc((inA->rmap->n+1)*sizeof(PetscScalar),&a->solve_work);CHKERRQ(ierr); 2283d0f46423SBarry Smith ierr = PetscLogObjectMemory(inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 228494a9d846SBarry Smith } 228563b91edcSBarry Smith 2286f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2287137fb511SHong Zhang if (row_identity && col_identity) { 2288ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2289137fb511SHong Zhang } else { 2290719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2291137fb511SHong Zhang } 22923a40ed3dSBarry Smith PetscFunctionReturn(0); 2293a871dcd8SBarry Smith } 2294a871dcd8SBarry Smith 22954a2ae208SSatish Balay #undef __FUNCT__ 22964a2ae208SSatish Balay #define __FUNCT__ 
"MatScale_SeqAIJ" 2297f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2298f0b747eeSBarry Smith { 2299f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2300f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2301efee365bSSatish Balay PetscErrorCode ierr; 23020805154bSBarry Smith PetscBLASInt one = 1,bnz = PetscBLASIntCast(a->nz); 23033a40ed3dSBarry Smith 23043a40ed3dSBarry Smith PetscFunctionBegin; 2305f4df32b1SMatthew Knepley BLASscal_(&bnz,&oalpha,a->a,&one); 2306efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 23073a40ed3dSBarry Smith PetscFunctionReturn(0); 2308f0b747eeSBarry Smith } 2309f0b747eeSBarry Smith 23104a2ae208SSatish Balay #undef __FUNCT__ 23114a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqAIJ" 231297f1f81fSBarry Smith PetscErrorCode MatGetSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2313cddf8d76SBarry Smith { 2314dfbe8321SBarry Smith PetscErrorCode ierr; 231597f1f81fSBarry Smith PetscInt i; 2316cddf8d76SBarry Smith 23173a40ed3dSBarry Smith PetscFunctionBegin; 2318cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2319b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 2320cddf8d76SBarry Smith } 2321cddf8d76SBarry Smith 2322cddf8d76SBarry Smith for (i=0; i<n; i++) { 23236a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2324cddf8d76SBarry Smith } 23253a40ed3dSBarry Smith PetscFunctionReturn(0); 2326cddf8d76SBarry Smith } 2327cddf8d76SBarry Smith 23284a2ae208SSatish Balay #undef __FUNCT__ 23294a2ae208SSatish Balay #define __FUNCT__ "MatIncreaseOverlap_SeqAIJ" 233097f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 23314dcbc457SBarry Smith { 2332e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23336849ba73SBarry Smith PetscErrorCode ierr; 23345d0c19d7SBarry Smith PetscInt 
row,i,j,k,l,m,n,*nidx,isz,val; 23355d0c19d7SBarry Smith const PetscInt *idx; 233697f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2337f1af5d2fSBarry Smith PetscBT table; 2338bbd702dbSSatish Balay 23393a40ed3dSBarry Smith PetscFunctionBegin; 2340d0f46423SBarry Smith m = A->rmap->n; 2341e4d965acSSatish Balay ai = a->i; 2342bfeeae90SHong Zhang aj = a->j; 23438a047759SSatish Balay 2344e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 234506763907SSatish Balay 234697f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nidx);CHKERRQ(ierr); 23476831982aSBarry Smith ierr = PetscBTCreate(m,table);CHKERRQ(ierr); 234806763907SSatish Balay 2349e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2350b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2351e4d965acSSatish Balay isz = 0; 23526831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2353e4d965acSSatish Balay 2354e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 23554dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2356b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2357e4d965acSSatish Balay 2358dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2359e4d965acSSatish Balay for (j=0; j<n ; ++j){ 2360f1af5d2fSBarry Smith if(!PetscBTLookupSet(table,idx[j])) { nidx[isz++] = idx[j];} 23614dcbc457SBarry Smith } 236206763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 23636bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2364e4d965acSSatish Balay 236504a348a9SBarry Smith k = 0; 236604a348a9SBarry Smith for (j=0; j<ov; j++){ /* for each overlap */ 236704a348a9SBarry Smith n = isz; 236806763907SSatish Balay for (; k<n ; k++){ /* do only those rows in nidx[k], which are not done yet */ 2369e4d965acSSatish Balay row = nidx[k]; 2370e4d965acSSatish Balay start = ai[row]; 2371e4d965acSSatish Balay end = ai[row+1]; 237204a348a9SBarry Smith for (l = start; l<end ; l++){ 2373efb16452SHong Zhang val = aj[l] ; 2374f1af5d2fSBarry Smith if (!PetscBTLookupSet(table,val)) {nidx[isz++] = val;} 2375e4d965acSSatish Balay } 2376e4d965acSSatish Balay } 2377e4d965acSSatish Balay } 237870b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2379e4d965acSSatish Balay } 23806831982aSBarry Smith ierr = PetscBTDestroy(table);CHKERRQ(ierr); 2381606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 23823a40ed3dSBarry Smith PetscFunctionReturn(0); 23834dcbc457SBarry Smith } 238417ab2063SBarry Smith 23850513a670SBarry Smith /* -------------------------------------------------------------- */ 23864a2ae208SSatish Balay #undef __FUNCT__ 23874a2ae208SSatish Balay #define __FUNCT__ "MatPermute_SeqAIJ" 2388dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 23890513a670SBarry Smith { 23900513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23916849ba73SBarry Smith PetscErrorCode ierr; 23923b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 23935d0c19d7SBarry Smith const PetscInt *row,*col; 23945d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 239556cd22aeSBarry 
Smith IS icolp,irowp; 23963b98c0a2SBarry Smith PetscInt *cwork = PETSC_NULL; 23973b98c0a2SBarry Smith PetscScalar *vwork = PETSC_NULL; 23980513a670SBarry Smith 23993a40ed3dSBarry Smith PetscFunctionBegin; 24004c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 240156cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 24024c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 240356cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 24040513a670SBarry Smith 24050513a670SBarry Smith /* determine lengths of permuted rows */ 240697f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 24070513a670SBarry Smith for (i=0; i<m; i++) { 24080513a670SBarry Smith lens[row[i]] = a->i[i+1] - a->i[i]; 24090513a670SBarry Smith } 24107adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 2411f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 24127adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2413ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2414606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 24150513a670SBarry Smith 241697f1f81fSBarry Smith ierr = PetscMalloc(n*sizeof(PetscInt),&cnew);CHKERRQ(ierr); 24170513a670SBarry Smith for (i=0; i<m; i++) { 241832ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24190513a670SBarry Smith for (j=0; j<nz; j++) { cnew[j] = col[cwork[j]];} 2420cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 242132ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24220513a670SBarry Smith } 2423606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 24243c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 24250513a670SBarry Smith ierr = 
MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 24260513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 242756cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 242856cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 24296bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 24306bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 24313a40ed3dSBarry Smith PetscFunctionReturn(0); 24320513a670SBarry Smith } 24330513a670SBarry Smith 24344a2ae208SSatish Balay #undef __FUNCT__ 24354a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqAIJ" 2436dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2437cb5b572fSBarry Smith { 2438dfbe8321SBarry Smith PetscErrorCode ierr; 2439cb5b572fSBarry Smith 2440cb5b572fSBarry Smith PetscFunctionBegin; 244133f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 244233f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2443be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2444be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2445be6bf707SBarry Smith 2446700c5bfcSBarry Smith if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 2447d0f46423SBarry Smith ierr = PetscMemcpy(b->a,a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 2448cb5b572fSBarry Smith } else { 2449cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2450cb5b572fSBarry Smith } 2451cb5b572fSBarry Smith PetscFunctionReturn(0); 2452cb5b572fSBarry Smith } 2453cb5b572fSBarry Smith 24544a2ae208SSatish Balay #undef __FUNCT__ 24554a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqAIJ" 2456dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqAIJ(Mat A) 2457273d9f13SBarry Smith { 2458dfbe8321SBarry Smith PetscErrorCode ierr; 
2459273d9f13SBarry Smith 2460273d9f13SBarry Smith PetscFunctionBegin; 2461ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2462273d9f13SBarry Smith PetscFunctionReturn(0); 2463273d9f13SBarry Smith } 2464273d9f13SBarry Smith 24654a2ae208SSatish Balay #undef __FUNCT__ 24664a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqAIJ" 2467a77337e4SBarry Smith PetscErrorCode MatGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 24686c0721eeSBarry Smith { 24696c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 24706c0721eeSBarry Smith PetscFunctionBegin; 24716c0721eeSBarry Smith *array = a->a; 24726c0721eeSBarry Smith PetscFunctionReturn(0); 24736c0721eeSBarry Smith } 24746c0721eeSBarry Smith 24754a2ae208SSatish Balay #undef __FUNCT__ 24764a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqAIJ" 2477dfbe8321SBarry Smith PetscErrorCode MatRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 24786c0721eeSBarry Smith { 24796c0721eeSBarry Smith PetscFunctionBegin; 24806c0721eeSBarry Smith PetscFunctionReturn(0); 24816c0721eeSBarry Smith } 2482273d9f13SBarry Smith 2483ee4f033dSBarry Smith #undef __FUNCT__ 2484ee4f033dSBarry Smith #define __FUNCT__ "MatFDColoringApply_SeqAIJ" 2485dfbe8321SBarry Smith PetscErrorCode MatFDColoringApply_SeqAIJ(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx) 2486ee4f033dSBarry Smith { 24876849ba73SBarry Smith PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void *))coloring->f; 24886849ba73SBarry Smith PetscErrorCode ierr; 248997f1f81fSBarry Smith PetscInt k,N,start,end,l,row,col,srow,**vscaleforrow,m1,m2; 2490efb30889SBarry Smith PetscScalar dx,*y,*xx,*w3_array; 249187828ca2SBarry Smith PetscScalar *vscale_array; 2492ee4f033dSBarry Smith PetscReal epsilon = coloring->error_rel,umin = coloring->umin; 2493ee4f033dSBarry Smith Vec w1,w2,w3; 2494ee4f033dSBarry Smith void *fctx = coloring->fctx; 2495ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 
2496ee4f033dSBarry Smith 2497ee4f033dSBarry Smith PetscFunctionBegin; 2498ee4f033dSBarry Smith if (!coloring->w1) { 2499ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w1);CHKERRQ(ierr); 250052e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w1);CHKERRQ(ierr); 2501ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w2);CHKERRQ(ierr); 250252e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w2);CHKERRQ(ierr); 2503ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr); 250452e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w3);CHKERRQ(ierr); 2505ee4f033dSBarry Smith } 2506ee4f033dSBarry Smith w1 = coloring->w1; w2 = coloring->w2; w3 = coloring->w3; 2507ee4f033dSBarry Smith 2508ee4f033dSBarry Smith ierr = MatSetUnfactored(J);CHKERRQ(ierr); 2509acfcf0e5SJed Brown ierr = PetscOptionsGetBool(((PetscObject)coloring)->prefix,"-mat_fd_coloring_dont_rezero",&flg,PETSC_NULL);CHKERRQ(ierr); 2510ee4f033dSBarry Smith if (flg) { 2511ae15b995SBarry Smith ierr = PetscInfo(coloring,"Not calling MatZeroEntries()\n");CHKERRQ(ierr); 2512ee4f033dSBarry Smith } else { 2513ace3abfcSBarry Smith PetscBool assembled; 25140b9b6f31SBarry Smith ierr = MatAssembled(J,&assembled);CHKERRQ(ierr); 25150b9b6f31SBarry Smith if (assembled) { 2516ee4f033dSBarry Smith ierr = MatZeroEntries(J);CHKERRQ(ierr); 2517ee4f033dSBarry Smith } 25180b9b6f31SBarry Smith } 2519ee4f033dSBarry Smith 2520ee4f033dSBarry Smith ierr = VecGetOwnershipRange(x1,&start,&end);CHKERRQ(ierr); 2521ee4f033dSBarry Smith ierr = VecGetSize(x1,&N);CHKERRQ(ierr); 2522ee4f033dSBarry Smith 2523ee4f033dSBarry Smith /* 2524ee4f033dSBarry Smith This is a horrible, horrible, hack. 
See DMMGComputeJacobian_Multigrid() it inproperly sets 2525ee4f033dSBarry Smith coloring->F for the coarser grids from the finest 2526ee4f033dSBarry Smith */ 2527ee4f033dSBarry Smith if (coloring->F) { 2528ee4f033dSBarry Smith ierr = VecGetLocalSize(coloring->F,&m1);CHKERRQ(ierr); 2529ee4f033dSBarry Smith ierr = VecGetLocalSize(w1,&m2);CHKERRQ(ierr); 2530ee4f033dSBarry Smith if (m1 != m2) { 2531ee4f033dSBarry Smith coloring->F = 0; 2532ee4f033dSBarry Smith } 2533ee4f033dSBarry Smith } 2534ee4f033dSBarry Smith 2535ee4f033dSBarry Smith if (coloring->F) { 2536ee4f033dSBarry Smith w1 = coloring->F; 2537ee4f033dSBarry Smith coloring->F = 0; 2538ee4f033dSBarry Smith } else { 253966f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2540ee4f033dSBarry Smith ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr); 254166f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2542ee4f033dSBarry Smith } 2543ee4f033dSBarry Smith 2544ee4f033dSBarry Smith /* 2545ee4f033dSBarry Smith Compute all the scale factors and share with other processors 2546ee4f033dSBarry Smith */ 25471ebc52fbSHong Zhang ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);xx = xx - start; 25481ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr);vscale_array = vscale_array - start; 2549ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 2550ee4f033dSBarry Smith /* 2551ee4f033dSBarry Smith Loop over each column associated with color adding the 2552ee4f033dSBarry Smith perturbation to the vector w3. 
2553ee4f033dSBarry Smith */ 2554ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2555ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2556ee4f033dSBarry Smith dx = xx[col]; 2557ee4f033dSBarry Smith if (dx == 0.0) dx = 1.0; 2558ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2559ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2560ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2561ee4f033dSBarry Smith #else 2562ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2563ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2564ee4f033dSBarry Smith #endif 2565ee4f033dSBarry Smith dx *= epsilon; 2566ee4f033dSBarry Smith vscale_array[col] = 1.0/dx; 2567ee4f033dSBarry Smith } 2568ee4f033dSBarry Smith } 25691ebc52fbSHong Zhang vscale_array = vscale_array + start;ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2570ee4f033dSBarry Smith ierr = VecGhostUpdateBegin(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2571ee4f033dSBarry Smith ierr = VecGhostUpdateEnd(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2572ee4f033dSBarry Smith 2573ee4f033dSBarry Smith /* ierr = VecView(coloring->vscale,PETSC_VIEWER_STDOUT_WORLD); 2574ee4f033dSBarry Smith ierr = VecView(x1,PETSC_VIEWER_STDOUT_WORLD);*/ 2575ee4f033dSBarry Smith 2576ee4f033dSBarry Smith if (coloring->vscaleforrow) vscaleforrow = coloring->vscaleforrow; 2577ee4f033dSBarry Smith else vscaleforrow = coloring->columnsforrow; 2578ee4f033dSBarry Smith 25791ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2580ee4f033dSBarry Smith /* 2581ee4f033dSBarry Smith Loop over each color 2582ee4f033dSBarry Smith */ 2583ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 258449b058dcSBarry Smith coloring->currentcolor = k; 2585ee4f033dSBarry Smith ierr = 
VecCopy(x1,w3);CHKERRQ(ierr); 25861ebc52fbSHong Zhang ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);w3_array = w3_array - start; 2587ee4f033dSBarry Smith /* 2588ee4f033dSBarry Smith Loop over each column associated with color adding the 2589ee4f033dSBarry Smith perturbation to the vector w3. 2590ee4f033dSBarry Smith */ 2591ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2592ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2593ee4f033dSBarry Smith dx = xx[col]; 25945b8514ebSBarry Smith if (dx == 0.0) dx = 1.0; 2595ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2596ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2597ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2598ee4f033dSBarry Smith #else 2599ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2600ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2601ee4f033dSBarry Smith #endif 2602ee4f033dSBarry Smith dx *= epsilon; 2603e32f2f54SBarry Smith if (!PetscAbsScalar(dx)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Computed 0 differencing parameter"); 2604ee4f033dSBarry Smith w3_array[col] += dx; 2605ee4f033dSBarry Smith } 26061ebc52fbSHong Zhang w3_array = w3_array + start; ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr); 2607ee4f033dSBarry Smith 2608ee4f033dSBarry Smith /* 2609ee4f033dSBarry Smith Evaluate function at x1 + dx (here dx is a vector of perturbations) 2610ee4f033dSBarry Smith */ 2611ee4f033dSBarry Smith 261266f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2613ee4f033dSBarry Smith ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr); 261466f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2615efb30889SBarry Smith ierr = VecAXPY(w2,-1.0,w1);CHKERRQ(ierr); 2616ee4f033dSBarry Smith 2617ee4f033dSBarry Smith /* 2618ee4f033dSBarry Smith Loop over rows of 
vector, putting results into Jacobian matrix 2619ee4f033dSBarry Smith */ 26201ebc52fbSHong Zhang ierr = VecGetArray(w2,&y);CHKERRQ(ierr); 2621ee4f033dSBarry Smith for (l=0; l<coloring->nrows[k]; l++) { 2622ee4f033dSBarry Smith row = coloring->rows[k][l]; 2623ee4f033dSBarry Smith col = coloring->columnsforrow[k][l]; 2624ee4f033dSBarry Smith y[row] *= vscale_array[vscaleforrow[k][l]]; 2625ee4f033dSBarry Smith srow = row + start; 2626ee4f033dSBarry Smith ierr = MatSetValues_SeqAIJ(J,1,&srow,1,&col,y+row,INSERT_VALUES);CHKERRQ(ierr); 2627ee4f033dSBarry Smith } 26281ebc52fbSHong Zhang ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr); 2629ee4f033dSBarry Smith } 263049b058dcSBarry Smith coloring->currentcolor = k; 26311ebc52fbSHong Zhang ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 26321ebc52fbSHong Zhang xx = xx + start; ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr); 2633ee4f033dSBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2634ee4f033dSBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2635ee4f033dSBarry Smith PetscFunctionReturn(0); 2636ee4f033dSBarry Smith } 2637ee4f033dSBarry Smith 26388229c054SShri Abhyankar /* 26398229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 26408229c054SShri Abhyankar have different nonzero structure. 
26418229c054SShri Abhyankar */ 2642ac90fabeSBarry Smith #undef __FUNCT__ 26438229c054SShri Abhyankar #define __FUNCT__ "MatAXPYGetPreallocation_SeqAIJ" 26448229c054SShri Abhyankar PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt* nnz) 2645ec7775f6SShri Abhyankar { 26468229c054SShri Abhyankar PetscInt i,m=Y->rmap->N; 2647ec7775f6SShri Abhyankar Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2648ec7775f6SShri Abhyankar Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2649ec7775f6SShri Abhyankar const PetscInt *xi = x->i,*yi = y->i; 2650ec7775f6SShri Abhyankar 2651ec7775f6SShri Abhyankar PetscFunctionBegin; 2652ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2653ec7775f6SShri Abhyankar for(i=0; i<m; i++) { 26548af7cee1SJed Brown PetscInt j,k,nzx = xi[i+1] - xi[i],nzy = yi[i+1] - yi[i]; 26558af7cee1SJed Brown const PetscInt *xj = x->j+xi[i],*yj = y->j+yi[i]; 26568af7cee1SJed Brown nnz[i] = 0; 26578af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 26588af7cee1SJed Brown for (; k<nzy && yj[k]<xj[j]; k++) nnz[i]++; /* Catch up to X */ 26598af7cee1SJed Brown if (k<nzy && yj[k]==xj[j]) k++; /* Skip duplicate */ 26608af7cee1SJed Brown nnz[i]++; 26618af7cee1SJed Brown } 26628af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2663ec7775f6SShri Abhyankar } 2664ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2665ec7775f6SShri Abhyankar } 2666ec7775f6SShri Abhyankar 2667ec7775f6SShri Abhyankar #undef __FUNCT__ 2668ac90fabeSBarry Smith #define __FUNCT__ "MatAXPY_SeqAIJ" 2669f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2670ac90fabeSBarry Smith { 2671dfbe8321SBarry Smith PetscErrorCode ierr; 267297f1f81fSBarry Smith PetscInt i; 2673ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data,*y = (Mat_SeqAIJ *)Y->data; 26740805154bSBarry Smith PetscBLASInt one=1,bnz = PetscBLASIntCast(x->nz); 2675ac90fabeSBarry Smith 2676ac90fabeSBarry Smith PetscFunctionBegin; 2677ac90fabeSBarry Smith if (str == 
SAME_NONZERO_PATTERN) { 2678f4df32b1SMatthew Knepley PetscScalar alpha = a; 2679f4df32b1SMatthew Knepley BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one); 2680c537a176SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2681a30b2313SHong Zhang if (y->xtoy && y->XtoY != X) { 2682a30b2313SHong Zhang ierr = PetscFree(y->xtoy);CHKERRQ(ierr); 26836bf464f9SBarry Smith ierr = MatDestroy(&y->XtoY);CHKERRQ(ierr); 2684a30b2313SHong Zhang } 2685a30b2313SHong Zhang if (!y->xtoy) { /* get xtoy */ 2686d0f46423SBarry Smith ierr = MatAXPYGetxtoy_Private(X->rmap->n,x->i,x->j,PETSC_NULL, y->i,y->j,PETSC_NULL, &y->xtoy);CHKERRQ(ierr); 2687a30b2313SHong Zhang y->XtoY = X; 2688407f6b05SHong Zhang ierr = PetscObjectReference((PetscObject)X);CHKERRQ(ierr); 2689c537a176SHong Zhang } 2690f4df32b1SMatthew Knepley for (i=0; i<x->nz; i++) y->a[y->xtoy[i]] += a*(x->a[i]); 26911e2582c4SBarry Smith ierr = PetscInfo3(Y,"ratio of nnz(X)/nnz(Y): %d/%d = %G\n",x->nz,y->nz,(PetscReal)(x->nz)/y->nz);CHKERRQ(ierr); 2692ac90fabeSBarry Smith } else { 26938229c054SShri Abhyankar Mat B; 26948229c054SShri Abhyankar PetscInt *nnz; 269516b2e9dcSShri Abhyankar ierr = PetscMalloc(Y->rmap->N*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2696ec7775f6SShri Abhyankar ierr = MatCreate(((PetscObject)Y)->comm,&B);CHKERRQ(ierr); 2697bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 26984aa94f47SShri Abhyankar ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 2699ec7775f6SShri Abhyankar ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 27008229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 27018229c054SShri Abhyankar ierr = MatSeqAIJSetPreallocation(B,PETSC_NULL,nnz);CHKERRQ(ierr); 2702ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 2703ec7775f6SShri Abhyankar ierr = MatHeaderReplace(Y,B);CHKERRQ(ierr); 27048229c054SShri Abhyankar ierr = 
PetscFree(nnz);CHKERRQ(ierr); 2705ac90fabeSBarry Smith } 2706ac90fabeSBarry Smith PetscFunctionReturn(0); 2707ac90fabeSBarry Smith } 2708ac90fabeSBarry Smith 2709521d7252SBarry Smith #undef __FUNCT__ 2710521d7252SBarry Smith #define __FUNCT__ "MatSetBlockSize_SeqAIJ" 2711521d7252SBarry Smith PetscErrorCode MatSetBlockSize_SeqAIJ(Mat A,PetscInt bs) 2712521d7252SBarry Smith { 271341c166b1SJed Brown PetscErrorCode ierr; 271441c166b1SJed Brown 2715521d7252SBarry Smith PetscFunctionBegin; 271641c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->rmap,bs);CHKERRQ(ierr); 271741c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->cmap,bs);CHKERRQ(ierr); 2718521d7252SBarry Smith PetscFunctionReturn(0); 2719521d7252SBarry Smith } 2720521d7252SBarry Smith 2721354c94deSBarry Smith #undef __FUNCT__ 2722354c94deSBarry Smith #define __FUNCT__ "MatConjugate_SeqAIJ" 27237087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 2724354c94deSBarry Smith { 2725354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2726354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 2727354c94deSBarry Smith PetscInt i,nz; 2728354c94deSBarry Smith PetscScalar *a; 2729354c94deSBarry Smith 2730354c94deSBarry Smith PetscFunctionBegin; 2731354c94deSBarry Smith nz = aij->nz; 2732354c94deSBarry Smith a = aij->a; 2733354c94deSBarry Smith for (i=0; i<nz; i++) { 2734354c94deSBarry Smith a[i] = PetscConj(a[i]); 2735354c94deSBarry Smith } 2736354c94deSBarry Smith #else 2737354c94deSBarry Smith PetscFunctionBegin; 2738354c94deSBarry Smith #endif 2739354c94deSBarry Smith PetscFunctionReturn(0); 2740354c94deSBarry Smith } 2741354c94deSBarry Smith 2742e34fafa9SBarry Smith #undef __FUNCT__ 2743985db425SBarry Smith #define __FUNCT__ "MatGetRowMaxAbs_SeqAIJ" 2744985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2745e34fafa9SBarry Smith { 2746e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2747e34fafa9SBarry Smith PetscErrorCode ierr; 2748d0f46423SBarry 
Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2749e34fafa9SBarry Smith PetscReal atmp; 2750985db425SBarry Smith PetscScalar *x; 2751e34fafa9SBarry Smith MatScalar *aa; 2752e34fafa9SBarry Smith 2753e34fafa9SBarry Smith PetscFunctionBegin; 2754e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2755e34fafa9SBarry Smith aa = a->a; 2756e34fafa9SBarry Smith ai = a->i; 2757e34fafa9SBarry Smith aj = a->j; 2758e34fafa9SBarry Smith 2759985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2760e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2761e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2762e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2763e34fafa9SBarry Smith for (i=0; i<m; i++) { 2764e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 27659189402eSHong Zhang x[i] = 0.0; 2766e34fafa9SBarry Smith for (j=0; j<ncols; j++){ 2767985db425SBarry Smith atmp = PetscAbsScalar(*aa); 2768985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2769985db425SBarry Smith aa++; aj++; 2770985db425SBarry Smith } 2771985db425SBarry Smith } 2772985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2773985db425SBarry Smith PetscFunctionReturn(0); 2774985db425SBarry Smith } 2775985db425SBarry Smith 2776985db425SBarry Smith #undef __FUNCT__ 2777985db425SBarry Smith #define __FUNCT__ "MatGetRowMax_SeqAIJ" 2778985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2779985db425SBarry Smith { 2780985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2781985db425SBarry Smith PetscErrorCode ierr; 2782d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2783985db425SBarry Smith PetscScalar *x; 2784985db425SBarry Smith MatScalar *aa; 2785985db425SBarry Smith 2786985db425SBarry Smith PetscFunctionBegin; 2787e32f2f54SBarry Smith if 
(A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2788985db425SBarry Smith aa = a->a; 2789985db425SBarry Smith ai = a->i; 2790985db425SBarry Smith aj = a->j; 2791985db425SBarry Smith 2792985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2793985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2794985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2795e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2796985db425SBarry Smith for (i=0; i<m; i++) { 2797985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2798d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2799985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2800985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 2801985db425SBarry Smith x[i] = 0.0; 2802985db425SBarry Smith if (idx) { 2803985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2804985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 2805985db425SBarry Smith if (aj[j] > j) { 2806985db425SBarry Smith idx[i] = j; 2807985db425SBarry Smith break; 2808985db425SBarry Smith } 2809985db425SBarry Smith } 2810985db425SBarry Smith } 2811985db425SBarry Smith } 2812985db425SBarry Smith for (j=0; j<ncols; j++){ 2813985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2814985db425SBarry Smith aa++; aj++; 2815985db425SBarry Smith } 2816985db425SBarry Smith } 2817985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2818985db425SBarry Smith PetscFunctionReturn(0); 2819985db425SBarry Smith } 2820985db425SBarry Smith 2821985db425SBarry Smith #undef __FUNCT__ 2822c87e5d42SMatthew Knepley #define __FUNCT__ "MatGetRowMinAbs_SeqAIJ" 2823c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2824c87e5d42SMatthew Knepley { 2825c87e5d42SMatthew 
Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2826c87e5d42SMatthew Knepley PetscErrorCode ierr; 2827c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2828c87e5d42SMatthew Knepley PetscReal atmp; 2829c87e5d42SMatthew Knepley PetscScalar *x; 2830c87e5d42SMatthew Knepley MatScalar *aa; 2831c87e5d42SMatthew Knepley 2832c87e5d42SMatthew Knepley PetscFunctionBegin; 2833e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2834c87e5d42SMatthew Knepley aa = a->a; 2835c87e5d42SMatthew Knepley ai = a->i; 2836c87e5d42SMatthew Knepley aj = a->j; 2837c87e5d42SMatthew Knepley 2838c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 2839c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2840c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2841e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2842c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 2843c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 2844289a08f5SMatthew Knepley if (ncols) { 2845289a08f5SMatthew Knepley /* Get first nonzero */ 2846289a08f5SMatthew Knepley for(j = 0; j < ncols; j++) { 2847289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 2848289a08f5SMatthew Knepley if (atmp > 1.0e-12) {x[i] = atmp; if (idx) idx[i] = aj[j]; break;} 2849289a08f5SMatthew Knepley } 2850289a08f5SMatthew Knepley if (j == ncols) {x[i] = *aa; if (idx) idx[i] = *aj;} 2851289a08f5SMatthew Knepley } else { 2852289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 2853289a08f5SMatthew Knepley } 2854c87e5d42SMatthew Knepley for(j = 0; j < ncols; j++) { 2855c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 2856289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2857c87e5d42SMatthew Knepley aa++; aj++; 2858c87e5d42SMatthew Knepley } 2859c87e5d42SMatthew Knepley } 
2860c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2861c87e5d42SMatthew Knepley PetscFunctionReturn(0); 2862c87e5d42SMatthew Knepley } 2863c87e5d42SMatthew Knepley 2864c87e5d42SMatthew Knepley #undef __FUNCT__ 2865985db425SBarry Smith #define __FUNCT__ "MatGetRowMin_SeqAIJ" 2866985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2867985db425SBarry Smith { 2868985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2869985db425SBarry Smith PetscErrorCode ierr; 2870d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2871985db425SBarry Smith PetscScalar *x; 2872985db425SBarry Smith MatScalar *aa; 2873985db425SBarry Smith 2874985db425SBarry Smith PetscFunctionBegin; 2875e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2876985db425SBarry Smith aa = a->a; 2877985db425SBarry Smith ai = a->i; 2878985db425SBarry Smith aj = a->j; 2879985db425SBarry Smith 2880985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2881985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2882985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2883e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2884985db425SBarry Smith for (i=0; i<m; i++) { 2885985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2886d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2887985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2888985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 2889985db425SBarry Smith x[i] = 0.0; 2890985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 2891985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2892985db425SBarry Smith for (j=0;j<ncols;j++) { 2893985db425SBarry Smith if (aj[j] > j) { 2894985db425SBarry Smith idx[i] = j; 2895985db425SBarry Smith break; 2896985db425SBarry 
Smith } 2897985db425SBarry Smith } 2898985db425SBarry Smith } 2899985db425SBarry Smith } 2900985db425SBarry Smith for (j=0; j<ncols; j++){ 2901985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2902985db425SBarry Smith aa++; aj++; 2903e34fafa9SBarry Smith } 2904e34fafa9SBarry Smith } 2905e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2906e34fafa9SBarry Smith PetscFunctionReturn(0); 2907e34fafa9SBarry Smith } 2908bbead8a2SBarry Smith 2909bbead8a2SBarry Smith #include <petscblaslapack.h> 2910bbead8a2SBarry Smith #include <../src/mat/blockinvert.h> 2911bbead8a2SBarry Smith 2912bbead8a2SBarry Smith #undef __FUNCT__ 2913bbead8a2SBarry Smith #define __FUNCT__ "MatInvertBlockDiagonal_SeqAIJ" 2914bbead8a2SBarry Smith PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,PetscScalar **values) 2915bbead8a2SBarry Smith { 2916bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 2917bbead8a2SBarry Smith PetscErrorCode ierr; 291834fc4b71SJed Brown PetscInt i,bs = A->rmap->bs,mbs = A->rmap->n/A->rmap->bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 2919bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 2920bbead8a2SBarry Smith PetscReal shift = 0.0; 2921bbead8a2SBarry Smith 2922bbead8a2SBarry Smith PetscFunctionBegin; 29234a0d0026SBarry Smith if (a->ibdiagvalid) { 29244a0d0026SBarry Smith if (values) *values = a->ibdiag; 29254a0d0026SBarry Smith PetscFunctionReturn(0); 29264a0d0026SBarry Smith } 2927bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 2928bbead8a2SBarry Smith if (!a->ibdiag) { 2929bbead8a2SBarry Smith ierr = PetscMalloc(bs2*mbs*sizeof(PetscScalar),&a->ibdiag);CHKERRQ(ierr); 2930bbead8a2SBarry Smith ierr = PetscLogObjectMemory(A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 2931bbead8a2SBarry Smith } 2932bbead8a2SBarry Smith diag = a->ibdiag; 2933bbead8a2SBarry Smith if (values) *values = a->ibdiag; 2934bbead8a2SBarry Smith /* factor and invert each block */ 
2935bbead8a2SBarry Smith switch (bs){ 2936bbead8a2SBarry Smith case 1: 2937bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2938bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 2939bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 2940bbead8a2SBarry Smith } 2941bbead8a2SBarry Smith break; 2942bbead8a2SBarry Smith case 2: 2943bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2944bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 2945bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 2946bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_2(diag,shift);CHKERRQ(ierr); 2947bbead8a2SBarry Smith diag += 4; 2948bbead8a2SBarry Smith } 2949bbead8a2SBarry Smith break; 2950bbead8a2SBarry Smith case 3: 2951bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2952bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 2953bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 2954bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_3(diag,shift);CHKERRQ(ierr); 2955bbead8a2SBarry Smith diag += 9; 2956bbead8a2SBarry Smith } 2957bbead8a2SBarry Smith break; 2958bbead8a2SBarry Smith case 4: 2959bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2960bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 2961bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 2962bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_4(diag,shift);CHKERRQ(ierr); 2963bbead8a2SBarry Smith diag += 16; 2964bbead8a2SBarry Smith } 2965bbead8a2SBarry Smith break; 2966bbead8a2SBarry Smith case 5: 2967bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2968bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 2969bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 2970bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_5(diag,ipvt,work,shift);CHKERRQ(ierr); 2971bbead8a2SBarry Smith diag += 25; 2972bbead8a2SBarry Smith } 
2973bbead8a2SBarry Smith break; 2974bbead8a2SBarry Smith case 6: 2975bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2976bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 2977bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 2978bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_6(diag,shift);CHKERRQ(ierr); 2979bbead8a2SBarry Smith diag += 36; 2980bbead8a2SBarry Smith } 2981bbead8a2SBarry Smith break; 2982bbead8a2SBarry Smith case 7: 2983bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2984bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 2985bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 2986bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_7(diag,shift);CHKERRQ(ierr); 2987bbead8a2SBarry Smith diag += 49; 2988bbead8a2SBarry Smith } 2989bbead8a2SBarry Smith break; 2990bbead8a2SBarry Smith default: 2991bbead8a2SBarry Smith ierr = PetscMalloc3(bs,MatScalar,&v_work,bs,PetscInt,&v_pivots,bs,PetscInt,&IJ);CHKERRQ(ierr); 2992bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2993bbead8a2SBarry Smith for (j=0; j<bs; j++) { 2994bbead8a2SBarry Smith IJ[j] = bs*i + j; 2995bbead8a2SBarry Smith } 2996bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 2997bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A(bs,diag,v_pivots,v_work);CHKERRQ(ierr); 2998bbead8a2SBarry Smith diag += bs2; 2999bbead8a2SBarry Smith } 3000bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3001bbead8a2SBarry Smith } 3002bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3003bbead8a2SBarry Smith PetscFunctionReturn(0); 3004bbead8a2SBarry Smith } 3005bbead8a2SBarry Smith 30067087cfbeSBarry Smith extern PetscErrorCode MatFDColoringApply_AIJ(Mat,MatFDColoring,Vec,MatStructure*,void*); 3007682d7d0cSBarry Smith /* 
-------------------------------------------------------------------*/
/*
   MatOps_Values - positional initializer of the _MatOps function table for the
   SeqAIJ matrix implementation.

   Each entry is the SeqAIJ routine placed in that slot; a 0 entry means no routine
   is supplied for the slot in this table.  The numeric markers (for example the
   one in front of MatMultAdd_SeqAIJ) give the zero-based slot index of the entry
   that follows them and exist only to help keep the list aligned.

   The entry after MatSetColoring_SeqAIJ is MatSetValuesAdic_SeqAIJ only when
   PETSC_HAVE_ADIC is defined; otherwise that slot is 0.

   NOTE(review): the order must match the member order of struct _MatOps, which is
   declared outside this file - confirm against that declaration before inserting,
   removing or moving any entry.
*/
static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
       MatGetRow_SeqAIJ,
       MatRestoreRow_SeqAIJ,
       MatMult_SeqAIJ,
/* 4*/ MatMultAdd_SeqAIJ,
       MatMultTranspose_SeqAIJ,
       MatMultTransposeAdd_SeqAIJ,
       0,
       0,
       0,
/*10*/ 0,
       MatLUFactor_SeqAIJ,
       0,
       MatSOR_SeqAIJ,
       MatTranspose_SeqAIJ,
/*15*/ MatGetInfo_SeqAIJ,
       MatEqual_SeqAIJ,
       MatGetDiagonal_SeqAIJ,
       MatDiagonalScale_SeqAIJ,
       MatNorm_SeqAIJ,
/*20*/ 0,
       MatAssemblyEnd_SeqAIJ,
       MatSetOption_SeqAIJ,
       MatZeroEntries_SeqAIJ,
/*24*/ MatZeroRows_SeqAIJ,
       0,
       0,
       0,
       0,
/*29*/ MatSetUpPreallocation_SeqAIJ,
       0,
       0,
       MatGetArray_SeqAIJ,
       MatRestoreArray_SeqAIJ,
/*34*/ MatDuplicate_SeqAIJ,
       0,
       0,
       MatILUFactor_SeqAIJ,
       0,
/*39*/ MatAXPY_SeqAIJ,
       MatGetSubMatrices_SeqAIJ,
       MatIncreaseOverlap_SeqAIJ,
       MatGetValues_SeqAIJ,
       MatCopy_SeqAIJ,
/*44*/ MatGetRowMax_SeqAIJ,
       MatScale_SeqAIJ,
       0,
       MatDiagonalSet_SeqAIJ,
       MatZeroRowsColumns_SeqAIJ,
/*49*/ MatSetBlockSize_SeqAIJ,
       MatGetRowIJ_SeqAIJ,
       MatRestoreRowIJ_SeqAIJ,
       MatGetColumnIJ_SeqAIJ,
       MatRestoreColumnIJ_SeqAIJ,
/*54*/ MatFDColoringCreate_SeqAIJ,
       0,
       0,
       MatPermute_SeqAIJ,
       0,
/*59*/ 0,
       MatDestroy_SeqAIJ,
       MatView_SeqAIJ,
       0,
       0,
/*64*/ 0,
       0,
       0,
       0,
       0,
/*69*/ MatGetRowMaxAbs_SeqAIJ,
       MatGetRowMinAbs_SeqAIJ,
       0,
       MatSetColoring_SeqAIJ,
#if defined(PETSC_HAVE_ADIC)
       MatSetValuesAdic_SeqAIJ,
#else
       0,
#endif
/*74*/ MatSetValuesAdifor_SeqAIJ,
       MatFDColoringApply_AIJ,
       0,
       0,
       0,
/*79*/ MatFindZeroDiagonals_SeqAIJ,
       0,
       0,
       0,
       MatLoad_SeqAIJ,
/*84*/ MatIsSymmetric_SeqAIJ,
       MatIsHermitian_SeqAIJ,
       0,
       0,
       0,
/*89*/ MatMatMult_SeqAIJ_SeqAIJ,
       MatMatMultSymbolic_SeqAIJ_SeqAIJ,
       MatMatMultNumeric_SeqAIJ_SeqAIJ,
       MatPtAP_Basic,
       MatPtAPSymbolic_SeqAIJ,
/*94*/ MatPtAPNumeric_SeqAIJ,
       MatMatMultTranspose_SeqAIJ_SeqAIJ,
       MatMatMultTransposeSymbolic_SeqAIJ_SeqAIJ,
       MatMatMultTransposeNumeric_SeqAIJ_SeqAIJ,
       MatPtAPSymbolic_SeqAIJ_SeqAIJ,
/*99*/ MatPtAPNumeric_SeqAIJ_SeqAIJ,
       0,
       0,
       MatConjugate_SeqAIJ,
       0,
/*104*/MatSetValuesRow_SeqAIJ,
       MatRealPart_SeqAIJ,
       MatImaginaryPart_SeqAIJ,
       0,
       0,
/*109*/MatMatSolve_SeqAIJ,
       0,
       MatGetRowMin_SeqAIJ,
       0,
       MatMissingDiagonal_SeqAIJ,
/*114*/0,
       0,
       0,
       0,
       0,
/*119*/0,
       0,
       0,
       0,
       MatGetMultiProcBlock_SeqAIJ,
/*124*/MatFindNonzeroRows_SeqAIJ,
       MatGetColumnNorms_SeqAIJ,
       MatInvertBlockDiagonal_SeqAIJ,
       0,
       0,
/*129*/0
};

EXTERN_C_BEGIN
#undef __FUNCT__
#define __FUNCT__ "MatSeqAIJSetColumnIndices_SeqAIJ"
31477087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3148bef8e0ddSBarry Smith { 3149bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 315097f1f81fSBarry Smith PetscInt i,nz,n; 3151bef8e0ddSBarry Smith 3152bef8e0ddSBarry Smith PetscFunctionBegin; 3153bef8e0ddSBarry Smith 3154bef8e0ddSBarry Smith nz = aij->maxnz; 3155d0f46423SBarry Smith n = mat->rmap->n; 3156bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3157bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3158bef8e0ddSBarry Smith } 3159bef8e0ddSBarry Smith aij->nz = nz; 3160bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3161bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3162bef8e0ddSBarry Smith } 3163bef8e0ddSBarry Smith 3164bef8e0ddSBarry Smith PetscFunctionReturn(0); 3165bef8e0ddSBarry Smith } 3166fb2e594dSBarry Smith EXTERN_C_END 3167bef8e0ddSBarry Smith 31684a2ae208SSatish Balay #undef __FUNCT__ 31694a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices" 3170bef8e0ddSBarry Smith /*@ 3171bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3172bef8e0ddSBarry Smith in the matrix. 3173bef8e0ddSBarry Smith 3174bef8e0ddSBarry Smith Input Parameters: 3175bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3176bef8e0ddSBarry Smith - indices - the column indices 3177bef8e0ddSBarry Smith 317815091d37SBarry Smith Level: advanced 317915091d37SBarry Smith 3180bef8e0ddSBarry Smith Notes: 3181bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3182bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3183bef8e0ddSBarry Smith of the MatSetValues() operation. 3184bef8e0ddSBarry Smith 3185bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3186d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 
3187bef8e0ddSBarry Smith 3188bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3189bef8e0ddSBarry Smith 3190b9617806SBarry Smith The indices should start with zero, not one. 3191b9617806SBarry Smith 3192bef8e0ddSBarry Smith @*/ 31937087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3194bef8e0ddSBarry Smith { 31954ac538c5SBarry Smith PetscErrorCode ierr; 3196bef8e0ddSBarry Smith 3197bef8e0ddSBarry Smith PetscFunctionBegin; 31980700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 31994482741eSBarry Smith PetscValidPointer(indices,2); 32004ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt *),(mat,indices));CHKERRQ(ierr); 3201bef8e0ddSBarry Smith PetscFunctionReturn(0); 3202bef8e0ddSBarry Smith } 3203bef8e0ddSBarry Smith 3204be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3205be6bf707SBarry Smith 3206fb2e594dSBarry Smith EXTERN_C_BEGIN 32074a2ae208SSatish Balay #undef __FUNCT__ 32084a2ae208SSatish Balay #define __FUNCT__ "MatStoreValues_SeqAIJ" 32097087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3210be6bf707SBarry Smith { 3211be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 32126849ba73SBarry Smith PetscErrorCode ierr; 3213d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3214be6bf707SBarry Smith 3215be6bf707SBarry Smith PetscFunctionBegin; 3216be6bf707SBarry Smith if (aij->nonew != 1) { 3217e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3218be6bf707SBarry Smith } 3219be6bf707SBarry Smith 3220be6bf707SBarry Smith /* allocate space for values if not already there */ 3221be6bf707SBarry Smith if (!aij->saved_values) { 322287828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&aij->saved_values);CHKERRQ(ierr); 32239518dbb4SMatthew Knepley ierr = 
PetscLogObjectMemory(mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3224be6bf707SBarry Smith } 3225be6bf707SBarry Smith 3226be6bf707SBarry Smith /* copy values over */ 322787828ca2SBarry Smith ierr = PetscMemcpy(aij->saved_values,aij->a,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3228be6bf707SBarry Smith PetscFunctionReturn(0); 3229be6bf707SBarry Smith } 3230fb2e594dSBarry Smith EXTERN_C_END 3231be6bf707SBarry Smith 32324a2ae208SSatish Balay #undef __FUNCT__ 3233b9617806SBarry Smith #define __FUNCT__ "MatStoreValues" 3234be6bf707SBarry Smith /*@ 3235be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3236be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3237be6bf707SBarry Smith nonlinear portion. 3238be6bf707SBarry Smith 3239be6bf707SBarry Smith Collect on Mat 3240be6bf707SBarry Smith 3241be6bf707SBarry Smith Input Parameters: 32420e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3243be6bf707SBarry Smith 324415091d37SBarry Smith Level: advanced 324515091d37SBarry Smith 3246be6bf707SBarry Smith Common Usage, with SNESSolve(): 3247be6bf707SBarry Smith $ Create Jacobian matrix 3248be6bf707SBarry Smith $ Set linear terms into matrix 3249be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3250be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3251be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3252512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3253be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3254be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3255be6bf707SBarry Smith $ In your Jacobian routine 3256be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3257be6bf707SBarry Smith $ Set nonlinear terms in matrix 3258be6bf707SBarry Smith 3259be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3260be6bf707SBarry Smith $ // build linear portion of Jacobian 3261512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3262be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3263be6bf707SBarry Smith $ loop over nonlinear iterations 3264be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3265be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3266be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3267be6bf707SBarry Smith $ Solve linear system with Jacobian 3268be6bf707SBarry Smith $ endloop 3269be6bf707SBarry Smith 3270be6bf707SBarry Smith Notes: 3271be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3272512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3273be6bf707SBarry Smith calling this routine. 3274be6bf707SBarry Smith 32750c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 32760c468ba9SBarry Smith and does not allocated additional space. 
32770c468ba9SBarry Smith 3278be6bf707SBarry Smith .seealso: MatRetrieveValues() 3279be6bf707SBarry Smith 3280be6bf707SBarry Smith @*/ 32817087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3282be6bf707SBarry Smith { 32834ac538c5SBarry Smith PetscErrorCode ierr; 3284be6bf707SBarry Smith 3285be6bf707SBarry Smith PetscFunctionBegin; 32860700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3287e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3288e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 32894ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3290be6bf707SBarry Smith PetscFunctionReturn(0); 3291be6bf707SBarry Smith } 3292be6bf707SBarry Smith 3293fb2e594dSBarry Smith EXTERN_C_BEGIN 32944a2ae208SSatish Balay #undef __FUNCT__ 32954a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues_SeqAIJ" 32967087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3297be6bf707SBarry Smith { 3298be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 32996849ba73SBarry Smith PetscErrorCode ierr; 3300d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3301be6bf707SBarry Smith 3302be6bf707SBarry Smith PetscFunctionBegin; 3303be6bf707SBarry Smith if (aij->nonew != 1) { 3304e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3305be6bf707SBarry Smith } 3306be6bf707SBarry Smith if (!aij->saved_values) { 3307e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3308be6bf707SBarry Smith } 3309be6bf707SBarry Smith /* copy values over */ 331087828ca2SBarry Smith ierr = PetscMemcpy(aij->a,aij->saved_values,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3311be6bf707SBarry Smith PetscFunctionReturn(0); 3312be6bf707SBarry Smith } 
3313fb2e594dSBarry Smith EXTERN_C_END 3314be6bf707SBarry Smith 33154a2ae208SSatish Balay #undef __FUNCT__ 33164a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues" 3317be6bf707SBarry Smith /*@ 3318be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3319be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3320be6bf707SBarry Smith nonlinear portion. 3321be6bf707SBarry Smith 3322be6bf707SBarry Smith Collect on Mat 3323be6bf707SBarry Smith 3324be6bf707SBarry Smith Input Parameters: 3325be6bf707SBarry Smith . mat - the matrix (currently on AIJ matrices support this option) 3326be6bf707SBarry Smith 332715091d37SBarry Smith Level: advanced 332815091d37SBarry Smith 3329be6bf707SBarry Smith .seealso: MatStoreValues() 3330be6bf707SBarry Smith 3331be6bf707SBarry Smith @*/ 33327087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3333be6bf707SBarry Smith { 33344ac538c5SBarry Smith PetscErrorCode ierr; 3335be6bf707SBarry Smith 3336be6bf707SBarry Smith PetscFunctionBegin; 33370700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3338e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3339e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 33404ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3341be6bf707SBarry Smith PetscFunctionReturn(0); 3342be6bf707SBarry Smith } 3343be6bf707SBarry Smith 3344f83d6046SBarry Smith 3345be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 33464a2ae208SSatish Balay #undef __FUNCT__ 33474a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJ" 334817ab2063SBarry Smith /*@C 3349682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 33500d15e28bSLois Curfman McInnes 
(the default parallel PETSc format). For good matrix assembly performance 33516e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 335251c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 33532bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 335417ab2063SBarry Smith 3355db81eaa0SLois Curfman McInnes Collective on MPI_Comm 3356db81eaa0SLois Curfman McInnes 335717ab2063SBarry Smith Input Parameters: 3358db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 335917ab2063SBarry Smith . m - number of rows 336017ab2063SBarry Smith . n - number of columns 336117ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 336251c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 33632bd5e0b2SLois Curfman McInnes (possibly different for each row) or PETSC_NULL 336417ab2063SBarry Smith 336517ab2063SBarry Smith Output Parameter: 3366416022c9SBarry Smith . A - the matrix 336717ab2063SBarry Smith 3368175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3369ae1d86c5SBarry Smith MatXXXXSetPreallocation() paradgm instead of this routine directly. 3370175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3371175b88e8SBarry Smith 3372b259b22eSLois Curfman McInnes Notes: 337349a6f317SBarry Smith If nnz is given then nz is ignored 337449a6f317SBarry Smith 337517ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 337617ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 33770002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 337844cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 
337917ab2063SBarry Smith 338017ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3381a40aa06bSLois Curfman McInnes Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 33823d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 33836da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 338417ab2063SBarry Smith 3385682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 33864fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3387682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 33886c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 33896c7ebb05SLois Curfman McInnes 33906c7ebb05SLois Curfman McInnes Options Database Keys: 3391698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 33929db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 339317ab2063SBarry Smith 3394027ccd11SLois Curfman McInnes Level: intermediate 3395027ccd11SLois Curfman McInnes 339636db0b34SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 339736db0b34SBarry Smith 339817ab2063SBarry Smith @*/ 33997087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 340017ab2063SBarry Smith { 3401dfbe8321SBarry Smith PetscErrorCode ierr; 34026945ee14SBarry Smith 34033a40ed3dSBarry Smith PetscFunctionBegin; 3404f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3405117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3406c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3407d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3408273d9f13SBarry Smith 
PetscFunctionReturn(0); 3409273d9f13SBarry Smith } 3410273d9f13SBarry Smith 34114a2ae208SSatish Balay #undef __FUNCT__ 34124a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetPreallocation" 3413273d9f13SBarry Smith /*@C 3414273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3415273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3416273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3417273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3418273d9f13SBarry Smith 3419273d9f13SBarry Smith Collective on MPI_Comm 3420273d9f13SBarry Smith 3421273d9f13SBarry Smith Input Parameters: 3422117016b1SBarry Smith + B - The matrix-free 3423273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3424273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 3425273d9f13SBarry Smith (possibly different for each row) or PETSC_NULL 3426273d9f13SBarry Smith 3427273d9f13SBarry Smith Notes: 342849a6f317SBarry Smith If nnz is given then nz is ignored 342949a6f317SBarry Smith 3430273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3431273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3432273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3433273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3434273d9f13SBarry Smith 3435273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3436273d9f13SBarry Smith Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 3437273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3438273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 
3439273d9f13SBarry Smith 3440aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3441aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3442aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3443aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3444aa95bbe8SBarry Smith 3445a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3446a96a251dSBarry Smith entries or columns indices 3447a96a251dSBarry Smith 3448273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3449273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3450273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3451273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3452273d9f13SBarry Smith 3453273d9f13SBarry Smith Options Database Keys: 3454698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 3455698d4c6aSKris Buschelman . -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3456273d9f13SBarry Smith - -mat_aij_oneindex - Internally use indexing starting at 1 3457273d9f13SBarry Smith rather than 0. Note that when calling MatSetValues(), 3458273d9f13SBarry Smith the user still MUST index entries starting at 0! 
3459273d9f13SBarry Smith 3460273d9f13SBarry Smith Level: intermediate 3461273d9f13SBarry Smith 3462aa95bbe8SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3463273d9f13SBarry Smith 3464273d9f13SBarry Smith @*/ 34657087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3466273d9f13SBarry Smith { 34674ac538c5SBarry Smith PetscErrorCode ierr; 3468a23d5eceSKris Buschelman 3469a23d5eceSKris Buschelman PetscFunctionBegin; 34704ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3471a23d5eceSKris Buschelman PetscFunctionReturn(0); 3472a23d5eceSKris Buschelman } 3473a23d5eceSKris Buschelman 3474a23d5eceSKris Buschelman EXTERN_C_BEGIN 3475a23d5eceSKris Buschelman #undef __FUNCT__ 3476a23d5eceSKris Buschelman #define __FUNCT__ "MatSeqAIJSetPreallocation_SeqAIJ" 34777087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3478a23d5eceSKris Buschelman { 3479273d9f13SBarry Smith Mat_SeqAIJ *b; 3480ace3abfcSBarry Smith PetscBool skipallocation = PETSC_FALSE; 34816849ba73SBarry Smith PetscErrorCode ierr; 348297f1f81fSBarry Smith PetscInt i; 3483273d9f13SBarry Smith 3484273d9f13SBarry Smith PetscFunctionBegin; 3485d5d45c9bSBarry Smith 3486a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3487c461c341SBarry Smith skipallocation = PETSC_TRUE; 3488c461c341SBarry Smith nz = 0; 3489c461c341SBarry Smith } 3490c461c341SBarry Smith 349126283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->rmap,1);CHKERRQ(ierr); 349226283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->cmap,1);CHKERRQ(ierr); 349326283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 349426283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3495899cda47SBarry Smith 3496435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == 
PETSC_DECIDE) nz = 5; 3497e32f2f54SBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %d",nz); 3498b73539f3SBarry Smith if (nnz) { 3499d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 3500e32f2f54SBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %d value %d",i,nnz[i]); 3501e32f2f54SBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %d value %d rowlength %d",i,nnz[i],B->cmap->n); 3502b73539f3SBarry Smith } 3503b73539f3SBarry Smith } 3504b73539f3SBarry Smith 3505273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3506273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3507273d9f13SBarry Smith 3508ab93d7beSBarry Smith if (!skipallocation) { 35092ee49352SLisandro Dalcin if (!b->imax) { 3510d0f46423SBarry Smith ierr = PetscMalloc2(B->rmap->n,PetscInt,&b->imax,B->rmap->n,PetscInt,&b->ilen);CHKERRQ(ierr); 3511d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,2*B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 35122ee49352SLisandro Dalcin } 3513273d9f13SBarry Smith if (!nnz) { 3514435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3515c62bd62aSJed Brown else if (nz < 0) nz = 1; 3516d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3517d0f46423SBarry Smith nz = nz*B->rmap->n; 3518273d9f13SBarry Smith } else { 3519273d9f13SBarry Smith nz = 0; 3520d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz += nnz[i];} 3521273d9f13SBarry Smith } 3522ab93d7beSBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 3523d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { b->ilen[i] = 0; } 3524ab93d7beSBarry Smith 3525273d9f13SBarry Smith /* allocate the matrix space */ 35262ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3527d0f46423SBarry Smith ierr = PetscMalloc3(nz,PetscScalar,&b->a,nz,PetscInt,&b->j,B->rmap->n+1,PetscInt,&b->i);CHKERRQ(ierr); 3528d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3529bfeeae90SHong Zhang b->i[0] = 0; 3530d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 35315da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 35325da197adSKris Buschelman } 3533273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3534e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3535e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3536c461c341SBarry Smith } else { 3537e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3538e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3539c461c341SBarry Smith } 3540273d9f13SBarry Smith 3541273d9f13SBarry Smith b->nz = 0; 3542273d9f13SBarry Smith b->maxnz = nz; 3543273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 3544273d9f13SBarry Smith PetscFunctionReturn(0); 3545273d9f13SBarry Smith } 3546a23d5eceSKris Buschelman EXTERN_C_END 3547273d9f13SBarry Smith 3548a1661176SMatthew Knepley #undef __FUNCT__ 3549a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR" 355058d36128SBarry Smith /*@ 3551a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 3552a1661176SMatthew Knepley 3553a1661176SMatthew Knepley Input Parameters: 3554a1661176SMatthew Knepley + B - the matrix 3555a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 3556a1661176SMatthew Knepley . 
j - the column indices for each row (starts with zero) these must be sorted for each row 3557a1661176SMatthew Knepley - v - optional values in the matrix 3558a1661176SMatthew Knepley 3559a1661176SMatthew Knepley Level: developer 3560a1661176SMatthew Knepley 356158d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 356258d36128SBarry Smith 3563a1661176SMatthew Knepley .keywords: matrix, aij, compressed row, sparse, sequential 3564a1661176SMatthew Knepley 3565a1661176SMatthew Knepley .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), SeqAIJ 3566a1661176SMatthew Knepley @*/ 3567a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 3568a1661176SMatthew Knepley { 3569a1661176SMatthew Knepley PetscErrorCode ierr; 3570a1661176SMatthew Knepley 3571a1661176SMatthew Knepley PetscFunctionBegin; 35720700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 35734ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 3574a1661176SMatthew Knepley PetscFunctionReturn(0); 3575a1661176SMatthew Knepley } 3576a1661176SMatthew Knepley 3577a1661176SMatthew Knepley EXTERN_C_BEGIN 3578a1661176SMatthew Knepley #undef __FUNCT__ 3579a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR_SeqAIJ" 35807087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 3581a1661176SMatthew Knepley { 3582a1661176SMatthew Knepley PetscInt i; 3583a1661176SMatthew Knepley PetscInt m,n; 3584a1661176SMatthew Knepley PetscInt nz; 3585a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 3586a1661176SMatthew Knepley PetscScalar *values; 3587a1661176SMatthew Knepley PetscErrorCode ierr; 3588a1661176SMatthew 
Knepley 3589a1661176SMatthew Knepley PetscFunctionBegin; 3590a1661176SMatthew Knepley ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 3591a1661176SMatthew Knepley 359265e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 3593a1661176SMatthew Knepley ierr = PetscMalloc((m+1) * sizeof(PetscInt), &nnz);CHKERRQ(ierr); 3594a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3595b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 3596a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 359765e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 3598a1661176SMatthew Knepley nnz[i] = nz; 3599a1661176SMatthew Knepley } 3600a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 3601a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 3602a1661176SMatthew Knepley 3603a1661176SMatthew Knepley if (v) { 3604a1661176SMatthew Knepley values = (PetscScalar*) v; 3605a1661176SMatthew Knepley } else { 36060e83c824SBarry Smith ierr = PetscMalloc(nz_max*sizeof(PetscScalar), &values);CHKERRQ(ierr); 3607a1661176SMatthew Knepley ierr = PetscMemzero(values, nz_max*sizeof(PetscScalar));CHKERRQ(ierr); 3608a1661176SMatthew Knepley } 3609a1661176SMatthew Knepley 3610a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3611b7940d39SSatish Balay nz = Ii[i+1] - Ii[i]; 3612b7940d39SSatish Balay ierr = MatSetValues_SeqAIJ(B, 1, &i, nz, J+Ii[i], values + (v ? 
Ii[i] : 0), INSERT_VALUES);CHKERRQ(ierr); 3613a1661176SMatthew Knepley } 3614a1661176SMatthew Knepley 3615a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3616a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3617a1661176SMatthew Knepley 3618a1661176SMatthew Knepley if (!v) { 3619a1661176SMatthew Knepley ierr = PetscFree(values);CHKERRQ(ierr); 3620a1661176SMatthew Knepley } 3621a1661176SMatthew Knepley PetscFunctionReturn(0); 3622a1661176SMatthew Knepley } 3623a1661176SMatthew Knepley EXTERN_C_END 3624a1661176SMatthew Knepley 3625c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 3626c6db04a5SJed Brown #include <private/petscaxpy.h> 3627170fe5c8SBarry Smith 3628170fe5c8SBarry Smith #undef __FUNCT__ 3629170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultNumeric_SeqDense_SeqAIJ" 3630170fe5c8SBarry Smith /* 3631170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 3632170fe5c8SBarry Smith 3633170fe5c8SBarry Smith n p p 3634170fe5c8SBarry Smith ( ) ( ) ( ) 3635170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 3636170fe5c8SBarry Smith ( ) ( ) ( ) 3637170fe5c8SBarry Smith 3638170fe5c8SBarry Smith */ 3639170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 3640170fe5c8SBarry Smith { 3641170fe5c8SBarry Smith PetscErrorCode ierr; 3642170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 3643170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 3644170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 36451de00fd4SBarry Smith PetscInt i,n,m,q,p; 3646170fe5c8SBarry Smith const PetscInt *ii,*idx; 3647170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 3648170fe5c8SBarry Smith PetscScalar *c,*c_q; 3649170fe5c8SBarry Smith 3650170fe5c8SBarry Smith PetscFunctionBegin; 3651d0f46423SBarry Smith m = A->rmap->n; 3652d0f46423SBarry Smith n = A->cmap->n; 3653d0f46423SBarry Smith p = B->cmap->n; 
3654170fe5c8SBarry Smith a = sub_a->v; 3655170fe5c8SBarry Smith b = sub_b->a; 3656170fe5c8SBarry Smith c = sub_c->v; 3657170fe5c8SBarry Smith ierr = PetscMemzero(c,m*p*sizeof(PetscScalar));CHKERRQ(ierr); 3658170fe5c8SBarry Smith 3659170fe5c8SBarry Smith ii = sub_b->i; 3660170fe5c8SBarry Smith idx = sub_b->j; 3661170fe5c8SBarry Smith for (i=0; i<n; i++) { 3662170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 3663170fe5c8SBarry Smith while (q-->0) { 3664170fe5c8SBarry Smith c_q = c + m*(*idx); 3665170fe5c8SBarry Smith a_q = a + m*i; 3666be7314b0SBarry Smith PetscAXPY(c_q,*b,a_q,m); 3667170fe5c8SBarry Smith idx++; 3668170fe5c8SBarry Smith b++; 3669170fe5c8SBarry Smith } 3670170fe5c8SBarry Smith } 3671170fe5c8SBarry Smith PetscFunctionReturn(0); 3672170fe5c8SBarry Smith } 3673170fe5c8SBarry Smith 3674170fe5c8SBarry Smith #undef __FUNCT__ 3675170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultSymbolic_SeqDense_SeqAIJ" 3676170fe5c8SBarry Smith PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat *C) 3677170fe5c8SBarry Smith { 3678170fe5c8SBarry Smith PetscErrorCode ierr; 3679d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 3680170fe5c8SBarry Smith Mat Cmat; 3681170fe5c8SBarry Smith 3682170fe5c8SBarry Smith PetscFunctionBegin; 3683e32f2f54SBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %d != B->rmap->n %d\n",A->cmap->n,B->rmap->n); 368439804f7cSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,&Cmat);CHKERRQ(ierr); 3685170fe5c8SBarry Smith ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 3686170fe5c8SBarry Smith ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 3687170fe5c8SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 3688170fe5c8SBarry Smith Cmat->assembled = PETSC_TRUE; 3689170fe5c8SBarry Smith *C = Cmat; 3690170fe5c8SBarry Smith PetscFunctionReturn(0); 3691170fe5c8SBarry Smith } 3692170fe5c8SBarry Smith 3693170fe5c8SBarry Smith /* 
----------------------------------------------------------------*/ 3694170fe5c8SBarry Smith #undef __FUNCT__ 3695170fe5c8SBarry Smith #define __FUNCT__ "MatMatMult_SeqDense_SeqAIJ" 3696170fe5c8SBarry Smith PetscErrorCode MatMatMult_SeqDense_SeqAIJ(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 3697170fe5c8SBarry Smith { 3698170fe5c8SBarry Smith PetscErrorCode ierr; 3699170fe5c8SBarry Smith 3700170fe5c8SBarry Smith PetscFunctionBegin; 3701170fe5c8SBarry Smith if (scall == MAT_INITIAL_MATRIX){ 3702170fe5c8SBarry Smith ierr = MatMatMultSymbolic_SeqDense_SeqAIJ(A,B,fill,C);CHKERRQ(ierr); 3703170fe5c8SBarry Smith } 3704170fe5c8SBarry Smith ierr = MatMatMultNumeric_SeqDense_SeqAIJ(A,B,*C);CHKERRQ(ierr); 3705170fe5c8SBarry Smith PetscFunctionReturn(0); 3706170fe5c8SBarry Smith } 3707170fe5c8SBarry Smith 3708170fe5c8SBarry Smith 37090bad9183SKris Buschelman /*MC 3710fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 37110bad9183SKris Buschelman based on compressed sparse row format. 37120bad9183SKris Buschelman 37130bad9183SKris Buschelman Options Database Keys: 37140bad9183SKris Buschelman . 
-mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 37150bad9183SKris Buschelman 37160bad9183SKris Buschelman Level: beginner 37170bad9183SKris Buschelman 3718f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType 37190bad9183SKris Buschelman M*/ 37200bad9183SKris Buschelman 3721a6175056SHong Zhang EXTERN_C_BEGIN 3722b5e56a35SBarry Smith #if defined(PETSC_HAVE_PASTIX) 3723b5e56a35SBarry Smith extern PetscErrorCode MatGetFactor_seqaij_pastix(Mat,MatFactorType,Mat*); 3724b5e56a35SBarry Smith #endif 3725ce63c4c1SBarry Smith #if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128) 3726af1023dbSSatish Balay extern PetscErrorCode MatGetFactor_seqaij_essl(Mat,MatFactorType,Mat *); 3727af1023dbSSatish Balay #endif 37287087cfbeSBarry Smith extern PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 37297087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_petsc(Mat,MatFactorType,Mat*); 37307087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_bas(Mat,MatFactorType,Mat*); 37317087cfbeSBarry Smith extern PetscErrorCode MatGetFactorAvailable_seqaij_petsc(Mat,MatFactorType,PetscBool *); 3732611f576cSBarry Smith #if defined(PETSC_HAVE_MUMPS) 37337087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 3734611f576cSBarry Smith #endif 3735611f576cSBarry Smith #if defined(PETSC_HAVE_SUPERLU) 37367087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_superlu(Mat,MatFactorType,Mat*); 3737611f576cSBarry Smith #endif 3738f3c0ef26SHong Zhang #if defined(PETSC_HAVE_SUPERLU_DIST) 3739f3c0ef26SHong Zhang extern PetscErrorCode MatGetFactor_seqaij_superlu_dist(Mat,MatFactorType,Mat*); 3740f3c0ef26SHong Zhang #endif 3741611f576cSBarry Smith #if defined(PETSC_HAVE_SPOOLES) 37427087cfbeSBarry Smith extern PetscErrorCode 
MatGetFactor_seqaij_spooles(Mat,MatFactorType,Mat*); 3743611f576cSBarry Smith #endif 3744eb3b5408SSatish Balay #if defined(PETSC_HAVE_UMFPACK) 37457087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_umfpack(Mat,MatFactorType,Mat*); 3746eb3b5408SSatish Balay #endif 3747586621ddSJed Brown #if defined(PETSC_HAVE_CHOLMOD) 37487087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_cholmod(Mat,MatFactorType,Mat*); 3749586621ddSJed Brown #endif 3750719d5645SBarry Smith #if defined(PETSC_HAVE_LUSOL) 37517087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_lusol(Mat,MatFactorType,Mat*); 3752719d5645SBarry Smith #endif 3753b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 37547087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_matlab(Mat,MatFactorType,Mat*); 37557087cfbeSBarry Smith extern PetscErrorCode MatlabEnginePut_SeqAIJ(PetscObject,void*); 37567087cfbeSBarry Smith extern PetscErrorCode MatlabEngineGet_SeqAIJ(PetscObject,void*); 3757b3866ffcSBarry Smith #endif 375817667f90SBarry Smith EXTERN_C_END 375917667f90SBarry Smith 376017667f90SBarry Smith EXTERN_C_BEGIN 37614a2ae208SSatish Balay #undef __FUNCT__ 37624a2ae208SSatish Balay #define __FUNCT__ "MatCreate_SeqAIJ" 37637087cfbeSBarry Smith PetscErrorCode MatCreate_SeqAIJ(Mat B) 3764273d9f13SBarry Smith { 3765273d9f13SBarry Smith Mat_SeqAIJ *b; 3766dfbe8321SBarry Smith PetscErrorCode ierr; 376738baddfdSBarry Smith PetscMPIInt size; 3768273d9f13SBarry Smith 3769273d9f13SBarry Smith PetscFunctionBegin; 37707adad957SLisandro Dalcin ierr = MPI_Comm_size(((PetscObject)B)->comm,&size);CHKERRQ(ierr); 3771e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 3772273d9f13SBarry Smith 377338f2d2fdSLisandro Dalcin ierr = PetscNewLog(B,Mat_SeqAIJ,&b);CHKERRQ(ierr); 3774b0a32e0cSBarry Smith B->data = (void*)b; 3775549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 
3776416022c9SBarry Smith b->row = 0; 3777416022c9SBarry Smith b->col = 0; 377882bf6240SBarry Smith b->icol = 0; 3779b810aeb4SBarry Smith b->reallocs = 0; 378036db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 3781f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 3782416022c9SBarry Smith b->nonew = 0; 3783416022c9SBarry Smith b->diag = 0; 3784416022c9SBarry Smith b->solve_work = 0; 37852a1b7f2aSHong Zhang B->spptr = 0; 3786be6bf707SBarry Smith b->saved_values = 0; 3787d7f994e1SBarry Smith b->idiag = 0; 378871f1c65dSBarry Smith b->mdiag = 0; 378971f1c65dSBarry Smith b->ssor_work = 0; 379071f1c65dSBarry Smith b->omega = 1.0; 379171f1c65dSBarry Smith b->fshift = 0.0; 379271f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 3793bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 3794a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 3795a30b2313SHong Zhang b->xtoy = 0; 3796a30b2313SHong Zhang b->XtoY = 0; 379788e51ccdSHong Zhang B->same_nonzero = PETSC_FALSE; 379817ab2063SBarry Smith 379935d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 3800b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 3801700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_matlab_C","MatGetFactor_seqaij_matlab",MatGetFactor_seqaij_matlab);CHKERRQ(ierr); 3802b3866ffcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEnginePut_C","MatlabEnginePut_SeqAIJ",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 3803b3866ffcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEngineGet_C","MatlabEngineGet_SeqAIJ",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 3804b3866ffcSBarry Smith #endif 3805b5e56a35SBarry Smith #if defined(PETSC_HAVE_PASTIX) 3806700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_pastix_C","MatGetFactor_seqaij_pastix",MatGetFactor_seqaij_pastix);CHKERRQ(ierr); 3807b5e56a35SBarry Smith #endif 3808ce63c4c1SBarry 
Smith #if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128) 3809700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_essl_C","MatGetFactor_seqaij_essl",MatGetFactor_seqaij_essl);CHKERRQ(ierr); 3810719d5645SBarry Smith #endif 3811611f576cSBarry Smith #if defined(PETSC_HAVE_SUPERLU) 3812700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_C","MatGetFactor_seqaij_superlu",MatGetFactor_seqaij_superlu);CHKERRQ(ierr); 3813611f576cSBarry Smith #endif 3814f3c0ef26SHong Zhang #if defined(PETSC_HAVE_SUPERLU_DIST) 3815700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_dist_C","MatGetFactor_seqaij_superlu_dist",MatGetFactor_seqaij_superlu_dist);CHKERRQ(ierr); 3816f3c0ef26SHong Zhang #endif 3817611f576cSBarry Smith #if defined(PETSC_HAVE_SPOOLES) 3818700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_spooles_C","MatGetFactor_seqaij_spooles",MatGetFactor_seqaij_spooles);CHKERRQ(ierr); 3819611f576cSBarry Smith #endif 3820611f576cSBarry Smith #if defined(PETSC_HAVE_MUMPS) 3821700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_mumps_C","MatGetFactor_aij_mumps",MatGetFactor_aij_mumps);CHKERRQ(ierr); 3822611f576cSBarry Smith #endif 3823eb3b5408SSatish Balay #if defined(PETSC_HAVE_UMFPACK) 3824700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_umfpack_C","MatGetFactor_seqaij_umfpack",MatGetFactor_seqaij_umfpack);CHKERRQ(ierr); 3825eb3b5408SSatish Balay #endif 3826586621ddSJed Brown #if defined(PETSC_HAVE_CHOLMOD) 3827700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_cholmod_C","MatGetFactor_seqaij_cholmod",MatGetFactor_seqaij_cholmod);CHKERRQ(ierr); 3828586621ddSJed Brown #endif 3829719d5645SBarry Smith #if 
defined(PETSC_HAVE_LUSOL) 3830700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_lusol_C","MatGetFactor_seqaij_lusol",MatGetFactor_seqaij_lusol);CHKERRQ(ierr); 3831719d5645SBarry Smith #endif 3832700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_petsc_C","MatGetFactor_seqaij_petsc",MatGetFactor_seqaij_petsc);CHKERRQ(ierr); 3833700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactorAvailable_petsc_C","MatGetFactorAvailable_seqaij_petsc",MatGetFactorAvailable_seqaij_petsc);CHKERRQ(ierr); 3834700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_bas_C","MatGetFactor_seqaij_bas",MatGetFactor_seqaij_bas);CHKERRQ(ierr); 3835700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetColumnIndices_C","MatSeqAIJSetColumnIndices_SeqAIJ",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 3836700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatStoreValues_C","MatStoreValues_SeqAIJ",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 3837700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatRetrieveValues_C","MatRetrieveValues_SeqAIJ",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 3838700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqsbaij_C","MatConvert_SeqAIJ_SeqSBAIJ",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 3839700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqbaij_C","MatConvert_SeqAIJ_SeqBAIJ",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 3840700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijperm_C","MatConvert_SeqAIJ_SeqAIJPERM",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 3841700c5bfcSBarry Smith ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C","MatConvert_SeqAIJ_SeqAIJCRL",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 3842700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsTranspose_C","MatIsTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 3843700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsHermitianTranspose_C","MatIsHermitianTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 3844700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocation_C","MatSeqAIJSetPreallocation_SeqAIJ",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 3845700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C","MatSeqAIJSetPreallocationCSR_SeqAIJ",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 3846700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatReorderForNonzeroDiagonal_C","MatReorderForNonzeroDiagonal_SeqAIJ",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 3847700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMult_seqdense_seqaij_C","MatMatMult_SeqDense_SeqAIJ",MatMatMult_SeqDense_SeqAIJ);CHKERRQ(ierr); 3848700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C","MatMatMultSymbolic_SeqDense_SeqAIJ",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr); 3849700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C","MatMatMultNumeric_SeqDense_SeqAIJ",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr); 38504108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 385117667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 38523a40ed3dSBarry Smith PetscFunctionReturn(0); 385317ab2063SBarry Smith } 3854273d9f13SBarry Smith EXTERN_C_END 
385517ab2063SBarry Smith 3856ff34cdc8SBarry Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 385751d315f7SKerry Stevens EXTERN_C_BEGIN 385851d315f7SKerry Stevens #undef __FUNCT__ 38597d6a0e61SBarry Smith #define __FUNCT__ "MatCreate_SeqAIJPThread" 38607d6a0e61SBarry Smith PetscErrorCode MatCreate_SeqAIJPThread(Mat B) 386151d315f7SKerry Stevens { 386251d315f7SKerry Stevens PetscErrorCode ierr; 386351d315f7SKerry Stevens 386451d315f7SKerry Stevens PetscFunctionBegin; 386551d315f7SKerry Stevens ierr = MatCreate_SeqAIJ(B); 386651d315f7SKerry Stevens ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 38677d6a0e61SBarry Smith B->ops->mult = MatMult_SeqAIJPThread; 38687d6a0e61SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJPTHREAD);CHKERRQ(ierr); 386951d315f7SKerry Stevens PetscFunctionReturn(0); 387051d315f7SKerry Stevens } 387151d315f7SKerry Stevens EXTERN_C_END 3872ba61063dSBarry Smith #endif 387351d315f7SKerry Stevens 38744a2ae208SSatish Balay #undef __FUNCT__ 3875b24902e0SBarry Smith #define __FUNCT__ "MatDuplicateNoCreate_SeqAIJ" 3876b24902e0SBarry Smith /* 3877b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 3878b24902e0SBarry Smith */ 3879ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 388017ab2063SBarry Smith { 3881416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 38826849ba73SBarry Smith PetscErrorCode ierr; 3883d0f46423SBarry Smith PetscInt i,m = A->rmap->n; 388417ab2063SBarry Smith 38853a40ed3dSBarry Smith PetscFunctionBegin; 3886273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 3887273d9f13SBarry Smith 3888d5f3da31SBarry Smith C->factortype = A->factortype; 3889416022c9SBarry Smith c->row = 0; 3890416022c9SBarry Smith c->col = 0; 389182bf6240SBarry Smith c->icol = 0; 38926ad4291fSHong Zhang c->reallocs = 0; 389317ab2063SBarry Smith 38946ad4291fSHong Zhang 
C->assembled = PETSC_TRUE; 389517ab2063SBarry Smith 3896aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 3897aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 3898eec197d1SBarry Smith 389933b91e9fSSatish Balay ierr = PetscMalloc2(m,PetscInt,&c->imax,m,PetscInt,&c->ilen);CHKERRQ(ierr); 39009518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 390117ab2063SBarry Smith for (i=0; i<m; i++) { 3902416022c9SBarry Smith c->imax[i] = a->imax[i]; 3903416022c9SBarry Smith c->ilen[i] = a->ilen[i]; 390417ab2063SBarry Smith } 390517ab2063SBarry Smith 390617ab2063SBarry Smith /* allocate the matrix space */ 3907f77e22a1SHong Zhang if (mallocmatspace){ 3908a96a251dSBarry Smith ierr = PetscMalloc3(a->i[m],PetscScalar,&c->a,a->i[m],PetscInt,&c->j,m+1,PetscInt,&c->i);CHKERRQ(ierr); 39099518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 3910f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 391197f1f81fSBarry Smith ierr = PetscMemcpy(c->i,a->i,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 391217ab2063SBarry Smith if (m > 0) { 391397f1f81fSBarry Smith ierr = PetscMemcpy(c->j,a->j,(a->i[m])*sizeof(PetscInt));CHKERRQ(ierr); 3914be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 3915bfeeae90SHong Zhang ierr = PetscMemcpy(c->a,a->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 3916be6bf707SBarry Smith } else { 3917bfeeae90SHong Zhang ierr = PetscMemzero(c->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 391817ab2063SBarry Smith } 391908480c60SBarry Smith } 3920f77e22a1SHong Zhang } 392117ab2063SBarry Smith 39226ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 3923416022c9SBarry Smith c->roworiented = a->roworiented; 3924416022c9SBarry Smith c->nonew = a->nonew; 3925416022c9SBarry Smith if (a->diag) { 392697f1f81fSBarry Smith ierr = 
PetscMalloc((m+1)*sizeof(PetscInt),&c->diag);CHKERRQ(ierr); 392752e6d16bSBarry Smith ierr = PetscLogObjectMemory(C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 392817ab2063SBarry Smith for (i=0; i<m; i++) { 3929416022c9SBarry Smith c->diag[i] = a->diag[i]; 393017ab2063SBarry Smith } 39313a40ed3dSBarry Smith } else c->diag = 0; 39326ad4291fSHong Zhang c->solve_work = 0; 39336ad4291fSHong Zhang c->saved_values = 0; 39346ad4291fSHong Zhang c->idiag = 0; 393571f1c65dSBarry Smith c->ssor_work = 0; 3936a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 3937e6b907acSBarry Smith c->free_a = PETSC_TRUE; 3938e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 39396ad4291fSHong Zhang c->xtoy = 0; 39406ad4291fSHong Zhang c->XtoY = 0; 39416ad4291fSHong Zhang 3942416022c9SBarry Smith c->nz = a->nz; 39438ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 3944273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 3945754ec7b1SSatish Balay 39466ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 39476ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 3948cd6b891eSBarry Smith c->compressedrow.check = a->compressedrow.check; 3949cd6b891eSBarry Smith if (a->compressedrow.use){ 39506ad4291fSHong Zhang i = a->compressedrow.nrows; 39510e83c824SBarry Smith ierr = PetscMalloc2(i+1,PetscInt,&c->compressedrow.i,i,PetscInt,&c->compressedrow.rindex);CHKERRQ(ierr); 39526ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.i,a->compressedrow.i,(i+1)*sizeof(PetscInt));CHKERRQ(ierr); 39536ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.rindex,a->compressedrow.rindex,i*sizeof(PetscInt));CHKERRQ(ierr); 395427ea64f8SHong Zhang } else { 395527ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 395627ea64f8SHong Zhang c->compressedrow.i = PETSC_NULL; 395727ea64f8SHong Zhang c->compressedrow.rindex = PETSC_NULL; 39586ad4291fSHong Zhang } 395988e51ccdSHong Zhang C->same_nonzero = A->same_nonzero; 39604108e4d5SBarry Smith 
ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 39614846f1f5SKris Buschelman 39627adad957SLisandro Dalcin ierr = PetscFListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 39633a40ed3dSBarry Smith PetscFunctionReturn(0); 396417ab2063SBarry Smith } 396517ab2063SBarry Smith 39664a2ae208SSatish Balay #undef __FUNCT__ 3967b24902e0SBarry Smith #define __FUNCT__ "MatDuplicate_SeqAIJ" 3968b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 3969b24902e0SBarry Smith { 3970b24902e0SBarry Smith PetscErrorCode ierr; 3971b24902e0SBarry Smith 3972b24902e0SBarry Smith PetscFunctionBegin; 3973b24902e0SBarry Smith ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 39744b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 3975b24902e0SBarry Smith ierr = MatSetType(*B,MATSEQAIJ);CHKERRQ(ierr); 3976f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 3977b24902e0SBarry Smith PetscFunctionReturn(0); 3978b24902e0SBarry Smith } 3979b24902e0SBarry Smith 3980b24902e0SBarry Smith #undef __FUNCT__ 39814a2ae208SSatish Balay #define __FUNCT__ "MatLoad_SeqAIJ" 3982112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 3983fbdbba38SShri Abhyankar { 3984fbdbba38SShri Abhyankar Mat_SeqAIJ *a; 3985fbdbba38SShri Abhyankar PetscErrorCode ierr; 3986fbdbba38SShri Abhyankar PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N,rows,cols; 3987fbdbba38SShri Abhyankar int fd; 3988fbdbba38SShri Abhyankar PetscMPIInt size; 3989fbdbba38SShri Abhyankar MPI_Comm comm; 3990bbead8a2SBarry Smith PetscInt bs = 1; 3991fbdbba38SShri Abhyankar 3992fbdbba38SShri Abhyankar PetscFunctionBegin; 3993fbdbba38SShri Abhyankar ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 3994fbdbba38SShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 3995fbdbba38SShri Abhyankar if (size > 1) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"view must have one processor"); 3996bbead8a2SBarry Smith 3997bbead8a2SBarry Smith ierr = PetscOptionsBegin(comm,PETSC_NULL,"Options for loading SEQAIJ matrix","Mat");CHKERRQ(ierr); 3998bbead8a2SBarry Smith ierr = PetscOptionsInt("-matload_block_size","Set the blocksize used to store the matrix","MatLoad",bs,&bs,PETSC_NULL);CHKERRQ(ierr); 3999bbead8a2SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 4000bbead8a2SBarry Smith 4001fbdbba38SShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 4002fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 4003fbdbba38SShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 4004fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 4005fbdbba38SShri Abhyankar 4006bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 4007fbdbba38SShri Abhyankar 4008fbdbba38SShri Abhyankar /* read in row lengths */ 4009fbdbba38SShri Abhyankar ierr = PetscMalloc(M*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 4010fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 4011fbdbba38SShri Abhyankar 4012fbdbba38SShri Abhyankar /* check if sum of rowlengths is same as nz */ 4013fbdbba38SShri Abhyankar for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 4014fbdbba38SShri Abhyankar if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. 
no-nonzeros = %d, sum-row-lengths = %d\n",nz,sum); 4015fbdbba38SShri Abhyankar 4016fbdbba38SShri Abhyankar /* set global size if not set already*/ 4017f501eaabSShri Abhyankar if (newMat->rmap->n < 0 && newMat->rmap->N < 0 && newMat->cmap->n < 0 && newMat->cmap->N < 0) { 4018fbdbba38SShri Abhyankar ierr = MatSetSizes(newMat,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 4019aabbc4fbSShri Abhyankar } else { 4020fbdbba38SShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 4021fbdbba38SShri Abhyankar ierr = MatGetSize(newMat,&rows,&cols);CHKERRQ(ierr); 40224c5b953cSHong Zhang if (rows < 0 && cols < 0){ /* user might provide local size instead of global size */ 40234c5b953cSHong Zhang ierr = MatGetLocalSize(newMat,&rows,&cols);CHKERRQ(ierr); 40244c5b953cSHong Zhang } 4025f501eaabSShri Abhyankar if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 4026aabbc4fbSShri Abhyankar } 4027fbdbba38SShri Abhyankar ierr = MatSeqAIJSetPreallocation_SeqAIJ(newMat,0,rowlengths);CHKERRQ(ierr); 4028fbdbba38SShri Abhyankar a = (Mat_SeqAIJ*)newMat->data; 4029fbdbba38SShri Abhyankar 4030fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->j,nz,PETSC_INT);CHKERRQ(ierr); 4031fbdbba38SShri Abhyankar 4032fbdbba38SShri Abhyankar /* read in nonzero values */ 4033fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 4034fbdbba38SShri Abhyankar 4035fbdbba38SShri Abhyankar /* set matrix "i" values */ 4036fbdbba38SShri Abhyankar a->i[0] = 0; 4037fbdbba38SShri Abhyankar for (i=1; i<= M; i++) { 4038fbdbba38SShri Abhyankar a->i[i] = a->i[i-1] + rowlengths[i-1]; 4039fbdbba38SShri Abhyankar a->ilen[i-1] = rowlengths[i-1]; 4040fbdbba38SShri Abhyankar } 4041fbdbba38SShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 4042fbdbba38SShri Abhyankar 4043fbdbba38SShri Abhyankar ierr = 
MatAssemblyBegin(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4044fbdbba38SShri Abhyankar ierr = MatAssemblyEnd(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4045bbead8a2SBarry Smith if (bs > 1) {ierr = MatSetBlockSize(newMat,bs);CHKERRQ(ierr);} 4046fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4047fbdbba38SShri Abhyankar } 4048fbdbba38SShri Abhyankar 4049fbdbba38SShri Abhyankar #undef __FUNCT__ 4050b9617806SBarry Smith #define __FUNCT__ "MatEqual_SeqAIJ" 4051ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 40527264ac53SSatish Balay { 40537264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data,*b = (Mat_SeqAIJ *)B->data; 4054dfbe8321SBarry Smith PetscErrorCode ierr; 4055eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4056eeffb40dSHong Zhang PetscInt k; 4057eeffb40dSHong Zhang #endif 40587264ac53SSatish Balay 40593a40ed3dSBarry Smith PetscFunctionBegin; 4060bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4061d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4062ca44d042SBarry Smith *flg = PETSC_FALSE; 4063ca44d042SBarry Smith PetscFunctionReturn(0); 4064bcd2baecSBarry Smith } 40657264ac53SSatish Balay 40667264ac53SSatish Balay /* if the a->i are the same */ 4067d0f46423SBarry Smith ierr = PetscMemcmp(a->i,b->i,(A->rmap->n+1)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4068abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 40697264ac53SSatish Balay 40707264ac53SSatish Balay /* if a->j are the same */ 407197f1f81fSBarry Smith ierr = PetscMemcmp(a->j,b->j,(a->nz)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4072abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4073bcd2baecSBarry Smith 4074bcd2baecSBarry Smith /* if a->a are the same */ 4075eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4076eeffb40dSHong Zhang for (k=0; k<a->nz; k++){ 4077eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != 
PetscImaginaryPart(b->a[k])){ 4078eeffb40dSHong Zhang *flg = PETSC_FALSE; 40793a40ed3dSBarry Smith PetscFunctionReturn(0); 4080eeffb40dSHong Zhang } 4081eeffb40dSHong Zhang } 4082eeffb40dSHong Zhang #else 4083eeffb40dSHong Zhang ierr = PetscMemcmp(a->a,b->a,(a->nz)*sizeof(PetscScalar),flg);CHKERRQ(ierr); 4084eeffb40dSHong Zhang #endif 4085eeffb40dSHong Zhang PetscFunctionReturn(0); 40867264ac53SSatish Balay } 408736db0b34SBarry Smith 40884a2ae208SSatish Balay #undef __FUNCT__ 40894a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJWithArrays" 409005869f15SSatish Balay /*@ 409136db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 409236db0b34SBarry Smith provided by the user. 409336db0b34SBarry Smith 4094c75a6043SHong Zhang Collective on MPI_Comm 409536db0b34SBarry Smith 409636db0b34SBarry Smith Input Parameters: 409736db0b34SBarry Smith + comm - must be an MPI communicator of size 1 409836db0b34SBarry Smith . m - number of rows 409936db0b34SBarry Smith . n - number of columns 410036db0b34SBarry Smith . i - row indices 410136db0b34SBarry Smith . j - column indices 410236db0b34SBarry Smith - a - matrix values 410336db0b34SBarry Smith 410436db0b34SBarry Smith Output Parameter: 410536db0b34SBarry Smith . mat - the matrix 410636db0b34SBarry Smith 410736db0b34SBarry Smith Level: intermediate 410836db0b34SBarry Smith 410936db0b34SBarry Smith Notes: 41100551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4111292fb18eSBarry Smith once the matrix is destroyed and not before 411236db0b34SBarry Smith 411336db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 
411436db0b34SBarry Smith 4115bfeeae90SHong Zhang The i and j indices are 0 based 411636db0b34SBarry Smith 4117a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4118a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 4119a4552177SSatish Balay as shown: 4120a4552177SSatish Balay 4121a4552177SSatish Balay 1 0 0 4122a4552177SSatish Balay 2 0 3 4123a4552177SSatish Balay 4 5 6 4124a4552177SSatish Balay 4125a4552177SSatish Balay i = {0,1,3,6} [size = nrow+1 = 3+1] 41269985e31cSBarry Smith j = {0,0,2,0,1,2} [size = nz = 6]; values must be sorted for each row 4127a4552177SSatish Balay v = {1,2,3,4,5,6} [size = nz = 6] 4128a4552177SSatish Balay 41299985e31cSBarry Smith 41302fb0ec9aSBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 413136db0b34SBarry Smith 413236db0b34SBarry Smith @*/ 41337087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt* i,PetscInt*j,PetscScalar *a,Mat *mat) 413436db0b34SBarry Smith { 4135dfbe8321SBarry Smith PetscErrorCode ierr; 4136cbcfb4deSHong Zhang PetscInt ii; 413736db0b34SBarry Smith Mat_SeqAIJ *aij; 4138cbcfb4deSHong Zhang #if defined(PETSC_USE_DEBUG) 4139cbcfb4deSHong Zhang PetscInt jj; 4140cbcfb4deSHong Zhang #endif 414136db0b34SBarry Smith 414236db0b34SBarry Smith PetscFunctionBegin; 4143a96a251dSBarry Smith if (i[0]) { 4144e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 414536db0b34SBarry Smith } 4146f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4147f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4148ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4149ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4150ab93d7beSBarry Smith aij = 
(Mat_SeqAIJ*)(*mat)->data; 4151ab93d7beSBarry Smith ierr = PetscMalloc2(m,PetscInt,&aij->imax,m,PetscInt,&aij->ilen);CHKERRQ(ierr); 4152ab93d7beSBarry Smith 415336db0b34SBarry Smith aij->i = i; 415436db0b34SBarry Smith aij->j = j; 415536db0b34SBarry Smith aij->a = a; 415636db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 415736db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4158e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4159e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 416036db0b34SBarry Smith 416136db0b34SBarry Smith for (ii=0; ii<m; ii++) { 416236db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 41632515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 4164e32f2f54SBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %d length = %d",ii,i[ii+1] - i[ii]); 41659985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4166e32f2f54SBarry Smith if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4167e32f2f54SBarry Smith if (j[jj] == j[jj]-1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 41689985e31cSBarry Smith } 416936db0b34SBarry Smith #endif 417036db0b34SBarry Smith } 41712515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 417236db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 4173e32f2f54SBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %d index = %d",ii,j[ii]); 4174e32f2f54SBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %d index = %d",ii,j[ii]); 417536db0b34SBarry Smith } 417636db0b34SBarry Smith #endif 417736db0b34SBarry Smith 
4178b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4179b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 418036db0b34SBarry Smith PetscFunctionReturn(0); 418136db0b34SBarry Smith } 418236db0b34SBarry Smith 4183cc8ba8e1SBarry Smith #undef __FUNCT__ 4184ee4f033dSBarry Smith #define __FUNCT__ "MatSetColoring_SeqAIJ" 4185dfbe8321SBarry Smith PetscErrorCode MatSetColoring_SeqAIJ(Mat A,ISColoring coloring) 4186cc8ba8e1SBarry Smith { 4187dfbe8321SBarry Smith PetscErrorCode ierr; 4188cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 418936db0b34SBarry Smith 4190cc8ba8e1SBarry Smith PetscFunctionBegin; 41918ee2e534SBarry Smith if (coloring->ctype == IS_COLORING_GLOBAL) { 4192cc8ba8e1SBarry Smith ierr = ISColoringReference(coloring);CHKERRQ(ierr); 4193cc8ba8e1SBarry Smith a->coloring = coloring; 419412c595b3SBarry Smith } else if (coloring->ctype == IS_COLORING_GHOSTED) { 419597f1f81fSBarry Smith PetscInt i,*larray; 419612c595b3SBarry Smith ISColoring ocoloring; 419708b6dcc0SBarry Smith ISColoringValue *colors; 419812c595b3SBarry Smith 419912c595b3SBarry Smith /* set coloring for diagonal portion */ 42000e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(PetscInt),&larray);CHKERRQ(ierr); 4201d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 420212c595b3SBarry Smith larray[i] = i; 420312c595b3SBarry Smith } 4204992144d0SBarry Smith ierr = ISGlobalToLocalMappingApply(A->cmap->mapping,IS_GTOLM_MASK,A->cmap->n,larray,PETSC_NULL,larray);CHKERRQ(ierr); 42050e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 4206d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 420712c595b3SBarry Smith colors[i] = coloring->colors[larray[i]]; 420812c595b3SBarry Smith } 420912c595b3SBarry Smith ierr = PetscFree(larray);CHKERRQ(ierr); 4210d0f46423SBarry Smith ierr = ISColoringCreate(PETSC_COMM_SELF,coloring->n,A->cmap->n,colors,&ocoloring);CHKERRQ(ierr); 
421112c595b3SBarry Smith a->coloring = ocoloring; 421212c595b3SBarry Smith } 4213cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4214cc8ba8e1SBarry Smith } 4215cc8ba8e1SBarry Smith 4216dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 4217ee4f033dSBarry Smith EXTERN_C_BEGIN 4218c6db04a5SJed Brown #include <adic/ad_utils.h> 4219ee4f033dSBarry Smith EXTERN_C_END 4220cc8ba8e1SBarry Smith 4221cc8ba8e1SBarry Smith #undef __FUNCT__ 4222ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdic_SeqAIJ" 4223dfbe8321SBarry Smith PetscErrorCode MatSetValuesAdic_SeqAIJ(Mat A,void *advalues) 4224cc8ba8e1SBarry Smith { 4225cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4226d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j,nlen; 42274440f671SBarry Smith PetscScalar *v = a->a,*values = ((PetscScalar*)advalues)+1; 422808b6dcc0SBarry Smith ISColoringValue *color; 4229cc8ba8e1SBarry Smith 4230cc8ba8e1SBarry Smith PetscFunctionBegin; 4231e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 42324440f671SBarry Smith nlen = PetscADGetDerivTypeSize()/sizeof(PetscScalar); 4233cc8ba8e1SBarry Smith color = a->coloring->colors; 4234cc8ba8e1SBarry Smith /* loop over rows */ 4235cc8ba8e1SBarry Smith for (i=0; i<m; i++) { 4236cc8ba8e1SBarry Smith nz = ii[i+1] - ii[i]; 4237cc8ba8e1SBarry Smith /* loop over columns putting computed value into matrix */ 4238cc8ba8e1SBarry Smith for (j=0; j<nz; j++) { 4239cc8ba8e1SBarry Smith *v++ = values[color[*jj++]]; 4240cc8ba8e1SBarry Smith } 42414440f671SBarry Smith values += nlen; /* jump to next row of derivatives */ 4242ee4f033dSBarry Smith } 4243ee4f033dSBarry Smith PetscFunctionReturn(0); 4244ee4f033dSBarry Smith } 4245ee4f033dSBarry Smith #endif 4246ee4f033dSBarry Smith 4247ee4f033dSBarry Smith #undef __FUNCT__ 4248ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdifor_SeqAIJ" 424997f1f81fSBarry Smith PetscErrorCode MatSetValuesAdifor_SeqAIJ(Mat 
A,PetscInt nl,void *advalues) 4250ee4f033dSBarry Smith { 4251ee4f033dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4252d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j; 425354f21887SBarry Smith MatScalar *v = a->a; 425454f21887SBarry Smith PetscScalar *values = (PetscScalar *)advalues; 425508b6dcc0SBarry Smith ISColoringValue *color; 4256ee4f033dSBarry Smith 4257ee4f033dSBarry Smith PetscFunctionBegin; 4258e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 4259ee4f033dSBarry Smith color = a->coloring->colors; 4260ee4f033dSBarry Smith /* loop over rows */ 4261ee4f033dSBarry Smith for (i=0; i<m; i++) { 4262ee4f033dSBarry Smith nz = ii[i+1] - ii[i]; 4263ee4f033dSBarry Smith /* loop over columns putting computed value into matrix */ 4264ee4f033dSBarry Smith for (j=0; j<nz; j++) { 4265ee4f033dSBarry Smith *v++ = values[color[*jj++]]; 4266ee4f033dSBarry Smith } 4267ee4f033dSBarry Smith values += nl; /* jump to next row of derivatives */ 4268cc8ba8e1SBarry Smith } 4269cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4270cc8ba8e1SBarry Smith } 427136db0b34SBarry Smith 427281824310SBarry Smith /* 427381824310SBarry Smith Special version for direct calls from Fortran 427481824310SBarry Smith */ 4275c6db04a5SJed Brown #include <private/fortranimpl.h> 427681824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 427781824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 427881824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 427981824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 428081824310SBarry Smith #endif 428181824310SBarry Smith 428281824310SBarry Smith /* Change these macros so can be used in void function */ 428381824310SBarry Smith #undef CHKERRQ 42847adad957SLisandro Dalcin #define CHKERRQ(ierr) CHKERRABORT(((PetscObject)A)->comm,ierr) 428581824310SBarry Smith #undef SETERRQ2 4286e32f2f54SBarry Smith #define 
SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 428781824310SBarry Smith 428881824310SBarry Smith EXTERN_C_BEGIN 428981824310SBarry Smith #undef __FUNCT__ 429081824310SBarry Smith #define __FUNCT__ "matsetvaluesseqaij_" 42911f6cc5b2SSatish Balay void PETSC_STDCALL matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 429281824310SBarry Smith { 429381824310SBarry Smith Mat A = *AA; 429481824310SBarry Smith PetscInt m = *mm, n = *nn; 429581824310SBarry Smith InsertMode is = *isis; 429681824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 429781824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 429881824310SBarry Smith PetscInt *imax,*ai,*ailen; 429981824310SBarry Smith PetscErrorCode ierr; 430081824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 430154f21887SBarry Smith MatScalar *ap,value,*aa; 4302ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 4303ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 430481824310SBarry Smith 430581824310SBarry Smith PetscFunctionBegin; 4306d9e2c085SLisandro Dalcin ierr = MatPreallocated(A);CHKERRQ(ierr); 430781824310SBarry Smith imax = a->imax; 430881824310SBarry Smith ai = a->i; 430981824310SBarry Smith ailen = a->ilen; 431081824310SBarry Smith aj = a->j; 431181824310SBarry Smith aa = a->a; 431281824310SBarry Smith 431381824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 431481824310SBarry Smith row = im[k]; 431581824310SBarry Smith if (row < 0) continue; 431681824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4317d0f46423SBarry Smith if (row >= A->rmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 431881824310SBarry Smith #endif 431981824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 432081824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 432181824310SBarry Smith low = 0; 432281824310SBarry 
Smith high = nrow; 432381824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 432481824310SBarry Smith if (in[l] < 0) continue; 432581824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4326d0f46423SBarry Smith if (in[l] >= A->cmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 432781824310SBarry Smith #endif 432881824310SBarry Smith col = in[l]; 432981824310SBarry Smith if (roworiented) { 433081824310SBarry Smith value = v[l + k*n]; 433181824310SBarry Smith } else { 433281824310SBarry Smith value = v[k + l*m]; 433381824310SBarry Smith } 433481824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 433581824310SBarry Smith 433681824310SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 433781824310SBarry Smith lastcol = col; 433881824310SBarry Smith while (high-low > 5) { 433981824310SBarry Smith t = (low+high)/2; 434081824310SBarry Smith if (rp[t] > col) high = t; 434181824310SBarry Smith else low = t; 434281824310SBarry Smith } 434381824310SBarry Smith for (i=low; i<high; i++) { 434481824310SBarry Smith if (rp[i] > col) break; 434581824310SBarry Smith if (rp[i] == col) { 434681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 434781824310SBarry Smith else ap[i] = value; 434881824310SBarry Smith goto noinsert; 434981824310SBarry Smith } 435081824310SBarry Smith } 435181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 435281824310SBarry Smith if (nonew == 1) goto noinsert; 43537adad957SLisandro Dalcin if (nonew == -1) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 4354fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 435581824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 435681824310SBarry Smith /* shift up all the later entries in this row */ 435781824310SBarry Smith for (ii=N; ii>=i; ii--) { 435881824310SBarry Smith 
rp[ii+1] = rp[ii]; 435981824310SBarry Smith ap[ii+1] = ap[ii]; 436081824310SBarry Smith } 436181824310SBarry Smith rp[i] = col; 436281824310SBarry Smith ap[i] = value; 436381824310SBarry Smith noinsert:; 436481824310SBarry Smith low = i + 1; 436581824310SBarry Smith } 436681824310SBarry Smith ailen[row] = nrow; 436781824310SBarry Smith } 436881824310SBarry Smith A->same_nonzero = PETSC_FALSE; 436981824310SBarry Smith PetscFunctionReturnVoid(); 437081824310SBarry Smith } 437181824310SBarry Smith EXTERN_C_END 437262298a1eSBarry Smith 4373