1b377110cSBarry Smith 2d5d45c9bSBarry Smith /* 33369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 4d5d45c9bSBarry Smith matrix storage format. 5d5d45c9bSBarry Smith */ 63369ce9aSBarry Smith 77c4f633dSBarry Smith 8c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 9c6db04a5SJed Brown #include <petscblaslapack.h> 10c6db04a5SJed Brown #include <petscbt.h> 1117ab2063SBarry Smith 120716a85fSBarry Smith 130716a85fSBarry Smith #undef __FUNCT__ 140716a85fSBarry Smith #define __FUNCT__ "MatGetColumnNorms_SeqAIJ" 150716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 160716a85fSBarry Smith { 170716a85fSBarry Smith PetscErrorCode ierr; 180716a85fSBarry Smith PetscInt i,m,n; 190716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 200716a85fSBarry Smith 210716a85fSBarry Smith PetscFunctionBegin; 220716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 230716a85fSBarry Smith ierr = PetscMemzero(norms,n*sizeof(PetscReal));CHKERRQ(ierr); 240716a85fSBarry Smith if (type == NORM_2) { 250716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 260716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 270716a85fSBarry Smith } 280716a85fSBarry Smith } else if (type == NORM_1) { 290716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 300716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 310716a85fSBarry Smith } 320716a85fSBarry Smith } else if (type == NORM_INFINITY) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 340716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 370716a85fSBarry Smith 380716a85fSBarry Smith if (type == NORM_2) { 398f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith 
PetscFunctionReturn(0); 420716a85fSBarry Smith } 430716a85fSBarry Smith 444a2ae208SSatish Balay #undef __FUNCT__ 456ce1633cSBarry Smith #define __FUNCT__ "MatFindZeroDiagonals_SeqAIJ" 466ce1633cSBarry Smith PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 476ce1633cSBarry Smith { 486ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 496ce1633cSBarry Smith const MatScalar *aa = a->a; 506ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 516ce1633cSBarry Smith const PetscInt *jj = a->j,*diag; 526ce1633cSBarry Smith PetscInt *rows; 536ce1633cSBarry Smith PetscErrorCode ierr; 546ce1633cSBarry Smith 556ce1633cSBarry Smith PetscFunctionBegin; 566ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 576ce1633cSBarry Smith diag = a->diag; 586ce1633cSBarry Smith for (i=0; i<m; i++) { 596ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 606ce1633cSBarry Smith cnt++; 616ce1633cSBarry Smith } 626ce1633cSBarry Smith } 636ce1633cSBarry Smith ierr = PetscMalloc(cnt*sizeof(PetscInt),&rows);CHKERRQ(ierr); 646ce1633cSBarry Smith cnt = 0; 656ce1633cSBarry Smith for (i=0; i<m; i++) { 666ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 676ce1633cSBarry Smith rows[cnt++] = i; 686ce1633cSBarry Smith } 696ce1633cSBarry Smith } 706ce1633cSBarry Smith ierr = ISCreateGeneral(((PetscObject)A)->comm,cnt,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 716ce1633cSBarry Smith PetscFunctionReturn(0); 726ce1633cSBarry Smith } 736ce1633cSBarry Smith 746ce1633cSBarry Smith #undef __FUNCT__ 75b3a44c85SBarry Smith #define __FUNCT__ "MatFindNonzeroRows_SeqAIJ" 76b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 77b3a44c85SBarry Smith { 78b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 79b3a44c85SBarry Smith const MatScalar *aa; 80b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 81b3a44c85SBarry Smith const PetscInt *ii; 82b3a44c85SBarry Smith PetscInt n,i,j,*rows; 83b3a44c85SBarry Smith 
PetscErrorCode ierr; 84b3a44c85SBarry Smith 85b3a44c85SBarry Smith PetscFunctionBegin; 86b3a44c85SBarry Smith *keptrows = 0; 87b3a44c85SBarry Smith ii = a->i; 88b3a44c85SBarry Smith for (i=0; i<m; i++) { 89b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 90b3a44c85SBarry Smith if (!n) { 91b3a44c85SBarry Smith cnt++; 92b3a44c85SBarry Smith goto ok1; 93b3a44c85SBarry Smith } 94b3a44c85SBarry Smith aa = a->a + ii[i]; 95b3a44c85SBarry Smith for (j=0; j<n; j++) { 96b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 97b3a44c85SBarry Smith } 98b3a44c85SBarry Smith cnt++; 99b3a44c85SBarry Smith ok1:; 100b3a44c85SBarry Smith } 101b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 102b3a44c85SBarry Smith ierr = PetscMalloc((A->rmap->n-cnt)*sizeof(PetscInt),&rows);CHKERRQ(ierr); 103b3a44c85SBarry Smith cnt = 0; 104b3a44c85SBarry Smith for (i=0; i<m; i++) { 105b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 106b3a44c85SBarry Smith if (!n) continue; 107b3a44c85SBarry Smith aa = a->a + ii[i]; 108b3a44c85SBarry Smith for (j=0; j<n; j++) { 109b3a44c85SBarry Smith if (aa[j] != 0.0) { 110b3a44c85SBarry Smith rows[cnt++] = i; 111b3a44c85SBarry Smith break; 112b3a44c85SBarry Smith } 113b3a44c85SBarry Smith } 114b3a44c85SBarry Smith } 115b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 116b3a44c85SBarry Smith PetscFunctionReturn(0); 117b3a44c85SBarry Smith } 118b3a44c85SBarry Smith 119b3a44c85SBarry Smith #undef __FUNCT__ 12079299369SBarry Smith #define __FUNCT__ "MatDiagonalSet_SeqAIJ" 1217087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 12279299369SBarry Smith { 12379299369SBarry Smith PetscErrorCode ierr; 12479299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 125d0f46423SBarry Smith PetscInt i,*diag, m = Y->rmap->n; 12654f21887SBarry Smith MatScalar *aa = aij->a; 12754f21887SBarry Smith PetscScalar *v; 128ace3abfcSBarry Smith PetscBool missing; 12979299369SBarry Smith 13079299369SBarry 
Smith PetscFunctionBegin; 13109f38230SBarry Smith if (Y->assembled) { 13209f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,PETSC_NULL);CHKERRQ(ierr); 13309f38230SBarry Smith if (!missing) { 13479299369SBarry Smith diag = aij->diag; 13579299369SBarry Smith ierr = VecGetArray(D,&v);CHKERRQ(ierr); 13679299369SBarry Smith if (is == INSERT_VALUES) { 13779299369SBarry Smith for (i=0; i<m; i++) { 13879299369SBarry Smith aa[diag[i]] = v[i]; 13979299369SBarry Smith } 14079299369SBarry Smith } else { 14179299369SBarry Smith for (i=0; i<m; i++) { 14279299369SBarry Smith aa[diag[i]] += v[i]; 14379299369SBarry Smith } 14479299369SBarry Smith } 14579299369SBarry Smith ierr = VecRestoreArray(D,&v);CHKERRQ(ierr); 14679299369SBarry Smith PetscFunctionReturn(0); 14779299369SBarry Smith } 148*86c113feSBarry Smith aij->idiagvalid = PETSC_FALSE; 149*86c113feSBarry Smith aij->ibdiagvalid = PETSC_FALSE; 15009f38230SBarry Smith } 15109f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 15209f38230SBarry Smith PetscFunctionReturn(0); 15309f38230SBarry Smith } 15479299369SBarry Smith 15579299369SBarry Smith #undef __FUNCT__ 1564a2ae208SSatish Balay #define __FUNCT__ "MatGetRowIJ_SeqAIJ" 157ace3abfcSBarry Smith PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 15817ab2063SBarry Smith { 159416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 160dfbe8321SBarry Smith PetscErrorCode ierr; 16197f1f81fSBarry Smith PetscInt i,ishift; 16217ab2063SBarry Smith 1633a40ed3dSBarry Smith PetscFunctionBegin; 164d0f46423SBarry Smith *m = A->rmap->n; 1653a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 166bfeeae90SHong Zhang ishift = 0; 16753e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 168d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,ishift,oshift,ia,ja);CHKERRQ(ierr); 169bfeeae90SHong Zhang } else if 
(oshift == 1) { 170d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 1713b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 172d0f46423SBarry Smith ierr = PetscMalloc((A->rmap->n+1)*sizeof(PetscInt),ia);CHKERRQ(ierr); 173d0f46423SBarry Smith for (i=0; i<A->rmap->n+1; i++) (*ia)[i] = a->i[i] + 1; 174ecc77c7aSBarry Smith if (ja) { 17597f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),ja);CHKERRQ(ierr); 1763b2fbd54SBarry Smith for (i=0; i<nz; i++) (*ja)[i] = a->j[i] + 1; 177ecc77c7aSBarry Smith } 1786945ee14SBarry Smith } else { 179ecc77c7aSBarry Smith *ia = a->i; 180ecc77c7aSBarry Smith if (ja) *ja = a->j; 181a2ce50c7SBarry Smith } 1823a40ed3dSBarry Smith PetscFunctionReturn(0); 183a2744918SBarry Smith } 184a2744918SBarry Smith 1854a2ae208SSatish Balay #undef __FUNCT__ 1864a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRowIJ_SeqAIJ" 187ace3abfcSBarry Smith PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 1886945ee14SBarry Smith { 189dfbe8321SBarry Smith PetscErrorCode ierr; 1906945ee14SBarry Smith 1913a40ed3dSBarry Smith PetscFunctionBegin; 1923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 193bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 194606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 195ecc77c7aSBarry Smith if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 196bcd2baecSBarry Smith } 1973a40ed3dSBarry Smith PetscFunctionReturn(0); 19817ab2063SBarry Smith } 19917ab2063SBarry Smith 2004a2ae208SSatish Balay #undef __FUNCT__ 2014a2ae208SSatish Balay #define __FUNCT__ "MatGetColumnIJ_SeqAIJ" 202ace3abfcSBarry Smith PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2033b2fbd54SBarry Smith { 2043b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 
205dfbe8321SBarry Smith PetscErrorCode ierr; 206d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 20797f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2083b2fbd54SBarry Smith 2093a40ed3dSBarry Smith PetscFunctionBegin; 210899cda47SBarry Smith *nn = n; 2113a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2123b2fbd54SBarry Smith if (symmetric) { 213d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,0,oshift,ia,ja);CHKERRQ(ierr); 2143b2fbd54SBarry Smith } else { 21597f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&collengths);CHKERRQ(ierr); 21697f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 21797f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&cia);CHKERRQ(ierr); 21897f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),&cja);CHKERRQ(ierr); 2193b2fbd54SBarry Smith jj = a->j; 2203b2fbd54SBarry Smith for (i=0; i<nz; i++) { 221bfeeae90SHong Zhang collengths[jj[i]]++; 2223b2fbd54SBarry Smith } 2233b2fbd54SBarry Smith cia[0] = oshift; 2243b2fbd54SBarry Smith for (i=0; i<n; i++) { 2253b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2263b2fbd54SBarry Smith } 22797f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 2283b2fbd54SBarry Smith jj = a->j; 229a93ec695SBarry Smith for (row=0; row<m; row++) { 230a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 231a93ec695SBarry Smith for (i=0; i<mr; i++) { 232bfeeae90SHong Zhang col = *jj++; 2333b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2343b2fbd54SBarry Smith } 2353b2fbd54SBarry Smith } 236606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 2373b2fbd54SBarry Smith *ia = cia; *ja = cja; 2383b2fbd54SBarry Smith } 2393a40ed3dSBarry Smith PetscFunctionReturn(0); 2403b2fbd54SBarry Smith } 2413b2fbd54SBarry Smith 2424a2ae208SSatish Balay #undef __FUNCT__ 2434a2ae208SSatish Balay #define __FUNCT__ 
"MatRestoreColumnIJ_SeqAIJ" 244ace3abfcSBarry Smith PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2453b2fbd54SBarry Smith { 246dfbe8321SBarry Smith PetscErrorCode ierr; 247606d414cSSatish Balay 2483a40ed3dSBarry Smith PetscFunctionBegin; 2493a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2503b2fbd54SBarry Smith 251606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 252606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 2533b2fbd54SBarry Smith 2543a40ed3dSBarry Smith PetscFunctionReturn(0); 2553b2fbd54SBarry Smith } 2563b2fbd54SBarry Smith 25787d4246cSBarry Smith #undef __FUNCT__ 25887d4246cSBarry Smith #define __FUNCT__ "MatSetValuesRow_SeqAIJ" 25987d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 26087d4246cSBarry Smith { 26187d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 26287d4246cSBarry Smith PetscInt *ai = a->i; 26387d4246cSBarry Smith PetscErrorCode ierr; 26487d4246cSBarry Smith 26587d4246cSBarry Smith PetscFunctionBegin; 26687d4246cSBarry Smith ierr = PetscMemcpy(a->a+ai[row],v,(ai[row+1]-ai[row])*sizeof(PetscScalar));CHKERRQ(ierr); 26787d4246cSBarry Smith PetscFunctionReturn(0); 26887d4246cSBarry Smith } 26987d4246cSBarry Smith 2704a2ae208SSatish Balay #undef __FUNCT__ 2714a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqAIJ" 27297f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 27317ab2063SBarry Smith { 274416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 275e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 27697f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 2776849ba73SBarry Smith PetscErrorCode ierr; 278e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 
27954f21887SBarry Smith MatScalar *ap,value,*aa = a->a; 280ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 281ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 28217ab2063SBarry Smith 2833a40ed3dSBarry Smith PetscFunctionBegin; 28471fd2e92SBarry Smith if (v) PetscValidScalarPointer(v,6); 28517ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 286416022c9SBarry Smith row = im[k]; 2875ef9f2a5SBarry Smith if (row < 0) continue; 2882515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 289e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 2903b2fbd54SBarry Smith #endif 291bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 29217ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 293416022c9SBarry Smith low = 0; 294c71e6ed7SBarry Smith high = nrow; 29517ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 2965ef9f2a5SBarry Smith if (in[l] < 0) continue; 2972515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 298e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 2993b2fbd54SBarry Smith #endif 300bfeeae90SHong Zhang col = in[l]; 30116371a99SBarry Smith if (v) { 3024b0e389bSBarry Smith if (roworiented) { 3035ef9f2a5SBarry Smith value = v[l + k*n]; 304bef8e0ddSBarry Smith } else { 3054b0e389bSBarry Smith value = v[k + l*m]; 3064b0e389bSBarry Smith } 30716371a99SBarry Smith } else { 30875567043SBarry Smith value = 0.; 30916371a99SBarry Smith } 310abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 31136db0b34SBarry Smith 3127cd84e04SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 313e2ee6c50SBarry Smith lastcol = col; 314416022c9SBarry Smith while (high-low > 5) { 315416022c9SBarry Smith t = (low+high)/2; 316416022c9SBarry Smith if (rp[t] > col) high = t; 
317416022c9SBarry Smith else low = t; 31817ab2063SBarry Smith } 319416022c9SBarry Smith for (i=low; i<high; i++) { 32017ab2063SBarry Smith if (rp[i] > col) break; 32117ab2063SBarry Smith if (rp[i] == col) { 322416022c9SBarry Smith if (is == ADD_VALUES) ap[i] += value; 32317ab2063SBarry Smith else ap[i] = value; 324e44c0bd4SBarry Smith low = i + 1; 32517ab2063SBarry Smith goto noinsert; 32617ab2063SBarry Smith } 32717ab2063SBarry Smith } 328abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 329c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 330e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 331fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 332c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 333416022c9SBarry Smith /* shift up all the later entries in this row */ 334416022c9SBarry Smith for (ii=N; ii>=i; ii--) { 33517ab2063SBarry Smith rp[ii+1] = rp[ii]; 33617ab2063SBarry Smith ap[ii+1] = ap[ii]; 33717ab2063SBarry Smith } 33817ab2063SBarry Smith rp[i] = col; 33917ab2063SBarry Smith ap[i] = value; 340416022c9SBarry Smith low = i + 1; 341e44c0bd4SBarry Smith noinsert:; 34217ab2063SBarry Smith } 34317ab2063SBarry Smith ailen[row] = nrow; 34417ab2063SBarry Smith } 34588e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 3463a40ed3dSBarry Smith PetscFunctionReturn(0); 34717ab2063SBarry Smith } 34817ab2063SBarry Smith 34981824310SBarry Smith 3504a2ae208SSatish Balay #undef __FUNCT__ 3514a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqAIJ" 352a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 3537eb43aa7SLois Curfman McInnes { 3547eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35597f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = 
a->j; 35697f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 35754f21887SBarry Smith MatScalar *ap,*aa = a->a; 3587eb43aa7SLois Curfman McInnes 3593a40ed3dSBarry Smith PetscFunctionBegin; 3607eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 3617eb43aa7SLois Curfman McInnes row = im[k]; 362e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 363e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 364bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 3657eb43aa7SLois Curfman McInnes nrow = ailen[row]; 3667eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 367e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 368e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 369bfeeae90SHong Zhang col = in[l] ; 3707eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 3717eb43aa7SLois Curfman McInnes while (high-low > 5) { 3727eb43aa7SLois Curfman McInnes t = (low+high)/2; 3737eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 3747eb43aa7SLois Curfman McInnes else low = t; 3757eb43aa7SLois Curfman McInnes } 3767eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 3777eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 3787eb43aa7SLois Curfman McInnes if (rp[i] == col) { 379b49de8d1SLois Curfman McInnes *v++ = ap[i]; 3807eb43aa7SLois Curfman McInnes goto finished; 3817eb43aa7SLois Curfman McInnes } 3827eb43aa7SLois Curfman McInnes } 38397e567efSBarry Smith *v++ = 0.0; 3847eb43aa7SLois Curfman McInnes finished:; 3857eb43aa7SLois Curfman McInnes } 3867eb43aa7SLois Curfman McInnes } 3873a40ed3dSBarry Smith PetscFunctionReturn(0); 
3887eb43aa7SLois Curfman McInnes } 3897eb43aa7SLois Curfman McInnes 39017ab2063SBarry Smith 3914a2ae208SSatish Balay #undef __FUNCT__ 3924a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Binary" 393dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer) 39417ab2063SBarry Smith { 395416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3966849ba73SBarry Smith PetscErrorCode ierr; 3976f69ff64SBarry Smith PetscInt i,*col_lens; 3986f69ff64SBarry Smith int fd; 39917ab2063SBarry Smith 4003a40ed3dSBarry Smith PetscFunctionBegin; 401b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 402d0f46423SBarry Smith ierr = PetscMalloc((4+A->rmap->n)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 4030700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 404d0f46423SBarry Smith col_lens[1] = A->rmap->n; 405d0f46423SBarry Smith col_lens[2] = A->cmap->n; 406416022c9SBarry Smith col_lens[3] = a->nz; 407416022c9SBarry Smith 408416022c9SBarry Smith /* store lengths of each row and write (including header) to file */ 409d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 410416022c9SBarry Smith col_lens[4+i] = a->i[i+1] - a->i[i]; 41117ab2063SBarry Smith } 412d0f46423SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+A->rmap->n,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 413606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 414416022c9SBarry Smith 415416022c9SBarry Smith /* store column indices (zero start index) */ 4166f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 417416022c9SBarry Smith 418416022c9SBarry Smith /* store nonzero values */ 4196f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 4203a40ed3dSBarry Smith PetscFunctionReturn(0); 42117ab2063SBarry Smith } 422416022c9SBarry Smith 42309573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 424cd155464SBarry Smith 4254a2ae208SSatish 
Balay #undef __FUNCT__ 4264a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_ASCII" 427dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 428416022c9SBarry Smith { 429416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 430dfbe8321SBarry Smith PetscErrorCode ierr; 431d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,shift=0; 432e060cb09SBarry Smith const char *name; 433f3ef73ceSBarry Smith PetscViewerFormat format; 43417ab2063SBarry Smith 4353a40ed3dSBarry Smith PetscFunctionBegin; 436b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 43771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 43897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 439d0f46423SBarry Smith if ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-!shift)) { 440d00d2cf4SBarry Smith nofinalvalue = 1; 441d00d2cf4SBarry Smith } 442d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 443d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 44477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 44577431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 446b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 44717ab2063SBarry Smith 44817ab2063SBarry Smith for (i=0; i<m; i++) { 449416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 450aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 45177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e + %18.16ei \n",i+1,a->j[j]+!shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 45217ab2063SBarry Smith #else 45377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+!shift,a->a[j]);CHKERRQ(ierr); 45417ab2063SBarry Smith #endif 45517ab2063SBarry Smith } 
45617ab2063SBarry Smith } 457d00d2cf4SBarry Smith if (nofinalvalue) { 458d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 459d00d2cf4SBarry Smith } 460317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 461fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 462d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 46368369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 464cd155464SBarry Smith PetscFunctionReturn(0); 465fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 466d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4677566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 46844cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 46977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 47044cd7ae7SLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 471aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 47236db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 473a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47436db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 475a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47636db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 477a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 4786831982aSBarry Smith } 47944cd7ae7SLois 
Curfman McInnes #else 480a83599f4SBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr);} 48144cd7ae7SLois Curfman McInnes #endif 48244cd7ae7SLois Curfman McInnes } 483b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 48444cd7ae7SLois Curfman McInnes } 485d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 486fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 48797f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 488d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4897566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 49097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&sptr);CHKERRQ(ierr); 491496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 492496be53dSLois Curfman McInnes sptr[i] = nzd+1; 493496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 494496be53dSLois Curfman McInnes if (a->j[j] >= i) { 495aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 49636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 497496be53dSLois Curfman McInnes #else 498496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 499496be53dSLois Curfman McInnes #endif 500496be53dSLois Curfman McInnes } 501496be53dSLois Curfman McInnes } 502496be53dSLois Curfman McInnes } 5032e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 50477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 5052e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 50677431f27SBarry Smith if (i+4<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr);} 50777431f27SBarry Smith else if (i+3<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D 
%D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr);} 50877431f27SBarry Smith else if (i+2<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr);} 50977431f27SBarry Smith else if (i+1<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr);} 51077431f27SBarry Smith else if (i<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr);} 51177431f27SBarry Smith else {ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr);} 512496be53dSLois Curfman McInnes } 513b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 514606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 515496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 516496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 51777431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 518496be53dSLois Curfman McInnes } 519b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 520496be53dSLois Curfman McInnes } 521b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 522496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 523496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 524496be53dSLois Curfman McInnes if (a->j[j] >= i) { 525aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 52636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 527b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5286831982aSBarry Smith } 529496be53dSLois Curfman McInnes #else 530b0a32e0cSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",a->a[j]);CHKERRQ(ierr);} 531496be53dSLois Curfman McInnes #endif 532496be53dSLois Curfman McInnes } 
533496be53dSLois Curfman McInnes } 534b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 535496be53dSLois Curfman McInnes } 536d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 537fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 53897f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 53987828ca2SBarry Smith PetscScalar value; 54002594712SBarry Smith 541d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5427566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 54302594712SBarry Smith for (i=0; i<m; i++) { 54402594712SBarry Smith jcnt = 0; 545d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 546e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 54702594712SBarry Smith value = a->a[cnt++]; 548e24b481bSBarry Smith jcnt++; 54902594712SBarry Smith } else { 55002594712SBarry Smith value = 0.0; 55102594712SBarry Smith } 552aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 553b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",PetscRealPart(value),PetscImaginaryPart(value));CHKERRQ(ierr); 55402594712SBarry Smith #else 555b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",value);CHKERRQ(ierr); 55602594712SBarry Smith #endif 55702594712SBarry Smith } 558b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 55902594712SBarry Smith } 560d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5613c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 562d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5637566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 5643c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5653c215bfdSMatthew Knepley ierr = 
PetscViewerASCIIPrintf(viewer,"%%matrix complex general\n");CHKERRQ(ierr); 5663c215bfdSMatthew Knepley #else 5673c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%%matrix real general\n");CHKERRQ(ierr); 5683c215bfdSMatthew Knepley #endif 569d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 5703c215bfdSMatthew Knepley for (i=0; i<m; i++) { 5713c215bfdSMatthew Knepley for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 5723c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5733c215bfdSMatthew Knepley if (PetscImaginaryPart(a->a[j]) > 0.0) { 5743c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5753c215bfdSMatthew Knepley } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 5763c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G -%G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5773c215bfdSMatthew Knepley } else { 5783c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 5793c215bfdSMatthew Knepley } 5803c215bfdSMatthew Knepley #else 5813c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %G\n", i+shift, a->j[j]+shift, a->a[j]);CHKERRQ(ierr); 5823c215bfdSMatthew Knepley #endif 5833c215bfdSMatthew Knepley } 5843c215bfdSMatthew Knepley } 585d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5863a40ed3dSBarry Smith } else { 587d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5887566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 589d5f3da31SBarry Smith if (A->factortype){ 59016cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 59116cd7e1dSShri Abhyankar ierr = 
PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 59216cd7e1dSShri Abhyankar /* L part */ 59316cd7e1dSShri Abhyankar for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 59416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 59516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 59616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 59816cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59916cd7e1dSShri Abhyankar } else { 60016cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 60116cd7e1dSShri Abhyankar } 60216cd7e1dSShri Abhyankar #else 60316cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 60416cd7e1dSShri Abhyankar #endif 60516cd7e1dSShri Abhyankar } 60616cd7e1dSShri Abhyankar /* diagonal */ 60716cd7e1dSShri Abhyankar j = a->diag[i]; 60816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 60916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 6102c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 61116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 6122c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),-PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 61316cd7e1dSShri Abhyankar } else { 6142c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 61516cd7e1dSShri Abhyankar } 61616cd7e1dSShri Abhyankar #else 6172c990fa1SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,1.0/a->a[j]);CHKERRQ(ierr); 61816cd7e1dSShri Abhyankar #endif 61916cd7e1dSShri Abhyankar 62016cd7e1dSShri Abhyankar /* U part */ 62116cd7e1dSShri Abhyankar for (j=a->diag[i+1]+1+shift; j<a->diag[i]+shift; j++) { 62216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 62316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 62416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 62616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62716cd7e1dSShri Abhyankar } else { 62816cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 62916cd7e1dSShri Abhyankar } 63016cd7e1dSShri Abhyankar #else 63116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 63216cd7e1dSShri Abhyankar #endif 63316cd7e1dSShri Abhyankar } 63416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 63516cd7e1dSShri Abhyankar } 63616cd7e1dSShri Abhyankar } else { 63717ab2063SBarry Smith for (i=0; i<m; i++) { 63877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 639416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 640aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 64136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 642a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 64336db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 644a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G 
i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 6453a40ed3dSBarry Smith } else { 646a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 64717ab2063SBarry Smith } 64817ab2063SBarry Smith #else 649a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 65017ab2063SBarry Smith #endif 65117ab2063SBarry Smith } 652b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 65317ab2063SBarry Smith } 65416cd7e1dSShri Abhyankar } 655d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 65617ab2063SBarry Smith } 657b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 6583a40ed3dSBarry Smith PetscFunctionReturn(0); 659416022c9SBarry Smith } 660416022c9SBarry Smith 6614a2ae208SSatish Balay #undef __FUNCT__ 6624a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw_Zoom" 663dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 664416022c9SBarry Smith { 665480ef9eaSBarry Smith Mat A = (Mat) Aa; 666416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 667dfbe8321SBarry Smith PetscErrorCode ierr; 668d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,color; 66936db0b34SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,maxv = 0.0; 670b0a32e0cSBarry Smith PetscViewer viewer; 671f3ef73ceSBarry Smith PetscViewerFormat format; 672cddf8d76SBarry Smith 6733a40ed3dSBarry Smith PetscFunctionBegin; 674480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 675b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 67619bcc07fSBarry Smith 677b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 678416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 6790513a670SBarry Smith 680fb9695e5SSatish Balay if 
(format != PETSC_VIEWER_DRAW_CONTOUR) { 6810513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 682b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 683416022c9SBarry Smith for (i=0; i<m; i++) { 684cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 685bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 686bfeeae90SHong Zhang x_l = a->j[j] ; x_r = x_l + 1.0; 687aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 68836db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 689cddf8d76SBarry Smith #else 690cddf8d76SBarry Smith if (a->a[j] >= 0.) continue; 691cddf8d76SBarry Smith #endif 692b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 693cddf8d76SBarry Smith } 694cddf8d76SBarry Smith } 695b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 696cddf8d76SBarry Smith for (i=0; i<m; i++) { 697cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 698bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 699bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 700cddf8d76SBarry Smith if (a->a[j] != 0.) continue; 701b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 702cddf8d76SBarry Smith } 703cddf8d76SBarry Smith } 704b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 705cddf8d76SBarry Smith for (i=0; i<m; i++) { 706cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 707bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 708bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 709aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 71036db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 711cddf8d76SBarry Smith #else 712cddf8d76SBarry Smith if (a->a[j] <= 0.) 
continue; 713cddf8d76SBarry Smith #endif 714b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 715416022c9SBarry Smith } 716416022c9SBarry Smith } 7170513a670SBarry Smith } else { 7180513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 7190513a670SBarry Smith /* first determine max of all nonzero values */ 72097f1f81fSBarry Smith PetscInt nz = a->nz,count; 721b0a32e0cSBarry Smith PetscDraw popup; 72236db0b34SBarry Smith PetscReal scale; 7230513a670SBarry Smith 7240513a670SBarry Smith for (i=0; i<nz; i++) { 7250513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 7260513a670SBarry Smith } 727b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 728b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 729b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 7300513a670SBarry Smith count = 0; 7310513a670SBarry Smith for (i=0; i<m; i++) { 7320513a670SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 733bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 734bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 73597f1f81fSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (PetscInt)(scale*PetscAbsScalar(a->a[count])); 736b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 7370513a670SBarry Smith count++; 7380513a670SBarry Smith } 7390513a670SBarry Smith } 7400513a670SBarry Smith } 741480ef9eaSBarry Smith PetscFunctionReturn(0); 742480ef9eaSBarry Smith } 743cddf8d76SBarry Smith 7444a2ae208SSatish Balay #undef __FUNCT__ 7454a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw" 746dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 747480ef9eaSBarry Smith { 748dfbe8321SBarry Smith PetscErrorCode ierr; 749b0a32e0cSBarry Smith PetscDraw draw; 75036db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 
751ace3abfcSBarry Smith PetscBool isnull; 752480ef9eaSBarry Smith 753480ef9eaSBarry Smith PetscFunctionBegin; 754b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 755b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 756480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 757480ef9eaSBarry Smith 758480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 759d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 760480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 761b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 762b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 763480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 7643a40ed3dSBarry Smith PetscFunctionReturn(0); 765416022c9SBarry Smith } 766416022c9SBarry Smith 7674a2ae208SSatish Balay #undef __FUNCT__ 7684a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ" 769dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 770416022c9SBarry Smith { 771dfbe8321SBarry Smith PetscErrorCode ierr; 772ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 773416022c9SBarry Smith 7743a40ed3dSBarry Smith PetscFunctionBegin; 7752692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 7762692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 7772692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 778c45a1595SBarry Smith if (iascii) { 7793a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 7800f5bd95cSBarry Smith } else if (isbinary) { 7813a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 7820f5bd95cSBarry Smith } else if (isdraw) { 
7833a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 7845cd90555SBarry Smith } else { 785e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Viewer type %s not supported by SeqAIJ matrices",((PetscObject)viewer)->type_name); 78617ab2063SBarry Smith } 7874108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 7883a40ed3dSBarry Smith PetscFunctionReturn(0); 78917ab2063SBarry Smith } 79019bcc07fSBarry Smith 7914a2ae208SSatish Balay #undef __FUNCT__ 7924a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyEnd_SeqAIJ" 793dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 79417ab2063SBarry Smith { 795416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7966849ba73SBarry Smith PetscErrorCode ierr; 79797f1f81fSBarry Smith PetscInt fshift = 0,i,j,*ai = a->i,*aj = a->j,*imax = a->imax; 798d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 79954f21887SBarry Smith MatScalar *aa = a->a,*ap; 8003447b6efSHong Zhang PetscReal ratio=0.6; 80117ab2063SBarry Smith 8023a40ed3dSBarry Smith PetscFunctionBegin; 8033a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 80417ab2063SBarry Smith 80543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 80617ab2063SBarry Smith for (i=1; i<m; i++) { 807416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 80817ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 80994a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 81017ab2063SBarry Smith if (fshift) { 811bfeeae90SHong Zhang ip = aj + ai[i] ; 812bfeeae90SHong Zhang ap = aa + ai[i] ; 81317ab2063SBarry Smith N = ailen[i]; 81417ab2063SBarry Smith for (j=0; j<N; j++) { 81517ab2063SBarry Smith ip[j-fshift] = ip[j]; 81617ab2063SBarry Smith ap[j-fshift] = ap[j]; 81717ab2063SBarry Smith } 81817ab2063SBarry Smith } 81917ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 82017ab2063SBarry Smith } 
82117ab2063SBarry Smith if (m) { 82217ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 82317ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 82417ab2063SBarry Smith } 82517ab2063SBarry Smith /* reset ilen and imax for each row */ 82617ab2063SBarry Smith for (i=0; i<m; i++) { 82717ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 82817ab2063SBarry Smith } 829bfeeae90SHong Zhang a->nz = ai[m]; 83065e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 83117ab2063SBarry Smith 83209f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 833d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 834ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 835ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 8368e58a170SBarry Smith A->info.mallocs += a->reallocs; 837dd5f02e7SSatish Balay a->reallocs = 0; 8384e220ebcSLois Curfman McInnes A->info.nz_unneeded = (double)fshift; 83936db0b34SBarry Smith a->rmax = rmax; 8404e220ebcSLois Curfman McInnes 841cd6b891eSBarry Smith ierr = MatCheckCompressedRow(A,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 84288e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 84371c2f376SKris Buschelman 8444108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 84571f1c65dSBarry Smith 84671f1c65dSBarry Smith a->idiagvalid = PETSC_FALSE; 847bbead8a2SBarry Smith a->ibdiagvalid = PETSC_FALSE; 8483a40ed3dSBarry Smith PetscFunctionReturn(0); 84917ab2063SBarry Smith } 85017ab2063SBarry Smith 8514a2ae208SSatish Balay #undef __FUNCT__ 85299cafbc1SBarry Smith #define __FUNCT__ "MatRealPart_SeqAIJ" 85399cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 85499cafbc1SBarry Smith { 
85599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 85699cafbc1SBarry Smith PetscInt i,nz = a->nz; 85754f21887SBarry Smith MatScalar *aa = a->a; 85899cafbc1SBarry Smith 85999cafbc1SBarry Smith PetscFunctionBegin; 86099cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 861*86c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 862*86c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 86399cafbc1SBarry Smith PetscFunctionReturn(0); 86499cafbc1SBarry Smith } 86599cafbc1SBarry Smith 86699cafbc1SBarry Smith #undef __FUNCT__ 86799cafbc1SBarry Smith #define __FUNCT__ "MatImaginaryPart_SeqAIJ" 86899cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 86999cafbc1SBarry Smith { 87099cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 87199cafbc1SBarry Smith PetscInt i,nz = a->nz; 87254f21887SBarry Smith MatScalar *aa = a->a; 87399cafbc1SBarry Smith 87499cafbc1SBarry Smith PetscFunctionBegin; 87599cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 876*86c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 877*86c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 87899cafbc1SBarry Smith PetscFunctionReturn(0); 87999cafbc1SBarry Smith } 88099cafbc1SBarry Smith 88199cafbc1SBarry Smith #undef __FUNCT__ 8824a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqAIJ" 883dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 88417ab2063SBarry Smith { 885416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 886dfbe8321SBarry Smith PetscErrorCode ierr; 8873a40ed3dSBarry Smith 8883a40ed3dSBarry Smith PetscFunctionBegin; 889d0f46423SBarry Smith ierr = PetscMemzero(a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 890*86c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 891*86c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 8923a40ed3dSBarry Smith PetscFunctionReturn(0); 89317ab2063SBarry Smith } 894416022c9SBarry Smith 8954a2ae208SSatish Balay #undef __FUNCT__ 8964a2ae208SSatish Balay #define __FUNCT__ 
"MatDestroy_SeqAIJ" 897dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 89817ab2063SBarry Smith { 899416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 900dfbe8321SBarry Smith PetscErrorCode ierr; 901d5d45c9bSBarry Smith 9023a40ed3dSBarry Smith PetscFunctionBegin; 903aa482453SBarry Smith #if defined(PETSC_USE_LOG) 904d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 90517ab2063SBarry Smith #endif 906e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 9076bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 9086bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 90905b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 910d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 91105b42c5fSBarry Smith ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr); 91271f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 91305b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 9146bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 91505b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 9166bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 91705b42c5fSBarry Smith ierr = PetscFree(a->xtoy);CHKERRQ(ierr); 9186bf464f9SBarry Smith ierr = MatDestroy(&a->XtoY);CHKERRQ(ierr); 919cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 920a30b2313SHong Zhang 9214108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 922bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 923901853e0SKris Buschelman 924dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 925901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetColumnIndices_C","",PETSC_NULL);CHKERRQ(ierr); 926901853e0SKris Buschelman ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)A,"MatStoreValues_C","",PETSC_NULL);CHKERRQ(ierr); 927901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatRetrieveValues_C","",PETSC_NULL);CHKERRQ(ierr); 928901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqsbaij_C","",PETSC_NULL);CHKERRQ(ierr); 929901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqbaij_C","",PETSC_NULL);CHKERRQ(ierr); 9305a11e1b2SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqaijperm_C","",PETSC_NULL);CHKERRQ(ierr); 931901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatIsTranspose_C","",PETSC_NULL);CHKERRQ(ierr); 932901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 933a1661176SMatthew Knepley ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C","",PETSC_NULL);CHKERRQ(ierr); 934901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatReorderForNonzeroDiagonal_C","",PETSC_NULL);CHKERRQ(ierr); 9353a40ed3dSBarry Smith PetscFunctionReturn(0); 93617ab2063SBarry Smith } 93717ab2063SBarry Smith 9384a2ae208SSatish Balay #undef __FUNCT__ 9394a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqAIJ" 940ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 94117ab2063SBarry Smith { 942416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 9434846f1f5SKris Buschelman PetscErrorCode ierr; 9443a40ed3dSBarry Smith 9453a40ed3dSBarry Smith PetscFunctionBegin; 946a65d3064SKris Buschelman switch (op) { 947a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 9484e0d8c25SBarry Smith a->roworiented = flg; 949a65d3064SKris Buschelman break; 950a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 951a9817697SBarry Smith 
a->keepnonzeropattern = flg; 952a65d3064SKris Buschelman break; 953512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 954512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 955a65d3064SKris Buschelman break; 956a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 9574e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 958a65d3064SKris Buschelman break; 959a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 9604e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 961a65d3064SKris Buschelman break; 96228b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 96328b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 96428b2fa4aSMatthew Knepley break; 965a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 9664e0d8c25SBarry Smith a->ignorezeroentries = flg; 9670df259c2SBarry Smith break; 968cd6b891eSBarry Smith case MAT_CHECK_COMPRESSED_ROW: 969cd6b891eSBarry Smith a->compressedrow.check = flg; 970d487561eSHong Zhang break; 9713d472b54SHong Zhang case MAT_SPD: 9723d472b54SHong Zhang A->spd_set = PETSC_TRUE; 9733d472b54SHong Zhang A->spd = flg; 9743d472b54SHong Zhang if (flg) { 9753d472b54SHong Zhang A->symmetric = PETSC_TRUE; 9763d472b54SHong Zhang A->structurally_symmetric = PETSC_TRUE; 9773d472b54SHong Zhang A->symmetric_set = PETSC_TRUE; 9783d472b54SHong Zhang A->structurally_symmetric_set = PETSC_TRUE; 9793d472b54SHong Zhang } 9803d472b54SHong Zhang break; 981b1646e73SJed Brown case MAT_SYMMETRIC: 982b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 983b1646e73SJed Brown case MAT_HERMITIAN: 984b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 9854e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 986a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 987a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 988290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 989a65d3064SKris Buschelman break; 990b87ac2d8SJed Brown case MAT_USE_INODES: 991b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this 
one */ 992b87ac2d8SJed Brown break; 993a65d3064SKris Buschelman default: 994e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 995a65d3064SKris Buschelman } 9964108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 9973a40ed3dSBarry Smith PetscFunctionReturn(0); 99817ab2063SBarry Smith } 99917ab2063SBarry Smith 10004a2ae208SSatish Balay #undef __FUNCT__ 10014a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqAIJ" 1002dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 100317ab2063SBarry Smith { 1004416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10056849ba73SBarry Smith PetscErrorCode ierr; 1006d3e70bfaSHong Zhang PetscInt i,j,n,*ai=a->i,*aj=a->j,nz; 100735e7444dSHong Zhang PetscScalar *aa=a->a,*x,zero=0.0; 100817ab2063SBarry Smith 10093a40ed3dSBarry Smith PetscFunctionBegin; 1010d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1011e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 101235e7444dSHong Zhang 1013d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU){ 1014d3e70bfaSHong Zhang PetscInt *diag=a->diag; 101535e7444dSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 10162c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 101735e7444dSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 101835e7444dSHong Zhang PetscFunctionReturn(0); 101935e7444dSHong Zhang } 102035e7444dSHong Zhang 10212dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 10221ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 102335e7444dSHong Zhang for (i=0; i<n; i++) { 102435e7444dSHong Zhang nz = ai[i+1] - ai[i]; 10252f5a7c2eSBarry Smith if (!nz) x[i] = 0.0; 102635e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++){ 102735e7444dSHong Zhang if (aj[j] == i) { 102835e7444dSHong Zhang x[i] = aa[j]; 102917ab2063SBarry Smith break; 103017ab2063SBarry 
Smith } 103117ab2063SBarry Smith } 103217ab2063SBarry Smith } 10331ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 10343a40ed3dSBarry Smith PetscFunctionReturn(0); 103517ab2063SBarry Smith } 103617ab2063SBarry Smith 1037c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 10384a2ae208SSatish Balay #undef __FUNCT__ 10394a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqAIJ" 1040dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 104117ab2063SBarry Smith { 1042416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10435c897100SBarry Smith PetscScalar *x,*y; 1044dfbe8321SBarry Smith PetscErrorCode ierr; 1045d0f46423SBarry Smith PetscInt m = A->rmap->n; 10465c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1047a77337e4SBarry Smith MatScalar *v; 1048a77337e4SBarry Smith PetscScalar alpha; 104904fbf559SBarry Smith PetscInt n,i,j,*idx,*ii,*ridx=PETSC_NULL; 10503447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1051ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 10525c897100SBarry Smith #endif 105317ab2063SBarry Smith 10543a40ed3dSBarry Smith PetscFunctionBegin; 10552e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 10561ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 10571ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 10585c897100SBarry Smith 10595c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1060bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 10615c897100SBarry Smith #else 10623447b6efSHong Zhang if (usecprow){ 10633447b6efSHong Zhang m = cprow.nrows; 10643447b6efSHong Zhang ii = cprow.i; 10657b2bb3b9SHong Zhang ridx = cprow.rindex; 10663447b6efSHong Zhang } else { 10673447b6efSHong Zhang ii = a->i; 10683447b6efSHong Zhang } 106917ab2063SBarry Smith for (i=0; i<m; i++) { 10703447b6efSHong Zhang idx = a->j + ii[i] ; 10713447b6efSHong 
Zhang v = a->a + ii[i] ; 10723447b6efSHong Zhang n = ii[i+1] - ii[i]; 10733447b6efSHong Zhang if (usecprow){ 10747b2bb3b9SHong Zhang alpha = x[ridx[i]]; 10753447b6efSHong Zhang } else { 107617ab2063SBarry Smith alpha = x[i]; 10773447b6efSHong Zhang } 107804fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 107917ab2063SBarry Smith } 10805c897100SBarry Smith #endif 1081dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 10821ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 10831ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 10843a40ed3dSBarry Smith PetscFunctionReturn(0); 108517ab2063SBarry Smith } 108617ab2063SBarry Smith 10874a2ae208SSatish Balay #undef __FUNCT__ 10885c897100SBarry Smith #define __FUNCT__ "MatMultTranspose_SeqAIJ" 1089dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 10905c897100SBarry Smith { 1091dfbe8321SBarry Smith PetscErrorCode ierr; 10925c897100SBarry Smith 10935c897100SBarry Smith PetscFunctionBegin; 1094170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 10955c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 10965c897100SBarry Smith PetscFunctionReturn(0); 10975c897100SBarry Smith } 10985c897100SBarry Smith 1099c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 11005c897100SBarry Smith #undef __FUNCT__ 11014a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqAIJ" 1102dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 110317ab2063SBarry Smith { 1104416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1105d9fead3dSBarry Smith PetscScalar *y; 110654f21887SBarry Smith const PetscScalar *x; 110754f21887SBarry Smith const MatScalar *aa; 1108dfbe8321SBarry Smith PetscErrorCode ierr; 1109003131ecSBarry Smith PetscInt m=A->rmap->n; 1110003131ecSBarry Smith const PetscInt *aj,*ii,*ridx=PETSC_NULL; 11118aee2decSHong Zhang PetscInt n,i,nonzerorow=0; 1112362ced78SSatish Balay 
PetscScalar sum; 1113ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 111417ab2063SBarry Smith 1115b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 111697952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1117fee21e36SBarry Smith #endif 1118fee21e36SBarry Smith 11193a40ed3dSBarry Smith PetscFunctionBegin; 11203649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 11211ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 112297952fefSHong Zhang aj = a->j; 112397952fefSHong Zhang aa = a->a; 1124416022c9SBarry Smith ii = a->i; 11254eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 112697952fefSHong Zhang m = a->compressedrow.nrows; 112797952fefSHong Zhang ii = a->compressedrow.i; 112897952fefSHong Zhang ridx = a->compressedrow.rindex; 112997952fefSHong Zhang for (i=0; i<m; i++){ 113097952fefSHong Zhang n = ii[i+1] - ii[i]; 113197952fefSHong Zhang aj = a->j + ii[i]; 113297952fefSHong Zhang aa = a->a + ii[i]; 113397952fefSHong Zhang sum = 0.0; 1134a46b3154SVictor Eijkhout nonzerorow += (n>0); 1135003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1136003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 113797952fefSHong Zhang y[*ridx++] = sum; 113897952fefSHong Zhang } 113997952fefSHong Zhang } else { /* do not use compressed row format */ 1140b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 1141b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1142b05257ddSBarry Smith #else 114317ab2063SBarry Smith for (i=0; i<m; i++) { 1144003131ecSBarry Smith n = ii[i+1] - ii[i]; 1145003131ecSBarry Smith aj = a->j + ii[i]; 1146003131ecSBarry Smith aa = a->a + ii[i]; 114717ab2063SBarry Smith sum = 0.0; 1148a46b3154SVictor Eijkhout nonzerorow += (n>0); 1149003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 115017ab2063SBarry Smith y[i] = sum; 115117ab2063SBarry Smith } 11528d195f9aSBarry Smith #endif 1153b05257ddSBarry Smith } 1154dc0b31edSSatish Balay ierr = 
PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 11553649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 11561ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 11573a40ed3dSBarry Smith PetscFunctionReturn(0); 115817ab2063SBarry Smith } 115917ab2063SBarry Smith 116063db405bSBarry Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 116163db405bSBarry Smith 11620c74a584SJed Brown /* ******************* */ 1163700485ddSSatish Balay #if defined(PETSC_HAVE_PTHREADCLASSES) 1164cfcfc605SKerry Stevens extern PetscBool PetscUseThreadPool; 1165cfcfc605SKerry Stevens void* DoCoreAffinity(void); 1166cfcfc605SKerry Stevens 11670ca81413SKerry Stevens typedef struct { 11680ca81413SKerry Stevens const MatScalar* matdata; 11690ca81413SKerry Stevens const PetscScalar* vecdata; 11700ca81413SKerry Stevens PetscScalar* vecout; 11710ca81413SKerry Stevens const PetscInt* colindnz; 11720ca81413SKerry Stevens const PetscInt* rownumnz; 11730ca81413SKerry Stevens PetscInt numrows; 11740ca81413SKerry Stevens const PetscInt* specidx; 11750ca81413SKerry Stevens PetscInt nzr; 11760ca81413SKerry Stevens } MatMult_KernelData; 11770ca81413SKerry Stevens 11780ca81413SKerry Stevens void* MatMult_Kernel(void *arg) 11790ca81413SKerry Stevens { 1180cfcfc605SKerry Stevens if(PetscUseThreadPool==PETSC_FALSE) { 1181cfcfc605SKerry Stevens DoCoreAffinity(); 1182cfcfc605SKerry Stevens } 11830ca81413SKerry Stevens MatMult_KernelData *data = (MatMult_KernelData*)arg; 11840ca81413SKerry Stevens PetscScalar sum; 11850ca81413SKerry Stevens const MatScalar *aabase = data->matdata,*aa; 11860ca81413SKerry Stevens const PetscScalar *x = data->vecdata; 11870ca81413SKerry Stevens PetscScalar *y = data->vecout; 11880ca81413SKerry Stevens const PetscInt *ajbase = data->colindnz,*aj; 11890ca81413SKerry Stevens const PetscInt *ii = data->rownumnz; 11900ca81413SKerry Stevens PetscInt m = data->numrows; 11910ca81413SKerry Stevens const PetscInt *ridx = data->specidx; 11920ca81413SKerry Stevens 
PetscInt i,n,nonzerorow = 0; 11930ca81413SKerry Stevens 11940ca81413SKerry Stevens if(ridx!=NULL) { 11950ca81413SKerry Stevens for (i=0; i<m; i++){ 11960ca81413SKerry Stevens n = ii[i+1] - ii[i]; 11970ca81413SKerry Stevens aj = ajbase + ii[i]; 11980ca81413SKerry Stevens aa = aabase + ii[i]; 11990ca81413SKerry Stevens sum = 0.0; 1200cfcfc605SKerry Stevens if(n>0) { 120151d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 120251d315f7SKerry Stevens nonzerorow++; 1203cfcfc605SKerry Stevens } 12040ca81413SKerry Stevens y[*ridx++] = sum; 12050ca81413SKerry Stevens } 12060ca81413SKerry Stevens } 12070ca81413SKerry Stevens else { 120851d315f7SKerry Stevens PetscInt ibase = data->nzr; 12090ca81413SKerry Stevens for (i=0; i<m; i++) { 12100ca81413SKerry Stevens n = ii[i+1] - ii[i]; 12110ca81413SKerry Stevens aj = ajbase + ii[i]; 12120ca81413SKerry Stevens aa = aabase + ii[i]; 12130ca81413SKerry Stevens sum = 0.0; 1214cfcfc605SKerry Stevens if(n>0) { 121551d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 121651d315f7SKerry Stevens nonzerorow++; 1217cfcfc605SKerry Stevens } 121851d315f7SKerry Stevens y[i+ibase] = sum; 12190ca81413SKerry Stevens } 12200ca81413SKerry Stevens } 12210ca81413SKerry Stevens data->nzr = nonzerorow; 12220ca81413SKerry Stevens return NULL; 12230ca81413SKerry Stevens } 1224700485ddSSatish Balay #endif 12250ca81413SKerry Stevens 12260ca81413SKerry Stevens extern PetscMPIInt PetscMaxThreads; 12274b83fb64SBarry Smith extern PetscErrorCode (*MainJob)(void* (*pFunc)(void*),void**,PetscInt); 122851d315f7SKerry Stevens 12290ca81413SKerry Stevens #undef __FUNCT__ 12307d6a0e61SBarry Smith #define __FUNCT__ "MatMult_SeqAIJPThread" 12317d6a0e61SBarry Smith PetscErrorCode MatMult_SeqAIJPThread(Mat A,Vec xx,Vec yy) 12320ca81413SKerry Stevens { 12330ca81413SKerry Stevens Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12340ca81413SKerry Stevens PetscScalar *y; 12350ca81413SKerry Stevens const PetscScalar *x; 12360ca81413SKerry Stevens PetscErrorCode ierr; 
12370ca81413SKerry Stevens PetscInt m=A->rmap->n,nonzerorow=0; 12380ca81413SKerry Stevens PetscBool usecprow=a->compressedrow.use; 12390ca81413SKerry Stevens 12400ca81413SKerry Stevens #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 12410ca81413SKerry Stevens #pragma disjoint(*x,*y,*aa) 12420ca81413SKerry Stevens #endif 12430ca81413SKerry Stevens 12440ca81413SKerry Stevens PetscFunctionBegin; 12450ca81413SKerry Stevens ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 12460ca81413SKerry Stevens ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 12470ca81413SKerry Stevens 12480ca81413SKerry Stevens if(usecprow) { 12490ca81413SKerry Stevens PetscInt NumPerThread,iindex; 12500ca81413SKerry Stevens const MatScalar *aa = a->a; 12510ca81413SKerry Stevens const PetscInt *aj = a->j,*ii = a->compressedrow.i,*ridx=a->compressedrow.rindex; 12520ca81413SKerry Stevens PetscInt i,iStartVal,iEndVal,iStartIndex,iEndIndex; 12530c74a584SJed Brown const PetscInt iNumThreads = PetscMaxThreads; /* this number could be different */ 1254cfcfc605SKerry Stevens MatMult_KernelData* kerneldatap = (MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 1255cfcfc605SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 12560ca81413SKerry Stevens 12570ca81413SKerry Stevens m = a->compressedrow.nrows; 12580ca81413SKerry Stevens NumPerThread = ii[m]/iNumThreads; 12590ca81413SKerry Stevens iindex = 0; 12600ca81413SKerry Stevens for(i=0; i<iNumThreads;i++) { 12610ca81413SKerry Stevens iStartIndex = iindex; 12620ca81413SKerry Stevens iStartVal = ii[iStartIndex]; 12630ca81413SKerry Stevens iEndVal = iStartVal; 12640c74a584SJed Brown /* determine number of rows to process */ 12650ca81413SKerry Stevens while(iEndVal-iStartVal<NumPerThread) { 12660ca81413SKerry Stevens iindex++; 12670ca81413SKerry Stevens iEndVal = ii[iindex]; 12680ca81413SKerry Stevens } 12690c74a584SJed Brown /* determine whether to go back 1 */ 12700ca81413SKerry Stevens 
if(iEndVal-iStartVal-NumPerThread>NumPerThread-(ii[iindex-1]-iStartVal)) { 12710ca81413SKerry Stevens iindex--; 12720ca81413SKerry Stevens iEndVal = ii[iindex]; 12730ca81413SKerry Stevens } 12740ca81413SKerry Stevens iEndIndex = iindex; 1275cfcfc605SKerry Stevens kerneldatap[i].matdata = aa; 12760ca81413SKerry Stevens kerneldatap[i].vecdata = x; 12770ca81413SKerry Stevens kerneldatap[i].vecout = y; 12780ca81413SKerry Stevens kerneldatap[i].colindnz = aj; 12790ca81413SKerry Stevens kerneldatap[i].rownumnz = ii + iStartIndex; 12800ca81413SKerry Stevens kerneldatap[i].numrows = iEndIndex - iStartIndex + 1; 12810ca81413SKerry Stevens kerneldatap[i].specidx = ridx + iStartVal; 12820ca81413SKerry Stevens kerneldatap[i].nzr = 0; 1283cfcfc605SKerry Stevens pdata[i] = &kerneldatap[i]; 12840ca81413SKerry Stevens iindex++; 12850ca81413SKerry Stevens } 1286cfcfc605SKerry Stevens ierr = MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 1287cfcfc605SKerry Stevens /* collect results */ 128851d315f7SKerry Stevens for(i=0; i<iNumThreads; i++) { 1289cfcfc605SKerry Stevens nonzerorow += kerneldatap[i].nzr; 129051d315f7SKerry Stevens } 1291cfcfc605SKerry Stevens free(kerneldatap); 1292cfcfc605SKerry Stevens free(pdata); 129351d315f7SKerry Stevens } 129451d315f7SKerry Stevens else { 129551d315f7SKerry Stevens #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 129651d315f7SKerry Stevens fortranmultaij_(&m,x,a->i,a->j,a->a,y); 129751d315f7SKerry Stevens #else 129851d315f7SKerry Stevens PetscInt i,iindex; 129951d315f7SKerry Stevens const MatScalar *aa = a->a; 130051d315f7SKerry Stevens const PetscInt *aj = a->j,*ii = a->i; 13010c74a584SJed Brown const PetscInt iNumThreads = PetscMaxThreads; /* this number could be different */ 130251d315f7SKerry Stevens PetscInt Q = m/iNumThreads; 130351d315f7SKerry Stevens PetscInt R = m-Q*iNumThreads; 130451d315f7SKerry Stevens PetscBool S; 130551d315f7SKerry Stevens 130651d315f7SKerry Stevens MatMult_KernelData* kerneldatap = 
(MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 130751d315f7SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 130851d315f7SKerry Stevens 130951d315f7SKerry Stevens iindex = 0; 131051d315f7SKerry Stevens for(i=0; i<iNumThreads;i++) { 1311b50af74fSBarry Smith S = (PetscBool)(i<R); 131251d315f7SKerry Stevens kerneldatap[i].matdata = aa; 131351d315f7SKerry Stevens kerneldatap[i].vecdata = x; 131451d315f7SKerry Stevens kerneldatap[i].vecout = y; 131551d315f7SKerry Stevens kerneldatap[i].colindnz = aj; 131651d315f7SKerry Stevens kerneldatap[i].rownumnz = ii + iindex; 131751d315f7SKerry Stevens kerneldatap[i].numrows = S?Q+1:Q; 131851d315f7SKerry Stevens kerneldatap[i].specidx = PETSC_NULL; 13190c74a584SJed Brown kerneldatap[i].nzr = iindex; /* serves as the 'base' row (needed to access correctly into output vector y) */ 132051d315f7SKerry Stevens pdata[i] = &kerneldatap[i]; 132151d315f7SKerry Stevens iindex += kerneldatap[i].numrows; 132251d315f7SKerry Stevens } 13230ca81413SKerry Stevens MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 13240c74a584SJed Brown /* collect results */ 13250ca81413SKerry Stevens for(i=0; i<iNumThreads; i++) { 13260ca81413SKerry Stevens nonzerorow += kerneldatap[i].nzr; 13270ca81413SKerry Stevens } 132851d315f7SKerry Stevens free(kerneldatap); 132951d315f7SKerry Stevens free(pdata); 13300ca81413SKerry Stevens #endif 13310ca81413SKerry Stevens } 13320ca81413SKerry Stevens 13330ca81413SKerry Stevens ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 13340ca81413SKerry Stevens ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13350ca81413SKerry Stevens ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13360ca81413SKerry Stevens PetscFunctionReturn(0); 13370ca81413SKerry Stevens } 13380c74a584SJed Brown /* ******************* */ 1339ba61063dSBarry Smith #endif 13400ca81413SKerry Stevens 1341c6db04a5SJed Brown #include 
<../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 13424a2ae208SSatish Balay #undef __FUNCT__ 13434a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqAIJ" 1344dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 134517ab2063SBarry Smith { 1346416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1347f15663dcSBarry Smith PetscScalar *y,*z; 1348f15663dcSBarry Smith const PetscScalar *x; 134954f21887SBarry Smith const MatScalar *aa; 1350dfbe8321SBarry Smith PetscErrorCode ierr; 1351d0f46423SBarry Smith PetscInt m = A->rmap->n,*aj,*ii; 1352f15663dcSBarry Smith PetscInt n,i,*ridx=PETSC_NULL; 1353362ced78SSatish Balay PetscScalar sum; 1354ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 13559ea0dfa2SSatish Balay 13563a40ed3dSBarry Smith PetscFunctionBegin; 1357f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13581ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13592e8a6d31SBarry Smith if (zz != yy) { 13601ebc52fbSHong Zhang ierr = VecGetArray(zz,&z);CHKERRQ(ierr); 13612e8a6d31SBarry Smith } else { 13622e8a6d31SBarry Smith z = y; 13632e8a6d31SBarry Smith } 1364bfeeae90SHong Zhang 136597952fefSHong Zhang aj = a->j; 136697952fefSHong Zhang aa = a->a; 1367cddf8d76SBarry Smith ii = a->i; 13684eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 13694eb6d288SHong Zhang if (zz != yy){ 13704eb6d288SHong Zhang ierr = PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 13714eb6d288SHong Zhang } 137297952fefSHong Zhang m = a->compressedrow.nrows; 137397952fefSHong Zhang ii = a->compressedrow.i; 137497952fefSHong Zhang ridx = a->compressedrow.rindex; 137597952fefSHong Zhang for (i=0; i<m; i++){ 137697952fefSHong Zhang n = ii[i+1] - ii[i]; 137797952fefSHong Zhang aj = a->j + ii[i]; 137897952fefSHong Zhang aa = a->a + ii[i]; 137997952fefSHong Zhang sum = y[*ridx]; 1380f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 138197952fefSHong Zhang z[*ridx++] = sum; 138297952fefSHong Zhang 
} 138397952fefSHong Zhang } else { /* do not use compressed row format */ 1384f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 1385f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1386f15663dcSBarry Smith #else 138717ab2063SBarry Smith for (i=0; i<m; i++) { 1388f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1389f15663dcSBarry Smith aj = a->j + ii[i]; 1390f15663dcSBarry Smith aa = a->a + ii[i]; 139117ab2063SBarry Smith sum = y[i]; 1392f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 139317ab2063SBarry Smith z[i] = sum; 139417ab2063SBarry Smith } 139502ab625aSSatish Balay #endif 1396f15663dcSBarry Smith } 1397dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1398f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13991ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 14002e8a6d31SBarry Smith if (zz != yy) { 14011ebc52fbSHong Zhang ierr = VecRestoreArray(zz,&z);CHKERRQ(ierr); 14022e8a6d31SBarry Smith } 14038154be41SBarry Smith #if defined(PETSC_HAVE_CUSP) 14046b375ea7SVictor Minden /* 1405918e98c3SVictor Minden ierr = VecView(xx,0);CHKERRQ(ierr); 1406918e98c3SVictor Minden ierr = VecView(zz,0);CHKERRQ(ierr); 1407918e98c3SVictor Minden ierr = MatView(A,0);CHKERRQ(ierr); 14086b375ea7SVictor Minden */ 1409918e98c3SVictor Minden #endif 14103a40ed3dSBarry Smith PetscFunctionReturn(0); 141117ab2063SBarry Smith } 141217ab2063SBarry Smith 141317ab2063SBarry Smith /* 141417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
141517ab2063SBarry Smith */ 14164a2ae208SSatish Balay #undef __FUNCT__ 14174a2ae208SSatish Balay #define __FUNCT__ "MatMarkDiagonal_SeqAIJ" 1418dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 141917ab2063SBarry Smith { 1420416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14216849ba73SBarry Smith PetscErrorCode ierr; 1422d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 142317ab2063SBarry Smith 14243a40ed3dSBarry Smith PetscFunctionBegin; 142509f38230SBarry Smith if (!a->diag) { 142609f38230SBarry Smith ierr = PetscMalloc(m*sizeof(PetscInt),&a->diag);CHKERRQ(ierr); 14279518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(A, m*sizeof(PetscInt));CHKERRQ(ierr); 142809f38230SBarry Smith } 1429d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 143009f38230SBarry Smith a->diag[i] = a->i[i+1]; 1431bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1432bfeeae90SHong Zhang if (a->j[j] == i) { 143309f38230SBarry Smith a->diag[i] = j; 143417ab2063SBarry Smith break; 143517ab2063SBarry Smith } 143617ab2063SBarry Smith } 143717ab2063SBarry Smith } 14383a40ed3dSBarry Smith PetscFunctionReturn(0); 143917ab2063SBarry Smith } 144017ab2063SBarry Smith 1441be5855fcSBarry Smith /* 1442be5855fcSBarry Smith Checks for missing diagonals 1443be5855fcSBarry Smith */ 14444a2ae208SSatish Balay #undef __FUNCT__ 14454a2ae208SSatish Balay #define __FUNCT__ "MatMissingDiagonal_SeqAIJ" 1446ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1447be5855fcSBarry Smith { 1448be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 144997f1f81fSBarry Smith PetscInt *diag,*jj = a->j,i; 1450be5855fcSBarry Smith 1451be5855fcSBarry Smith PetscFunctionBegin; 145209f38230SBarry Smith *missing = PETSC_FALSE; 1453d0f46423SBarry Smith if (A->rmap->n > 0 && !jj) { 145409f38230SBarry Smith *missing = PETSC_TRUE; 145509f38230SBarry Smith if (d) *d = 0; 145609f38230SBarry Smith PetscInfo(A,"Matrix has no entries therefor is missing 
diagonal"); 145709f38230SBarry Smith } else { 1458f1e2ffcdSBarry Smith diag = a->diag; 1459d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1460bfeeae90SHong Zhang if (jj[diag[i]] != i) { 146109f38230SBarry Smith *missing = PETSC_TRUE; 146209f38230SBarry Smith if (d) *d = i; 146309f38230SBarry Smith PetscInfo1(A,"Matrix is missing diagonal number %D",i); 146409f38230SBarry Smith } 1465be5855fcSBarry Smith } 1466be5855fcSBarry Smith } 1467be5855fcSBarry Smith PetscFunctionReturn(0); 1468be5855fcSBarry Smith } 1469be5855fcSBarry Smith 147071f1c65dSBarry Smith EXTERN_C_BEGIN 147171f1c65dSBarry Smith #undef __FUNCT__ 147271f1c65dSBarry Smith #define __FUNCT__ "MatInvertDiagonal_SeqAIJ" 14737087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 147471f1c65dSBarry Smith { 147571f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 147671f1c65dSBarry Smith PetscErrorCode ierr; 1477d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 147854f21887SBarry Smith MatScalar *v = a->a; 147954f21887SBarry Smith PetscScalar *idiag,*mdiag; 148071f1c65dSBarry Smith 148171f1c65dSBarry Smith PetscFunctionBegin; 148271f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 148371f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 148471f1c65dSBarry Smith diag = a->diag; 148571f1c65dSBarry Smith if (!a->idiag) { 148671f1c65dSBarry Smith ierr = PetscMalloc3(m,PetscScalar,&a->idiag,m,PetscScalar,&a->mdiag,m,PetscScalar,&a->ssor_work);CHKERRQ(ierr); 148771f1c65dSBarry Smith ierr = PetscLogObjectMemory(A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 148871f1c65dSBarry Smith v = a->a; 148971f1c65dSBarry Smith } 149071f1c65dSBarry Smith mdiag = a->mdiag; 149171f1c65dSBarry Smith idiag = a->idiag; 149271f1c65dSBarry Smith 1493028cd4eaSSatish Balay if (omega == 1.0 && !PetscAbsScalar(fshift)) { 149471f1c65dSBarry Smith for (i=0; i<m; i++) { 149571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1496e32f2f54SBarry Smith if 
(!PetscAbsScalar(mdiag[i])) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 149771f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 149871f1c65dSBarry Smith } 149971f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 150071f1c65dSBarry Smith } else { 150171f1c65dSBarry Smith for (i=0; i<m; i++) { 150271f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 150371f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 150471f1c65dSBarry Smith } 1505dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*m);CHKERRQ(ierr); 150671f1c65dSBarry Smith } 150771f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 150871f1c65dSBarry Smith PetscFunctionReturn(0); 150971f1c65dSBarry Smith } 15105a9745a3SMatthew Knepley EXTERN_C_END 151171f1c65dSBarry Smith 1512c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 15134a2ae208SSatish Balay #undef __FUNCT__ 151441f059aeSBarry Smith #define __FUNCT__ "MatSOR_SeqAIJ" 151541f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 151617ab2063SBarry Smith { 1517416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1518e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 1519e6d1f457SBarry Smith const MatScalar *v = a->a,*idiag=0,*mdiag; 152054f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1521dfbe8321SBarry Smith PetscErrorCode ierr; 1522d0f46423SBarry Smith PetscInt n = A->cmap->n,m = A->rmap->n,i; 152397f1f81fSBarry Smith const PetscInt *idx,*diag; 152417ab2063SBarry Smith 15253a40ed3dSBarry Smith PetscFunctionBegin; 1526b965ef7fSBarry Smith its = its*lits; 152791723122SBarry Smith 152871f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 152971f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 153071f1c65dSBarry Smith a->fshift = fshift; 153171f1c65dSBarry Smith a->omega = omega; 
1532ed480e8bSBarry Smith 153371f1c65dSBarry Smith diag = a->diag; 153471f1c65dSBarry Smith t = a->ssor_work; 1535ed480e8bSBarry Smith idiag = a->idiag; 153671f1c65dSBarry Smith mdiag = a->mdiag; 1537ed480e8bSBarry Smith 15381ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 15393649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 154071f1c65dSBarry Smith CHKMEMQ; 1541ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 154217ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 154317ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1544ed480e8bSBarry Smith bs = b; 154517ab2063SBarry Smith for (i=0; i<m; i++) { 154671f1c65dSBarry Smith d = fshift + mdiag[i]; 1547416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1548ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1549ed480e8bSBarry Smith v = a->a + diag[i] + 1; 155017ab2063SBarry Smith sum = b[i]*d/omega; 1551003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 155217ab2063SBarry Smith x[i] = sum; 155317ab2063SBarry Smith } 15541ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 15553649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1556efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 15573a40ed3dSBarry Smith PetscFunctionReturn(0); 155817ab2063SBarry Smith } 1559c783ea89SBarry Smith 156048af12d7SBarry Smith if (flag == SOR_APPLY_LOWER) { 1561e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 15623a40ed3dSBarry Smith } else if (flag & SOR_EISENSTAT) { 156317ab2063SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 1564887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 156517ab2063SBarry Smith 156617ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 156717ab2063SBarry Smith 1568887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 
156917ab2063SBarry Smith */ 157017ab2063SBarry Smith scale = (2.0/omega) - 1.0; 157117ab2063SBarry Smith 157217ab2063SBarry Smith /* x = (E + U)^{-1} b */ 157317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1574416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1575ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1576ed480e8bSBarry Smith v = a->a + diag[i] + 1; 157717ab2063SBarry Smith sum = b[i]; 1578e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1579ed480e8bSBarry Smith x[i] = sum*idiag[i]; 158017ab2063SBarry Smith } 158117ab2063SBarry Smith 158217ab2063SBarry Smith /* t = b - (2*E - D)x */ 1583416022c9SBarry Smith v = a->a; 1584ed480e8bSBarry Smith for (i=0; i<m; i++) { t[i] = b[i] - scale*(v[*diag++])*x[i]; } 158517ab2063SBarry Smith 158617ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1587ed480e8bSBarry Smith ts = t; 1588416022c9SBarry Smith diag = a->diag; 158917ab2063SBarry Smith for (i=0; i<m; i++) { 1590416022c9SBarry Smith n = diag[i] - a->i[i]; 1591ed480e8bSBarry Smith idx = a->j + a->i[i]; 1592ed480e8bSBarry Smith v = a->a + a->i[i]; 159317ab2063SBarry Smith sum = t[i]; 1594003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1595ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1596733d66baSBarry Smith /* x = x + t */ 1597733d66baSBarry Smith x[i] += t[i]; 159817ab2063SBarry Smith } 159917ab2063SBarry Smith 1600dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 16011ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 16023649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 16033a40ed3dSBarry Smith PetscFunctionReturn(0); 160417ab2063SBarry Smith } 160517ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 160617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 160717ab2063SBarry Smith for (i=0; i<m; i++) { 1608416022c9SBarry Smith n = diag[i] - a->i[i]; 1609ed480e8bSBarry Smith idx = a->j + a->i[i]; 1610ed480e8bSBarry Smith v = a->a + a->i[i]; 
161117ab2063SBarry Smith sum = b[i]; 1612e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16135c99c7daSBarry Smith t[i] = sum; 1614ed480e8bSBarry Smith x[i] = sum*idiag[i]; 161517ab2063SBarry Smith } 16165c99c7daSBarry Smith xb = t; 1617efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 16183a40ed3dSBarry Smith } else xb = b; 161917ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 162017ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1621416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1622ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1623ed480e8bSBarry Smith v = a->a + diag[i] + 1; 162417ab2063SBarry Smith sum = xb[i]; 1625e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16265c99c7daSBarry Smith if (xb == b) { 1627ed480e8bSBarry Smith x[i] = sum*idiag[i]; 16285c99c7daSBarry Smith } else { 16295c99c7daSBarry Smith x[i] = (1-omega)*x[i] + sum*idiag[i]; 163017ab2063SBarry Smith } 16315c99c7daSBarry Smith } 1632efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 163317ab2063SBarry Smith } 163417ab2063SBarry Smith its--; 163517ab2063SBarry Smith } 163617ab2063SBarry Smith while (its--) { 163717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 163817ab2063SBarry Smith for (i=0; i<m; i++) { 1639416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1640ed480e8bSBarry Smith idx = a->j + a->i[i]; 1641ed480e8bSBarry Smith v = a->a + a->i[i]; 164217ab2063SBarry Smith sum = b[i]; 1643e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1644ed480e8bSBarry Smith x[i] = (1. 
- omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 164517ab2063SBarry Smith } 16469f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 164717ab2063SBarry Smith } 164817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 164917ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1650416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1651ed480e8bSBarry Smith idx = a->j + a->i[i]; 1652ed480e8bSBarry Smith v = a->a + a->i[i]; 165317ab2063SBarry Smith sum = b[i]; 1654e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1655ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 165617ab2063SBarry Smith } 16579f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 165817ab2063SBarry Smith } 165917ab2063SBarry Smith } 16601ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 16613649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 166271f1c65dSBarry Smith CHKMEMQ; PetscFunctionReturn(0); 166317ab2063SBarry Smith } 166417ab2063SBarry Smith 16652af78befSBarry Smith 16664a2ae208SSatish Balay #undef __FUNCT__ 16674a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqAIJ" 1668dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 166917ab2063SBarry Smith { 1670416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16714e220ebcSLois Curfman McInnes 16723a40ed3dSBarry Smith PetscFunctionBegin; 16734e220ebcSLois Curfman McInnes info->block_size = 1.0; 16744e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 16754e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 16764e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 16774e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 16788e58a170SBarry Smith info->mallocs = (double)A->info.mallocs; 16797adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 1680d5f3da31SBarry Smith if (A->factortype) { 16814e220ebcSLois 
Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 16824e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 16834e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 16844e220ebcSLois Curfman McInnes } else { 16854e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 16864e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 16874e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 16884e220ebcSLois Curfman McInnes } 16893a40ed3dSBarry Smith PetscFunctionReturn(0); 169017ab2063SBarry Smith } 169117ab2063SBarry Smith 16924a2ae208SSatish Balay #undef __FUNCT__ 16934a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqAIJ" 16942b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 169517ab2063SBarry Smith { 1696416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16973b98c0a2SBarry Smith PetscInt i,m = A->rmap->n - 1,d = 0; 16986849ba73SBarry Smith PetscErrorCode ierr; 169997b48c8fSBarry Smith const PetscScalar *xx; 170097b48c8fSBarry Smith PetscScalar *bb; 1701ace3abfcSBarry Smith PetscBool missing; 170217ab2063SBarry Smith 17033a40ed3dSBarry Smith PetscFunctionBegin; 170497b48c8fSBarry Smith if (x && b) { 170597b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 170697b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 170797b48c8fSBarry Smith for (i=0; i<N; i++) { 170897b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 170997b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 171097b48c8fSBarry Smith } 171197b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 171297b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 171397b48c8fSBarry Smith } 171497b48c8fSBarry Smith 1715a9817697SBarry Smith if (a->keepnonzeropattern) { 1716f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1717e32f2f54SBarry 
Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1718bfeeae90SHong Zhang ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 1719f1e2ffcdSBarry Smith } 1720f4df32b1SMatthew Knepley if (diag != 0.0) { 172109f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 1722e32f2f54SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 1723f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1724f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 1725f1e2ffcdSBarry Smith } 1726f1e2ffcdSBarry Smith } 172788e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 1728f1e2ffcdSBarry Smith } else { 1729f4df32b1SMatthew Knepley if (diag != 0.0) { 173017ab2063SBarry Smith for (i=0; i<N; i++) { 1731e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17327ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 1733416022c9SBarry Smith a->ilen[rows[i]] = 1; 1734f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 1735bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 17367ae801bdSBarry Smith } else { /* in case row was completely empty */ 1737f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 173817ab2063SBarry Smith } 173917ab2063SBarry Smith } 17403a40ed3dSBarry Smith } else { 174117ab2063SBarry Smith for (i=0; i<N; i++) { 1742e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1743416022c9SBarry Smith a->ilen[rows[i]] = 0; 174417ab2063SBarry Smith } 174517ab2063SBarry Smith } 174688e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 1747f1e2ffcdSBarry Smith } 174843a90d84SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17493a40ed3dSBarry Smith 
PetscFunctionReturn(0); 175017ab2063SBarry Smith } 175117ab2063SBarry Smith 17524a2ae208SSatish Balay #undef __FUNCT__ 17536e169961SBarry Smith #define __FUNCT__ "MatZeroRowsColumns_SeqAIJ" 17546e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17556e169961SBarry Smith { 17566e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17576e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 17586e169961SBarry Smith PetscErrorCode ierr; 17592b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 17606e169961SBarry Smith const PetscScalar *xx; 17616e169961SBarry Smith PetscScalar *bb; 17626e169961SBarry Smith 17636e169961SBarry Smith PetscFunctionBegin; 17646e169961SBarry Smith if (x && b) { 17656e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 17666e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17672b40b63fSBarry Smith vecs = PETSC_TRUE; 17686e169961SBarry Smith } 17696e169961SBarry Smith ierr = PetscMalloc(A->rmap->n*sizeof(PetscBool),&zeroed);CHKERRQ(ierr); 17706e169961SBarry Smith ierr = PetscMemzero(zeroed,A->rmap->n*sizeof(PetscBool));CHKERRQ(ierr); 17716e169961SBarry Smith for (i=0; i<N; i++) { 17726e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17736e169961SBarry Smith ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 17746e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 17756e169961SBarry Smith } 17766e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 17776e169961SBarry Smith if (!zeroed[i]) { 17786e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 17796e169961SBarry Smith if (zeroed[a->j[j]]) { 17802b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 17816e169961SBarry Smith a->a[j] = 0.0; 17826e169961SBarry Smith } 17836e169961SBarry Smith } 17842b40b63fSBarry Smith } else if (vecs) bb[i] 
= diag*xx[i]; 17856e169961SBarry Smith } 17866e169961SBarry Smith if (x && b) { 17876e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 17886e169961SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 17896e169961SBarry Smith } 17906e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 17916e169961SBarry Smith if (diag != 0.0) { 17926e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 17936e169961SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 17946e169961SBarry Smith for (i=0; i<N; i++) { 17956e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 17966e169961SBarry Smith } 17976e169961SBarry Smith } 17986e169961SBarry Smith A->same_nonzero = PETSC_TRUE; 17996e169961SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18006e169961SBarry Smith PetscFunctionReturn(0); 18016e169961SBarry Smith } 18026e169961SBarry Smith 18036e169961SBarry Smith #undef __FUNCT__ 18044a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqAIJ" 1805a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 180617ab2063SBarry Smith { 1807416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 180897f1f81fSBarry Smith PetscInt *itmp; 180917ab2063SBarry Smith 18103a40ed3dSBarry Smith PetscFunctionBegin; 1811e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 181217ab2063SBarry Smith 1813416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 1814bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 181517ab2063SBarry Smith if (idx) { 1816bfeeae90SHong Zhang itmp = a->j + a->i[row]; 1817bfeeae90SHong Zhang if (*nz) { 18184e093b46SBarry Smith *idx = itmp; 181917ab2063SBarry Smith } 182017ab2063SBarry Smith else *idx = 0; 182117ab2063SBarry Smith } 18223a40ed3dSBarry Smith PetscFunctionReturn(0); 
182317ab2063SBarry Smith } 182417ab2063SBarry Smith 1825bfeeae90SHong Zhang /* remove this function? */ 18264a2ae208SSatish Balay #undef __FUNCT__ 18274a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqAIJ" 1828a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 182917ab2063SBarry Smith { 18303a40ed3dSBarry Smith PetscFunctionBegin; 18313a40ed3dSBarry Smith PetscFunctionReturn(0); 183217ab2063SBarry Smith } 183317ab2063SBarry Smith 18344a2ae208SSatish Balay #undef __FUNCT__ 18354a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqAIJ" 1836dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 183717ab2063SBarry Smith { 1838416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 183954f21887SBarry Smith MatScalar *v = a->a; 184036db0b34SBarry Smith PetscReal sum = 0.0; 18416849ba73SBarry Smith PetscErrorCode ierr; 184297f1f81fSBarry Smith PetscInt i,j; 184317ab2063SBarry Smith 18443a40ed3dSBarry Smith PetscFunctionBegin; 184517ab2063SBarry Smith if (type == NORM_FROBENIUS) { 1846416022c9SBarry Smith for (i=0; i<a->nz; i++) { 1847aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 184836db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 184917ab2063SBarry Smith #else 185017ab2063SBarry Smith sum += (*v)*(*v); v++; 185117ab2063SBarry Smith #endif 185217ab2063SBarry Smith } 18538f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 18543a40ed3dSBarry Smith } else if (type == NORM_1) { 185536db0b34SBarry Smith PetscReal *tmp; 185697f1f81fSBarry Smith PetscInt *jj = a->j; 1857d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscReal),&tmp);CHKERRQ(ierr); 1858d0f46423SBarry Smith ierr = PetscMemzero(tmp,A->cmap->n*sizeof(PetscReal));CHKERRQ(ierr); 1859064f8208SBarry Smith *nrm = 0.0; 1860416022c9SBarry Smith for (j=0; j<a->nz; j++) { 1861bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 186217ab2063SBarry Smith } 1863d0f46423SBarry 
Smith for (j=0; j<A->cmap->n; j++) { 1864064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 186517ab2063SBarry Smith } 1866606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 18673a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1868064f8208SBarry Smith *nrm = 0.0; 1869d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1870bfeeae90SHong Zhang v = a->a + a->i[j]; 187117ab2063SBarry Smith sum = 0.0; 1872416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 1873cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 187417ab2063SBarry Smith } 1875064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 187617ab2063SBarry Smith } 18773a40ed3dSBarry Smith } else { 1878e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 187917ab2063SBarry Smith } 18803a40ed3dSBarry Smith PetscFunctionReturn(0); 188117ab2063SBarry Smith } 188217ab2063SBarry Smith 18834a2ae208SSatish Balay #undef __FUNCT__ 18844a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqAIJ" 1885fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqAIJ(Mat A,MatReuse reuse,Mat *B) 188617ab2063SBarry Smith { 1887416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1888416022c9SBarry Smith Mat C; 18896849ba73SBarry Smith PetscErrorCode ierr; 1890d0f46423SBarry Smith PetscInt i,*aj = a->j,*ai = a->i,m = A->rmap->n,len,*col; 189154f21887SBarry Smith MatScalar *array = a->a; 189217ab2063SBarry Smith 18933a40ed3dSBarry Smith PetscFunctionBegin; 1894e32f2f54SBarry Smith if (reuse == MAT_REUSE_MATRIX && A == *B && m != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Square matrix only for in-place"); 1895fc4dec0aSBarry Smith 1896fc4dec0aSBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B == A) { 1897d0f46423SBarry Smith ierr = PetscMalloc((1+A->cmap->n)*sizeof(PetscInt),&col);CHKERRQ(ierr); 1898d0f46423SBarry Smith ierr = PetscMemzero(col,(1+A->cmap->n)*sizeof(PetscInt));CHKERRQ(ierr); 1899bfeeae90SHong Zhang 1900bfeeae90SHong Zhang for (i=0; i<ai[m]; i++) 
col[aj[i]] += 1; 19017adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 1902d0f46423SBarry Smith ierr = MatSetSizes(C,A->cmap->n,m,A->cmap->n,m);CHKERRQ(ierr); 19037adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 1904ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,col);CHKERRQ(ierr); 1905606d414cSSatish Balay ierr = PetscFree(col);CHKERRQ(ierr); 1906a541d17aSBarry Smith } else { 1907a541d17aSBarry Smith C = *B; 1908a541d17aSBarry Smith } 1909a541d17aSBarry Smith 191017ab2063SBarry Smith for (i=0; i<m; i++) { 191117ab2063SBarry Smith len = ai[i+1]-ai[i]; 191287d4246cSBarry Smith ierr = MatSetValues_SeqAIJ(C,len,aj,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 1913b9b97703SBarry Smith array += len; 1914b9b97703SBarry Smith aj += len; 191517ab2063SBarry Smith } 19166d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19176d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 191817ab2063SBarry Smith 1919815cbec1SBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B != A) { 1920416022c9SBarry Smith *B = C; 192117ab2063SBarry Smith } else { 1922eb6b5d47SBarry Smith ierr = MatHeaderMerge(A,C);CHKERRQ(ierr); 192317ab2063SBarry Smith } 19243a40ed3dSBarry Smith PetscFunctionReturn(0); 192517ab2063SBarry Smith } 192617ab2063SBarry Smith 1927cd0d46ebSvictorle EXTERN_C_BEGIN 1928cd0d46ebSvictorle #undef __FUNCT__ 19295fbd3699SBarry Smith #define __FUNCT__ "MatIsTranspose_SeqAIJ" 19307087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 1931cd0d46ebSvictorle { 1932cd0d46ebSvictorle Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 193354f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 193454f21887SBarry Smith MatScalar *va,*vb; 19356849ba73SBarry Smith PetscErrorCode ierr; 193697f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 1937cd0d46ebSvictorle 1938cd0d46ebSvictorle 
PetscFunctionBegin; 1939cd0d46ebSvictorle bij = (Mat_SeqAIJ *) B->data; 1940cd0d46ebSvictorle 1941cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 1942cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 19435485867bSBarry Smith if (ma!=nb || na!=mb){ 19445485867bSBarry Smith *f = PETSC_FALSE; 19455485867bSBarry Smith PetscFunctionReturn(0); 19465485867bSBarry Smith } 1947cd0d46ebSvictorle aii = aij->i; bii = bij->i; 1948cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 1949cd0d46ebSvictorle va = aij->a; vb = bij->a; 195097f1f81fSBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 195197f1f81fSBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 1952cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 1953cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 1954cd0d46ebSvictorle 1955cd0d46ebSvictorle *f = PETSC_TRUE; 1956cd0d46ebSvictorle for (i=0; i<ma; i++) { 1957cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 195897f1f81fSBarry Smith PetscInt idc,idr; 19595485867bSBarry Smith PetscScalar vc,vr; 1960cd0d46ebSvictorle /* column/row index/value */ 19615485867bSBarry Smith idc = adx[aptr[i]]; 19625485867bSBarry Smith idr = bdx[bptr[idc]]; 19635485867bSBarry Smith vc = va[aptr[i]]; 19645485867bSBarry Smith vr = vb[bptr[idc]]; 19655485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 19665485867bSBarry Smith *f = PETSC_FALSE; 19675485867bSBarry Smith goto done; 1968cd0d46ebSvictorle } else { 19695485867bSBarry Smith aptr[i]++; 19705485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 1971cd0d46ebSvictorle } 1972cd0d46ebSvictorle } 1973cd0d46ebSvictorle } 1974cd0d46ebSvictorle done: 1975cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 19763aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 1977cd0d46ebSvictorle PetscFunctionReturn(0); 1978cd0d46ebSvictorle } 1979cd0d46ebSvictorle EXTERN_C_END 1980cd0d46ebSvictorle 19811cbb95d3SBarry Smith EXTERN_C_BEGIN 19821cbb95d3SBarry Smith #undef 
__FUNCT__ 19831cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitianTranspose_SeqAIJ" 19847087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 19851cbb95d3SBarry Smith { 19861cbb95d3SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 198754f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 198854f21887SBarry Smith MatScalar *va,*vb; 19891cbb95d3SBarry Smith PetscErrorCode ierr; 19901cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 19911cbb95d3SBarry Smith 19921cbb95d3SBarry Smith PetscFunctionBegin; 19931cbb95d3SBarry Smith bij = (Mat_SeqAIJ *) B->data; 19941cbb95d3SBarry Smith 19951cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 19961cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 19971cbb95d3SBarry Smith if (ma!=nb || na!=mb){ 19981cbb95d3SBarry Smith *f = PETSC_FALSE; 19991cbb95d3SBarry Smith PetscFunctionReturn(0); 20001cbb95d3SBarry Smith } 20011cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 20021cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 20031cbb95d3SBarry Smith va = aij->a; vb = bij->a; 20041cbb95d3SBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 20051cbb95d3SBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 20061cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 20071cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 20081cbb95d3SBarry Smith 20091cbb95d3SBarry Smith *f = PETSC_TRUE; 20101cbb95d3SBarry Smith for (i=0; i<ma; i++) { 20111cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 20121cbb95d3SBarry Smith PetscInt idc,idr; 20131cbb95d3SBarry Smith PetscScalar vc,vr; 20141cbb95d3SBarry Smith /* column/row index/value */ 20151cbb95d3SBarry Smith idc = adx[aptr[i]]; 20161cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 20171cbb95d3SBarry Smith vc = va[aptr[i]]; 20181cbb95d3SBarry Smith vr = vb[bptr[idc]]; 20191cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) 
> tol) { 20201cbb95d3SBarry Smith *f = PETSC_FALSE; 20211cbb95d3SBarry Smith goto done; 20221cbb95d3SBarry Smith } else { 20231cbb95d3SBarry Smith aptr[i]++; 20241cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 20251cbb95d3SBarry Smith } 20261cbb95d3SBarry Smith } 20271cbb95d3SBarry Smith } 20281cbb95d3SBarry Smith done: 20291cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 20301cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 20311cbb95d3SBarry Smith PetscFunctionReturn(0); 20321cbb95d3SBarry Smith } 20331cbb95d3SBarry Smith EXTERN_C_END 20341cbb95d3SBarry Smith 20359e29f15eSvictorle #undef __FUNCT__ 20369e29f15eSvictorle #define __FUNCT__ "MatIsSymmetric_SeqAIJ" 2037ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20389e29f15eSvictorle { 2039dfbe8321SBarry Smith PetscErrorCode ierr; 20409e29f15eSvictorle PetscFunctionBegin; 20415485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20429e29f15eSvictorle PetscFunctionReturn(0); 20439e29f15eSvictorle } 20449e29f15eSvictorle 20454a2ae208SSatish Balay #undef __FUNCT__ 20461cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitian_SeqAIJ" 2047ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20481cbb95d3SBarry Smith { 20491cbb95d3SBarry Smith PetscErrorCode ierr; 20501cbb95d3SBarry Smith PetscFunctionBegin; 20511cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20521cbb95d3SBarry Smith PetscFunctionReturn(0); 20531cbb95d3SBarry Smith } 20541cbb95d3SBarry Smith 20551cbb95d3SBarry Smith #undef __FUNCT__ 20564a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqAIJ" 2057dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 205817ab2063SBarry Smith { 2059416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 206054f21887SBarry Smith PetscScalar *l,*r,x; 206154f21887SBarry Smith MatScalar *v; 2062dfbe8321SBarry Smith PetscErrorCode 
ierr; 2063d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz,*jj; 206417ab2063SBarry Smith 20653a40ed3dSBarry Smith PetscFunctionBegin; 206617ab2063SBarry Smith if (ll) { 20673ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 20683ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2069e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2070e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 20711ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 2072416022c9SBarry Smith v = a->a; 207317ab2063SBarry Smith for (i=0; i<m; i++) { 207417ab2063SBarry Smith x = l[i]; 2075416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 207617ab2063SBarry Smith for (j=0; j<M; j++) { (*v++) *= x;} 207717ab2063SBarry Smith } 20781ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 2079efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 208017ab2063SBarry Smith } 208117ab2063SBarry Smith if (rr) { 2082e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2083e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 20841ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 2085416022c9SBarry Smith v = a->a; jj = a->j; 208617ab2063SBarry Smith for (i=0; i<nz; i++) { 2087bfeeae90SHong Zhang (*v++) *= r[*jj++]; 208817ab2063SBarry Smith } 20891ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 2090efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 209117ab2063SBarry Smith } 2092*86c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 2093*86c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 20943a40ed3dSBarry Smith PetscFunctionReturn(0); 209517ab2063SBarry Smith } 209617ab2063SBarry Smith 20974a2ae208SSatish Balay #undef __FUNCT__ 20984a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqAIJ" 209997f1f81fSBarry Smith 
PetscErrorCode MatGetSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 210017ab2063SBarry Smith { 2101db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 21026849ba73SBarry Smith PetscErrorCode ierr; 2103d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 210497f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 21055d0c19d7SBarry Smith const PetscInt *irow,*icol; 21065d0c19d7SBarry Smith PetscInt nrows,ncols; 210797f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 210854f21887SBarry Smith MatScalar *a_new,*mat_a; 2109416022c9SBarry Smith Mat C; 2110ace3abfcSBarry Smith PetscBool stride,sorted; 211117ab2063SBarry Smith 21123a40ed3dSBarry Smith PetscFunctionBegin; 211314ca34e6SBarry Smith ierr = ISSorted(isrow,&sorted);CHKERRQ(ierr); 2114e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"ISrow is not sorted"); 211514ca34e6SBarry Smith ierr = ISSorted(iscol,&sorted);CHKERRQ(ierr); 2116e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"IScol is not sorted"); 211799141d43SSatish Balay 211817ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2119b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2120b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 212117ab2063SBarry Smith 2122fee21e36SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 21230dbe5b1eSSatish Balay ierr = PetscTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2124fee21e36SBarry Smith if (stride && step == 1) { 212502834360SBarry Smith /* special case of contiguous rows */ 21260e83c824SBarry Smith ierr = PetscMalloc2(nrows,PetscInt,&lens,nrows,PetscInt,&starts);CHKERRQ(ierr); 212702834360SBarry Smith /* loop over new rows determining lens and starting points */ 212802834360SBarry Smith for (i=0; i<nrows; 
i++) { 2129bfeeae90SHong Zhang kstart = ai[irow[i]]; 2130a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 213102834360SBarry Smith for (k=kstart; k<kend; k++) { 2132bfeeae90SHong Zhang if (aj[k] >= first) { 213302834360SBarry Smith starts[i] = k; 213402834360SBarry Smith break; 213502834360SBarry Smith } 213602834360SBarry Smith } 2137a2744918SBarry Smith sum = 0; 213802834360SBarry Smith while (k < kend) { 2139bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2140a2744918SBarry Smith sum++; 214102834360SBarry Smith } 2142a2744918SBarry Smith lens[i] = sum; 214302834360SBarry Smith } 214402834360SBarry Smith /* create submatrix */ 2145cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 214697f1f81fSBarry Smith PetscInt n_cols,n_rows; 214708480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2148e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2149d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 215008480c60SBarry Smith C = *B; 21513a40ed3dSBarry Smith } else { 21527adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2153f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 21547adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2155ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 215608480c60SBarry Smith } 2157db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2158db02288aSLois Curfman McInnes 215902834360SBarry Smith /* loop over rows inserting into submatrix */ 2160db02288aSLois Curfman McInnes a_new = c->a; 2161db02288aSLois Curfman McInnes j_new = c->j; 2162db02288aSLois Curfman McInnes i_new = c->i; 2163bfeeae90SHong Zhang 216402834360SBarry Smith for (i=0; i<nrows; i++) { 2165a2744918SBarry Smith ii = starts[i]; 2166a2744918SBarry Smith lensi = lens[i]; 2167a2744918SBarry 
Smith for (k=0; k<lensi; k++) { 2168a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 216902834360SBarry Smith } 217087828ca2SBarry Smith ierr = PetscMemcpy(a_new,a->a + starts[i],lensi*sizeof(PetscScalar));CHKERRQ(ierr); 2171a2744918SBarry Smith a_new += lensi; 2172a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2173a2744918SBarry Smith c->ilen[i] = lensi; 217402834360SBarry Smith } 21750e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 21763a40ed3dSBarry Smith } else { 217702834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 21780e83c824SBarry Smith ierr = PetscMalloc(oldcols*sizeof(PetscInt),&smap);CHKERRQ(ierr); 217997f1f81fSBarry Smith ierr = PetscMemzero(smap,oldcols*sizeof(PetscInt));CHKERRQ(ierr); 21800e83c824SBarry Smith ierr = PetscMalloc((1+nrows)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 21814dcab191SBarry Smith for (i=0; i<ncols; i++) { 21824dcab191SBarry Smith #if defined(PETSC_USE_DEBUG) 21834dcab191SBarry Smith if (icol[i] >= oldcols) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D <= A->cmap->n %D",i,icol[i],oldcols); 21844dcab191SBarry Smith #endif 21854dcab191SBarry Smith smap[icol[i]] = i+1; 21864dcab191SBarry Smith } 21874dcab191SBarry Smith 218802834360SBarry Smith /* determine lens of each row */ 218902834360SBarry Smith for (i=0; i<nrows; i++) { 2190bfeeae90SHong Zhang kstart = ai[irow[i]]; 219102834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 219202834360SBarry Smith lens[i] = 0; 219302834360SBarry Smith for (k=kstart; k<kend; k++) { 2194bfeeae90SHong Zhang if (smap[aj[k]]) { 219502834360SBarry Smith lens[i]++; 219602834360SBarry Smith } 219702834360SBarry Smith } 219802834360SBarry Smith } 219917ab2063SBarry Smith /* Create and fill new matrix */ 2200a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2201ace3abfcSBarry Smith PetscBool equal; 22020f5bd95cSBarry Smith 220399141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2204e32f2f54SBarry 
Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2205d0f46423SBarry Smith ierr = PetscMemcmp(c->ilen,lens,(*B)->rmap->n*sizeof(PetscInt),&equal);CHKERRQ(ierr); 22060f5bd95cSBarry Smith if (!equal) { 2207e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 220899141d43SSatish Balay } 2209d0f46423SBarry Smith ierr = PetscMemzero(c->ilen,(*B)->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 221008480c60SBarry Smith C = *B; 22113a40ed3dSBarry Smith } else { 22127adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2213f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 22147adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2215ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 221608480c60SBarry Smith } 221799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 221817ab2063SBarry Smith for (i=0; i<nrows; i++) { 221999141d43SSatish Balay row = irow[i]; 2220bfeeae90SHong Zhang kstart = ai[row]; 222199141d43SSatish Balay kend = kstart + a->ilen[row]; 2222bfeeae90SHong Zhang mat_i = c->i[i]; 222399141d43SSatish Balay mat_j = c->j + mat_i; 222499141d43SSatish Balay mat_a = c->a + mat_i; 222599141d43SSatish Balay mat_ilen = c->ilen + i; 222617ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2227bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2228ed480e8bSBarry Smith *mat_j++ = tcol - 1; 222999141d43SSatish Balay *mat_a++ = a->a[k]; 223099141d43SSatish Balay (*mat_ilen)++; 223199141d43SSatish Balay 223217ab2063SBarry Smith } 223317ab2063SBarry Smith } 223417ab2063SBarry Smith } 223502834360SBarry Smith /* Free work space */ 223602834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2237606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2238606d414cSSatish Balay 
ierr = PetscFree(lens);CHKERRQ(ierr); 223902834360SBarry Smith } 22406d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22416d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 224217ab2063SBarry Smith 224317ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2244416022c9SBarry Smith *B = C; 22453a40ed3dSBarry Smith PetscFunctionReturn(0); 224617ab2063SBarry Smith } 224717ab2063SBarry Smith 22481df811f5SHong Zhang #undef __FUNCT__ 224982d44351SHong Zhang #define __FUNCT__ "MatGetMultiProcBlock_SeqAIJ" 225082d44351SHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,Mat* subMat) 225182d44351SHong Zhang { 225282d44351SHong Zhang PetscErrorCode ierr; 225382d44351SHong Zhang Mat B; 225482d44351SHong Zhang 225582d44351SHong Zhang PetscFunctionBegin; 225682d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 225782d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 225882d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 225982d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 226082d44351SHong Zhang *subMat = B; 226182d44351SHong Zhang PetscFunctionReturn(0); 226282d44351SHong Zhang } 226382d44351SHong Zhang 226482d44351SHong Zhang #undef __FUNCT__ 22654a2ae208SSatish Balay #define __FUNCT__ "MatILUFactor_SeqAIJ" 22660481f469SBarry Smith PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2267a871dcd8SBarry Smith { 226863b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2269dfbe8321SBarry Smith PetscErrorCode ierr; 227063b91edcSBarry Smith Mat outA; 2271ace3abfcSBarry Smith PetscBool row_identity,col_identity; 227263b91edcSBarry Smith 22733a40ed3dSBarry Smith PetscFunctionBegin; 2274e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place 
ilu"); 22751df811f5SHong Zhang 2276b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2277b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2278a871dcd8SBarry Smith 227963b91edcSBarry Smith outA = inA; 2280d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2281c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 22826bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 2283c3122656SLisandro Dalcin a->row = row; 2284c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 22856bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 2286c3122656SLisandro Dalcin a->col = col; 228763b91edcSBarry Smith 228836db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 22896bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 22904c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 229152e6d16bSBarry Smith ierr = PetscLogObjectParent(inA,a->icol);CHKERRQ(ierr); 2292f0ec6fceSSatish Balay 229394a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2294d0f46423SBarry Smith ierr = PetscMalloc((inA->rmap->n+1)*sizeof(PetscScalar),&a->solve_work);CHKERRQ(ierr); 2295d0f46423SBarry Smith ierr = PetscLogObjectMemory(inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 229694a9d846SBarry Smith } 229763b91edcSBarry Smith 2298f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2299137fb511SHong Zhang if (row_identity && col_identity) { 2300ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2301137fb511SHong Zhang } else { 2302719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2303137fb511SHong Zhang } 23043a40ed3dSBarry Smith PetscFunctionReturn(0); 2305a871dcd8SBarry Smith } 2306a871dcd8SBarry Smith 23074a2ae208SSatish Balay #undef 
__FUNCT__ 23084a2ae208SSatish Balay #define __FUNCT__ "MatScale_SeqAIJ" 2309f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2310f0b747eeSBarry Smith { 2311f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2312f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2313efee365bSSatish Balay PetscErrorCode ierr; 23140805154bSBarry Smith PetscBLASInt one = 1,bnz = PetscBLASIntCast(a->nz); 23153a40ed3dSBarry Smith 23163a40ed3dSBarry Smith PetscFunctionBegin; 2317f4df32b1SMatthew Knepley BLASscal_(&bnz,&oalpha,a->a,&one); 2318efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 2319*86c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 2320*86c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 23213a40ed3dSBarry Smith PetscFunctionReturn(0); 2322f0b747eeSBarry Smith } 2323f0b747eeSBarry Smith 23244a2ae208SSatish Balay #undef __FUNCT__ 23254a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqAIJ" 232697f1f81fSBarry Smith PetscErrorCode MatGetSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2327cddf8d76SBarry Smith { 2328dfbe8321SBarry Smith PetscErrorCode ierr; 232997f1f81fSBarry Smith PetscInt i; 2330cddf8d76SBarry Smith 23313a40ed3dSBarry Smith PetscFunctionBegin; 2332cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2333b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 2334cddf8d76SBarry Smith } 2335cddf8d76SBarry Smith 2336cddf8d76SBarry Smith for (i=0; i<n; i++) { 23376a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2338cddf8d76SBarry Smith } 23393a40ed3dSBarry Smith PetscFunctionReturn(0); 2340cddf8d76SBarry Smith } 2341cddf8d76SBarry Smith 23424a2ae208SSatish Balay #undef __FUNCT__ 23434a2ae208SSatish Balay #define __FUNCT__ "MatIncreaseOverlap_SeqAIJ" 234497f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 
23454dcbc457SBarry Smith { 2346e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23476849ba73SBarry Smith PetscErrorCode ierr; 23485d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 23495d0c19d7SBarry Smith const PetscInt *idx; 235097f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2351f1af5d2fSBarry Smith PetscBT table; 2352bbd702dbSSatish Balay 23533a40ed3dSBarry Smith PetscFunctionBegin; 2354d0f46423SBarry Smith m = A->rmap->n; 2355e4d965acSSatish Balay ai = a->i; 2356bfeeae90SHong Zhang aj = a->j; 23578a047759SSatish Balay 2358e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 235906763907SSatish Balay 236097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nidx);CHKERRQ(ierr); 23616831982aSBarry Smith ierr = PetscBTCreate(m,table);CHKERRQ(ierr); 236206763907SSatish Balay 2363e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2364b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2365e4d965acSSatish Balay isz = 0; 23666831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2367e4d965acSSatish Balay 2368e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 23694dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2370b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2371e4d965acSSatish Balay 2372dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2373e4d965acSSatish Balay for (j=0; j<n ; ++j){ 2374f1af5d2fSBarry Smith if(!PetscBTLookupSet(table,idx[j])) { nidx[isz++] = idx[j];} 23754dcbc457SBarry Smith } 237606763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 23776bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2378e4d965acSSatish Balay 237904a348a9SBarry Smith k = 0; 238004a348a9SBarry Smith for (j=0; j<ov; j++){ /* for each overlap */ 238104a348a9SBarry Smith n = isz; 238206763907SSatish Balay for (; k<n ; k++){ /* do only those rows in nidx[k], which are not done yet */ 2383e4d965acSSatish Balay row = nidx[k]; 2384e4d965acSSatish Balay start = ai[row]; 2385e4d965acSSatish Balay end = ai[row+1]; 238604a348a9SBarry Smith for (l = start; l<end ; l++){ 2387efb16452SHong Zhang val = aj[l] ; 2388f1af5d2fSBarry Smith if (!PetscBTLookupSet(table,val)) {nidx[isz++] = val;} 2389e4d965acSSatish Balay } 2390e4d965acSSatish Balay } 2391e4d965acSSatish Balay } 239270b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2393e4d965acSSatish Balay } 23946831982aSBarry Smith ierr = PetscBTDestroy(table);CHKERRQ(ierr); 2395606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 23963a40ed3dSBarry Smith PetscFunctionReturn(0); 23974dcbc457SBarry Smith } 239817ab2063SBarry Smith 23990513a670SBarry Smith /* -------------------------------------------------------------- */ 24004a2ae208SSatish Balay #undef __FUNCT__ 24014a2ae208SSatish Balay #define __FUNCT__ "MatPermute_SeqAIJ" 2402dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 24030513a670SBarry Smith { 24040513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 24056849ba73SBarry Smith PetscErrorCode ierr; 24063b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 24075d0c19d7SBarry Smith const PetscInt *row,*col; 24085d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 240956cd22aeSBarry 
Smith IS icolp,irowp; 24103b98c0a2SBarry Smith PetscInt *cwork = PETSC_NULL; 24113b98c0a2SBarry Smith PetscScalar *vwork = PETSC_NULL; 24120513a670SBarry Smith 24133a40ed3dSBarry Smith PetscFunctionBegin; 24144c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 241556cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 24164c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 241756cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 24180513a670SBarry Smith 24190513a670SBarry Smith /* determine lengths of permuted rows */ 242097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 24210513a670SBarry Smith for (i=0; i<m; i++) { 24220513a670SBarry Smith lens[row[i]] = a->i[i+1] - a->i[i]; 24230513a670SBarry Smith } 24247adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 2425f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 24267adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2427ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2428606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 24290513a670SBarry Smith 243097f1f81fSBarry Smith ierr = PetscMalloc(n*sizeof(PetscInt),&cnew);CHKERRQ(ierr); 24310513a670SBarry Smith for (i=0; i<m; i++) { 243232ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24330513a670SBarry Smith for (j=0; j<nz; j++) { cnew[j] = col[cwork[j]];} 2434cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 243532ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24360513a670SBarry Smith } 2437606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 24383c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 24390513a670SBarry Smith ierr = 
MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 24400513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 244156cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 244256cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 24436bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 24446bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 24453a40ed3dSBarry Smith PetscFunctionReturn(0); 24460513a670SBarry Smith } 24470513a670SBarry Smith 24484a2ae208SSatish Balay #undef __FUNCT__ 24494a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqAIJ" 2450dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2451cb5b572fSBarry Smith { 2452dfbe8321SBarry Smith PetscErrorCode ierr; 2453cb5b572fSBarry Smith 2454cb5b572fSBarry Smith PetscFunctionBegin; 245533f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 245633f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2457be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2458be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2459be6bf707SBarry Smith 2460700c5bfcSBarry Smith if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 2461d0f46423SBarry Smith ierr = PetscMemcpy(b->a,a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 2462cb5b572fSBarry Smith } else { 2463cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2464cb5b572fSBarry Smith } 2465cb5b572fSBarry Smith PetscFunctionReturn(0); 2466cb5b572fSBarry Smith } 2467cb5b572fSBarry Smith 24684a2ae208SSatish Balay #undef __FUNCT__ 24694a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqAIJ" 2470dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqAIJ(Mat A) 2471273d9f13SBarry Smith { 2472dfbe8321SBarry Smith PetscErrorCode ierr; 
2473273d9f13SBarry Smith 2474273d9f13SBarry Smith PetscFunctionBegin; 2475ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2476273d9f13SBarry Smith PetscFunctionReturn(0); 2477273d9f13SBarry Smith } 2478273d9f13SBarry Smith 24794a2ae208SSatish Balay #undef __FUNCT__ 24804a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqAIJ" 2481a77337e4SBarry Smith PetscErrorCode MatGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 24826c0721eeSBarry Smith { 24836c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 24846c0721eeSBarry Smith PetscFunctionBegin; 24856c0721eeSBarry Smith *array = a->a; 24866c0721eeSBarry Smith PetscFunctionReturn(0); 24876c0721eeSBarry Smith } 24886c0721eeSBarry Smith 24894a2ae208SSatish Balay #undef __FUNCT__ 24904a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqAIJ" 2491dfbe8321SBarry Smith PetscErrorCode MatRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 24926c0721eeSBarry Smith { 24936c0721eeSBarry Smith PetscFunctionBegin; 24946c0721eeSBarry Smith PetscFunctionReturn(0); 24956c0721eeSBarry Smith } 2496273d9f13SBarry Smith 2497ee4f033dSBarry Smith #undef __FUNCT__ 2498ee4f033dSBarry Smith #define __FUNCT__ "MatFDColoringApply_SeqAIJ" 2499dfbe8321SBarry Smith PetscErrorCode MatFDColoringApply_SeqAIJ(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx) 2500ee4f033dSBarry Smith { 25016849ba73SBarry Smith PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void *))coloring->f; 25026849ba73SBarry Smith PetscErrorCode ierr; 250397f1f81fSBarry Smith PetscInt k,N,start,end,l,row,col,srow,**vscaleforrow,m1,m2; 2504efb30889SBarry Smith PetscScalar dx,*y,*xx,*w3_array; 250587828ca2SBarry Smith PetscScalar *vscale_array; 2506ee4f033dSBarry Smith PetscReal epsilon = coloring->error_rel,umin = coloring->umin; 2507ee4f033dSBarry Smith Vec w1,w2,w3; 2508ee4f033dSBarry Smith void *fctx = coloring->fctx; 2509ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 
2510ee4f033dSBarry Smith 2511ee4f033dSBarry Smith PetscFunctionBegin; 2512ee4f033dSBarry Smith if (!coloring->w1) { 2513ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w1);CHKERRQ(ierr); 251452e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w1);CHKERRQ(ierr); 2515ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w2);CHKERRQ(ierr); 251652e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w2);CHKERRQ(ierr); 2517ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr); 251852e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w3);CHKERRQ(ierr); 2519ee4f033dSBarry Smith } 2520ee4f033dSBarry Smith w1 = coloring->w1; w2 = coloring->w2; w3 = coloring->w3; 2521ee4f033dSBarry Smith 2522ee4f033dSBarry Smith ierr = MatSetUnfactored(J);CHKERRQ(ierr); 2523acfcf0e5SJed Brown ierr = PetscOptionsGetBool(((PetscObject)coloring)->prefix,"-mat_fd_coloring_dont_rezero",&flg,PETSC_NULL);CHKERRQ(ierr); 2524ee4f033dSBarry Smith if (flg) { 2525ae15b995SBarry Smith ierr = PetscInfo(coloring,"Not calling MatZeroEntries()\n");CHKERRQ(ierr); 2526ee4f033dSBarry Smith } else { 2527ace3abfcSBarry Smith PetscBool assembled; 25280b9b6f31SBarry Smith ierr = MatAssembled(J,&assembled);CHKERRQ(ierr); 25290b9b6f31SBarry Smith if (assembled) { 2530ee4f033dSBarry Smith ierr = MatZeroEntries(J);CHKERRQ(ierr); 2531ee4f033dSBarry Smith } 25320b9b6f31SBarry Smith } 2533ee4f033dSBarry Smith 2534ee4f033dSBarry Smith ierr = VecGetOwnershipRange(x1,&start,&end);CHKERRQ(ierr); 2535ee4f033dSBarry Smith ierr = VecGetSize(x1,&N);CHKERRQ(ierr); 2536ee4f033dSBarry Smith 2537ee4f033dSBarry Smith /* 2538ee4f033dSBarry Smith This is a horrible, horrible, hack. 
See DMMGComputeJacobian_Multigrid() it inproperly sets 2539ee4f033dSBarry Smith coloring->F for the coarser grids from the finest 2540ee4f033dSBarry Smith */ 2541ee4f033dSBarry Smith if (coloring->F) { 2542ee4f033dSBarry Smith ierr = VecGetLocalSize(coloring->F,&m1);CHKERRQ(ierr); 2543ee4f033dSBarry Smith ierr = VecGetLocalSize(w1,&m2);CHKERRQ(ierr); 2544ee4f033dSBarry Smith if (m1 != m2) { 2545ee4f033dSBarry Smith coloring->F = 0; 2546ee4f033dSBarry Smith } 2547ee4f033dSBarry Smith } 2548ee4f033dSBarry Smith 2549ee4f033dSBarry Smith if (coloring->F) { 2550ee4f033dSBarry Smith w1 = coloring->F; 2551ee4f033dSBarry Smith coloring->F = 0; 2552ee4f033dSBarry Smith } else { 255366f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2554ee4f033dSBarry Smith ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr); 255566f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2556ee4f033dSBarry Smith } 2557ee4f033dSBarry Smith 2558ee4f033dSBarry Smith /* 2559ee4f033dSBarry Smith Compute all the scale factors and share with other processors 2560ee4f033dSBarry Smith */ 25611ebc52fbSHong Zhang ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);xx = xx - start; 25621ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr);vscale_array = vscale_array - start; 2563ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 2564ee4f033dSBarry Smith /* 2565ee4f033dSBarry Smith Loop over each column associated with color adding the 2566ee4f033dSBarry Smith perturbation to the vector w3. 
2567ee4f033dSBarry Smith */ 2568ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2569ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2570ee4f033dSBarry Smith dx = xx[col]; 2571ee4f033dSBarry Smith if (dx == 0.0) dx = 1.0; 2572ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2573ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2574ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2575ee4f033dSBarry Smith #else 2576ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2577ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2578ee4f033dSBarry Smith #endif 2579ee4f033dSBarry Smith dx *= epsilon; 2580ee4f033dSBarry Smith vscale_array[col] = 1.0/dx; 2581ee4f033dSBarry Smith } 2582ee4f033dSBarry Smith } 25831ebc52fbSHong Zhang vscale_array = vscale_array + start;ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2584ee4f033dSBarry Smith ierr = VecGhostUpdateBegin(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2585ee4f033dSBarry Smith ierr = VecGhostUpdateEnd(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2586ee4f033dSBarry Smith 2587ee4f033dSBarry Smith /* ierr = VecView(coloring->vscale,PETSC_VIEWER_STDOUT_WORLD); 2588ee4f033dSBarry Smith ierr = VecView(x1,PETSC_VIEWER_STDOUT_WORLD);*/ 2589ee4f033dSBarry Smith 2590ee4f033dSBarry Smith if (coloring->vscaleforrow) vscaleforrow = coloring->vscaleforrow; 2591ee4f033dSBarry Smith else vscaleforrow = coloring->columnsforrow; 2592ee4f033dSBarry Smith 25931ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2594ee4f033dSBarry Smith /* 2595ee4f033dSBarry Smith Loop over each color 2596ee4f033dSBarry Smith */ 2597ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 259849b058dcSBarry Smith coloring->currentcolor = k; 2599ee4f033dSBarry Smith ierr = 
VecCopy(x1,w3);CHKERRQ(ierr); 26001ebc52fbSHong Zhang ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);w3_array = w3_array - start; 2601ee4f033dSBarry Smith /* 2602ee4f033dSBarry Smith Loop over each column associated with color adding the 2603ee4f033dSBarry Smith perturbation to the vector w3. 2604ee4f033dSBarry Smith */ 2605ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2606ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2607ee4f033dSBarry Smith dx = xx[col]; 26085b8514ebSBarry Smith if (dx == 0.0) dx = 1.0; 2609ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2610ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2611ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2612ee4f033dSBarry Smith #else 2613ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2614ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2615ee4f033dSBarry Smith #endif 2616ee4f033dSBarry Smith dx *= epsilon; 2617e32f2f54SBarry Smith if (!PetscAbsScalar(dx)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Computed 0 differencing parameter"); 2618ee4f033dSBarry Smith w3_array[col] += dx; 2619ee4f033dSBarry Smith } 26201ebc52fbSHong Zhang w3_array = w3_array + start; ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr); 2621ee4f033dSBarry Smith 2622ee4f033dSBarry Smith /* 2623ee4f033dSBarry Smith Evaluate function at x1 + dx (here dx is a vector of perturbations) 2624ee4f033dSBarry Smith */ 2625ee4f033dSBarry Smith 262666f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2627ee4f033dSBarry Smith ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr); 262866f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2629efb30889SBarry Smith ierr = VecAXPY(w2,-1.0,w1);CHKERRQ(ierr); 2630ee4f033dSBarry Smith 2631ee4f033dSBarry Smith /* 2632ee4f033dSBarry Smith Loop over rows of 
vector, putting results into Jacobian matrix 2633ee4f033dSBarry Smith */ 26341ebc52fbSHong Zhang ierr = VecGetArray(w2,&y);CHKERRQ(ierr); 2635ee4f033dSBarry Smith for (l=0; l<coloring->nrows[k]; l++) { 2636ee4f033dSBarry Smith row = coloring->rows[k][l]; 2637ee4f033dSBarry Smith col = coloring->columnsforrow[k][l]; 2638ee4f033dSBarry Smith y[row] *= vscale_array[vscaleforrow[k][l]]; 2639ee4f033dSBarry Smith srow = row + start; 2640ee4f033dSBarry Smith ierr = MatSetValues_SeqAIJ(J,1,&srow,1,&col,y+row,INSERT_VALUES);CHKERRQ(ierr); 2641ee4f033dSBarry Smith } 26421ebc52fbSHong Zhang ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr); 2643ee4f033dSBarry Smith } 264449b058dcSBarry Smith coloring->currentcolor = k; 26451ebc52fbSHong Zhang ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 26461ebc52fbSHong Zhang xx = xx + start; ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr); 2647ee4f033dSBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2648ee4f033dSBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2649ee4f033dSBarry Smith PetscFunctionReturn(0); 2650ee4f033dSBarry Smith } 2651ee4f033dSBarry Smith 26528229c054SShri Abhyankar /* 26538229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 26548229c054SShri Abhyankar have different nonzero structure. 
26558229c054SShri Abhyankar */ 2656ac90fabeSBarry Smith #undef __FUNCT__ 26578229c054SShri Abhyankar #define __FUNCT__ "MatAXPYGetPreallocation_SeqAIJ" 26588229c054SShri Abhyankar PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt* nnz) 2659ec7775f6SShri Abhyankar { 26608229c054SShri Abhyankar PetscInt i,m=Y->rmap->N; 2661ec7775f6SShri Abhyankar Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2662ec7775f6SShri Abhyankar Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2663ec7775f6SShri Abhyankar const PetscInt *xi = x->i,*yi = y->i; 2664ec7775f6SShri Abhyankar 2665ec7775f6SShri Abhyankar PetscFunctionBegin; 2666ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2667ec7775f6SShri Abhyankar for(i=0; i<m; i++) { 26688af7cee1SJed Brown PetscInt j,k,nzx = xi[i+1] - xi[i],nzy = yi[i+1] - yi[i]; 26698af7cee1SJed Brown const PetscInt *xj = x->j+xi[i],*yj = y->j+yi[i]; 26708af7cee1SJed Brown nnz[i] = 0; 26718af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 26728af7cee1SJed Brown for (; k<nzy && yj[k]<xj[j]; k++) nnz[i]++; /* Catch up to X */ 26738af7cee1SJed Brown if (k<nzy && yj[k]==xj[j]) k++; /* Skip duplicate */ 26748af7cee1SJed Brown nnz[i]++; 26758af7cee1SJed Brown } 26768af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2677ec7775f6SShri Abhyankar } 2678ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2679ec7775f6SShri Abhyankar } 2680ec7775f6SShri Abhyankar 2681ec7775f6SShri Abhyankar #undef __FUNCT__ 2682ac90fabeSBarry Smith #define __FUNCT__ "MatAXPY_SeqAIJ" 2683f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2684ac90fabeSBarry Smith { 2685dfbe8321SBarry Smith PetscErrorCode ierr; 268697f1f81fSBarry Smith PetscInt i; 2687ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data,*y = (Mat_SeqAIJ *)Y->data; 26880805154bSBarry Smith PetscBLASInt one=1,bnz = PetscBLASIntCast(x->nz); 2689ac90fabeSBarry Smith 2690ac90fabeSBarry Smith PetscFunctionBegin; 2691ac90fabeSBarry Smith if (str == 
SAME_NONZERO_PATTERN) { 2692f4df32b1SMatthew Knepley PetscScalar alpha = a; 2693f4df32b1SMatthew Knepley BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one); 2694*86c113feSBarry Smith y->idiagvalid = PETSC_FALSE; 2695*86c113feSBarry Smith y->ibdiagvalid = PETSC_FALSE; 2696c537a176SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2697a30b2313SHong Zhang if (y->xtoy && y->XtoY != X) { 2698a30b2313SHong Zhang ierr = PetscFree(y->xtoy);CHKERRQ(ierr); 26996bf464f9SBarry Smith ierr = MatDestroy(&y->XtoY);CHKERRQ(ierr); 2700a30b2313SHong Zhang } 2701a30b2313SHong Zhang if (!y->xtoy) { /* get xtoy */ 2702d0f46423SBarry Smith ierr = MatAXPYGetxtoy_Private(X->rmap->n,x->i,x->j,PETSC_NULL, y->i,y->j,PETSC_NULL, &y->xtoy);CHKERRQ(ierr); 2703a30b2313SHong Zhang y->XtoY = X; 2704407f6b05SHong Zhang ierr = PetscObjectReference((PetscObject)X);CHKERRQ(ierr); 2705c537a176SHong Zhang } 2706f4df32b1SMatthew Knepley for (i=0; i<x->nz; i++) y->a[y->xtoy[i]] += a*(x->a[i]); 27071e2582c4SBarry Smith ierr = PetscInfo3(Y,"ratio of nnz(X)/nnz(Y): %d/%d = %G\n",x->nz,y->nz,(PetscReal)(x->nz)/y->nz);CHKERRQ(ierr); 2708ac90fabeSBarry Smith } else { 27098229c054SShri Abhyankar Mat B; 27108229c054SShri Abhyankar PetscInt *nnz; 271116b2e9dcSShri Abhyankar ierr = PetscMalloc(Y->rmap->N*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2712ec7775f6SShri Abhyankar ierr = MatCreate(((PetscObject)Y)->comm,&B);CHKERRQ(ierr); 2713bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 27144aa94f47SShri Abhyankar ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 2715ec7775f6SShri Abhyankar ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 27168229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 27178229c054SShri Abhyankar ierr = MatSeqAIJSetPreallocation(B,PETSC_NULL,nnz);CHKERRQ(ierr); 2718ec7775f6SShri Abhyankar ierr = 
MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 2719ec7775f6SShri Abhyankar ierr = MatHeaderReplace(Y,B);CHKERRQ(ierr); 27208229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 2721ac90fabeSBarry Smith } 2722ac90fabeSBarry Smith PetscFunctionReturn(0); 2723ac90fabeSBarry Smith } 2724ac90fabeSBarry Smith 2725521d7252SBarry Smith #undef __FUNCT__ 2726521d7252SBarry Smith #define __FUNCT__ "MatSetBlockSize_SeqAIJ" 2727521d7252SBarry Smith PetscErrorCode MatSetBlockSize_SeqAIJ(Mat A,PetscInt bs) 2728521d7252SBarry Smith { 272941c166b1SJed Brown PetscErrorCode ierr; 273041c166b1SJed Brown 2731521d7252SBarry Smith PetscFunctionBegin; 273241c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->rmap,bs);CHKERRQ(ierr); 273341c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->cmap,bs);CHKERRQ(ierr); 2734521d7252SBarry Smith PetscFunctionReturn(0); 2735521d7252SBarry Smith } 2736521d7252SBarry Smith 2737354c94deSBarry Smith #undef __FUNCT__ 2738354c94deSBarry Smith #define __FUNCT__ "MatConjugate_SeqAIJ" 27397087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 2740354c94deSBarry Smith { 2741354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2742354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 2743354c94deSBarry Smith PetscInt i,nz; 2744354c94deSBarry Smith PetscScalar *a; 2745354c94deSBarry Smith 2746354c94deSBarry Smith PetscFunctionBegin; 2747354c94deSBarry Smith nz = aij->nz; 2748354c94deSBarry Smith a = aij->a; 2749354c94deSBarry Smith for (i=0; i<nz; i++) { 2750354c94deSBarry Smith a[i] = PetscConj(a[i]); 2751354c94deSBarry Smith } 2752354c94deSBarry Smith #else 2753354c94deSBarry Smith PetscFunctionBegin; 2754354c94deSBarry Smith #endif 2755354c94deSBarry Smith PetscFunctionReturn(0); 2756354c94deSBarry Smith } 2757354c94deSBarry Smith 2758e34fafa9SBarry Smith #undef __FUNCT__ 2759985db425SBarry Smith #define __FUNCT__ "MatGetRowMaxAbs_SeqAIJ" 2760985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt 
idx[]) 2761e34fafa9SBarry Smith { 2762e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2763e34fafa9SBarry Smith PetscErrorCode ierr; 2764d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2765e34fafa9SBarry Smith PetscReal atmp; 2766985db425SBarry Smith PetscScalar *x; 2767e34fafa9SBarry Smith MatScalar *aa; 2768e34fafa9SBarry Smith 2769e34fafa9SBarry Smith PetscFunctionBegin; 2770e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2771e34fafa9SBarry Smith aa = a->a; 2772e34fafa9SBarry Smith ai = a->i; 2773e34fafa9SBarry Smith aj = a->j; 2774e34fafa9SBarry Smith 2775985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2776e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2777e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2778e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2779e34fafa9SBarry Smith for (i=0; i<m; i++) { 2780e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 27819189402eSHong Zhang x[i] = 0.0; 2782e34fafa9SBarry Smith for (j=0; j<ncols; j++){ 2783985db425SBarry Smith atmp = PetscAbsScalar(*aa); 2784985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2785985db425SBarry Smith aa++; aj++; 2786985db425SBarry Smith } 2787985db425SBarry Smith } 2788985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2789985db425SBarry Smith PetscFunctionReturn(0); 2790985db425SBarry Smith } 2791985db425SBarry Smith 2792985db425SBarry Smith #undef __FUNCT__ 2793985db425SBarry Smith #define __FUNCT__ "MatGetRowMax_SeqAIJ" 2794985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2795985db425SBarry Smith { 2796985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2797985db425SBarry Smith PetscErrorCode ierr; 2798d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2799985db425SBarry 
Smith PetscScalar *x; 2800985db425SBarry Smith MatScalar *aa; 2801985db425SBarry Smith 2802985db425SBarry Smith PetscFunctionBegin; 2803e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2804985db425SBarry Smith aa = a->a; 2805985db425SBarry Smith ai = a->i; 2806985db425SBarry Smith aj = a->j; 2807985db425SBarry Smith 2808985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2809985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2810985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2811e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2812985db425SBarry Smith for (i=0; i<m; i++) { 2813985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2814d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2815985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2816985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 2817985db425SBarry Smith x[i] = 0.0; 2818985db425SBarry Smith if (idx) { 2819985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2820985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 2821985db425SBarry Smith if (aj[j] > j) { 2822985db425SBarry Smith idx[i] = j; 2823985db425SBarry Smith break; 2824985db425SBarry Smith } 2825985db425SBarry Smith } 2826985db425SBarry Smith } 2827985db425SBarry Smith } 2828985db425SBarry Smith for (j=0; j<ncols; j++){ 2829985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2830985db425SBarry Smith aa++; aj++; 2831985db425SBarry Smith } 2832985db425SBarry Smith } 2833985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2834985db425SBarry Smith PetscFunctionReturn(0); 2835985db425SBarry Smith } 2836985db425SBarry Smith 2837985db425SBarry Smith #undef __FUNCT__ 2838c87e5d42SMatthew Knepley #define __FUNCT__ 
"MatGetRowMinAbs_SeqAIJ" 2839c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2840c87e5d42SMatthew Knepley { 2841c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2842c87e5d42SMatthew Knepley PetscErrorCode ierr; 2843c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2844c87e5d42SMatthew Knepley PetscReal atmp; 2845c87e5d42SMatthew Knepley PetscScalar *x; 2846c87e5d42SMatthew Knepley MatScalar *aa; 2847c87e5d42SMatthew Knepley 2848c87e5d42SMatthew Knepley PetscFunctionBegin; 2849e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2850c87e5d42SMatthew Knepley aa = a->a; 2851c87e5d42SMatthew Knepley ai = a->i; 2852c87e5d42SMatthew Knepley aj = a->j; 2853c87e5d42SMatthew Knepley 2854c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 2855c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2856c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2857e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2858c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 2859c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 2860289a08f5SMatthew Knepley if (ncols) { 2861289a08f5SMatthew Knepley /* Get first nonzero */ 2862289a08f5SMatthew Knepley for(j = 0; j < ncols; j++) { 2863289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 2864289a08f5SMatthew Knepley if (atmp > 1.0e-12) {x[i] = atmp; if (idx) idx[i] = aj[j]; break;} 2865289a08f5SMatthew Knepley } 2866289a08f5SMatthew Knepley if (j == ncols) {x[i] = *aa; if (idx) idx[i] = *aj;} 2867289a08f5SMatthew Knepley } else { 2868289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 2869289a08f5SMatthew Knepley } 2870c87e5d42SMatthew Knepley for(j = 0; j < ncols; j++) { 2871c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 2872289a08f5SMatthew Knepley if (atmp > 1.0e-12 && 
PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2873c87e5d42SMatthew Knepley aa++; aj++; 2874c87e5d42SMatthew Knepley } 2875c87e5d42SMatthew Knepley } 2876c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2877c87e5d42SMatthew Knepley PetscFunctionReturn(0); 2878c87e5d42SMatthew Knepley } 2879c87e5d42SMatthew Knepley 2880c87e5d42SMatthew Knepley #undef __FUNCT__ 2881985db425SBarry Smith #define __FUNCT__ "MatGetRowMin_SeqAIJ" 2882985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2883985db425SBarry Smith { 2884985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2885985db425SBarry Smith PetscErrorCode ierr; 2886d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2887985db425SBarry Smith PetscScalar *x; 2888985db425SBarry Smith MatScalar *aa; 2889985db425SBarry Smith 2890985db425SBarry Smith PetscFunctionBegin; 2891e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2892985db425SBarry Smith aa = a->a; 2893985db425SBarry Smith ai = a->i; 2894985db425SBarry Smith aj = a->j; 2895985db425SBarry Smith 2896985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2897985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2898985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2899e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2900985db425SBarry Smith for (i=0; i<m; i++) { 2901985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2902d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2903985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2904985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 2905985db425SBarry Smith x[i] = 0.0; 2906985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 2907985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 
2908985db425SBarry Smith for (j=0;j<ncols;j++) { 2909985db425SBarry Smith if (aj[j] > j) { 2910985db425SBarry Smith idx[i] = j; 2911985db425SBarry Smith break; 2912985db425SBarry Smith } 2913985db425SBarry Smith } 2914985db425SBarry Smith } 2915985db425SBarry Smith } 2916985db425SBarry Smith for (j=0; j<ncols; j++){ 2917985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2918985db425SBarry Smith aa++; aj++; 2919e34fafa9SBarry Smith } 2920e34fafa9SBarry Smith } 2921e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2922e34fafa9SBarry Smith PetscFunctionReturn(0); 2923e34fafa9SBarry Smith } 2924bbead8a2SBarry Smith 2925bbead8a2SBarry Smith #include <petscblaslapack.h> 2926bbead8a2SBarry Smith #include <../src/mat/blockinvert.h> 2927bbead8a2SBarry Smith 2928bbead8a2SBarry Smith #undef __FUNCT__ 2929bbead8a2SBarry Smith #define __FUNCT__ "MatInvertBlockDiagonal_SeqAIJ" 2930bbead8a2SBarry Smith PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,PetscScalar **values) 2931bbead8a2SBarry Smith { 2932bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 2933bbead8a2SBarry Smith PetscErrorCode ierr; 293434fc4b71SJed Brown PetscInt i,bs = A->rmap->bs,mbs = A->rmap->n/A->rmap->bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 2935bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 2936bbead8a2SBarry Smith PetscReal shift = 0.0; 2937bbead8a2SBarry Smith 2938bbead8a2SBarry Smith PetscFunctionBegin; 29394a0d0026SBarry Smith if (a->ibdiagvalid) { 29404a0d0026SBarry Smith if (values) *values = a->ibdiag; 29414a0d0026SBarry Smith PetscFunctionReturn(0); 29424a0d0026SBarry Smith } 2943bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 2944bbead8a2SBarry Smith if (!a->ibdiag) { 2945bbead8a2SBarry Smith ierr = PetscMalloc(bs2*mbs*sizeof(PetscScalar),&a->ibdiag);CHKERRQ(ierr); 2946bbead8a2SBarry Smith ierr = PetscLogObjectMemory(A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 2947bbead8a2SBarry Smith 
} 2948bbead8a2SBarry Smith diag = a->ibdiag; 2949bbead8a2SBarry Smith if (values) *values = a->ibdiag; 2950bbead8a2SBarry Smith /* factor and invert each block */ 2951bbead8a2SBarry Smith switch (bs){ 2952bbead8a2SBarry Smith case 1: 2953bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2954bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 2955bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 2956bbead8a2SBarry Smith } 2957bbead8a2SBarry Smith break; 2958bbead8a2SBarry Smith case 2: 2959bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2960bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 2961bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 2962bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_2(diag,shift);CHKERRQ(ierr); 2963bbead8a2SBarry Smith diag += 4; 2964bbead8a2SBarry Smith } 2965bbead8a2SBarry Smith break; 2966bbead8a2SBarry Smith case 3: 2967bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2968bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 2969bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 2970bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_3(diag,shift);CHKERRQ(ierr); 2971bbead8a2SBarry Smith diag += 9; 2972bbead8a2SBarry Smith } 2973bbead8a2SBarry Smith break; 2974bbead8a2SBarry Smith case 4: 2975bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2976bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 2977bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 2978bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_4(diag,shift);CHKERRQ(ierr); 2979bbead8a2SBarry Smith diag += 16; 2980bbead8a2SBarry Smith } 2981bbead8a2SBarry Smith break; 2982bbead8a2SBarry Smith case 5: 2983bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2984bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 2985bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 
2986bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_5(diag,ipvt,work,shift);CHKERRQ(ierr); 2987bbead8a2SBarry Smith diag += 25; 2988bbead8a2SBarry Smith } 2989bbead8a2SBarry Smith break; 2990bbead8a2SBarry Smith case 6: 2991bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2992bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 2993bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 2994bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_6(diag,shift);CHKERRQ(ierr); 2995bbead8a2SBarry Smith diag += 36; 2996bbead8a2SBarry Smith } 2997bbead8a2SBarry Smith break; 2998bbead8a2SBarry Smith case 7: 2999bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3000bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3001bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3002bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_7(diag,shift);CHKERRQ(ierr); 3003bbead8a2SBarry Smith diag += 49; 3004bbead8a2SBarry Smith } 3005bbead8a2SBarry Smith break; 3006bbead8a2SBarry Smith default: 3007bbead8a2SBarry Smith ierr = PetscMalloc3(bs,MatScalar,&v_work,bs,PetscInt,&v_pivots,bs,PetscInt,&IJ);CHKERRQ(ierr); 3008bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3009bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3010bbead8a2SBarry Smith IJ[j] = bs*i + j; 3011bbead8a2SBarry Smith } 3012bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 3013bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A(bs,diag,v_pivots,v_work);CHKERRQ(ierr); 3014bbead8a2SBarry Smith diag += bs2; 3015bbead8a2SBarry Smith } 3016bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3017bbead8a2SBarry Smith } 3018bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3019bbead8a2SBarry Smith PetscFunctionReturn(0); 3020bbead8a2SBarry Smith } 3021bbead8a2SBarry Smith 30227087cfbeSBarry Smith extern 
PetscErrorCode MatFDColoringApply_AIJ(Mat,MatFDColoring,Vec,MatStructure*,void*); 3023682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 30240a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3025cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3026cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3027cb5b572fSBarry Smith MatMult_SeqAIJ, 302897304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 30297c922b88SBarry Smith MatMultTranspose_SeqAIJ, 30307c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3031db4efbfdSBarry Smith 0, 3032db4efbfdSBarry Smith 0, 3033db4efbfdSBarry Smith 0, 3034db4efbfdSBarry Smith /*10*/ 0, 3035cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3036cb5b572fSBarry Smith 0, 303741f059aeSBarry Smith MatSOR_SeqAIJ, 303817ab2063SBarry Smith MatTranspose_SeqAIJ, 303997304618SKris Buschelman /*15*/ MatGetInfo_SeqAIJ, 3040cb5b572fSBarry Smith MatEqual_SeqAIJ, 3041cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3042cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3043cb5b572fSBarry Smith MatNorm_SeqAIJ, 304497304618SKris Buschelman /*20*/ 0, 3045cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3046cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3047cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3048d519adbfSMatthew Knepley /*24*/ MatZeroRows_SeqAIJ, 3049db4efbfdSBarry Smith 0, 3050db4efbfdSBarry Smith 0, 3051db4efbfdSBarry Smith 0, 3052db4efbfdSBarry Smith 0, 3053d519adbfSMatthew Knepley /*29*/ MatSetUpPreallocation_SeqAIJ, 3054db4efbfdSBarry Smith 0, 3055db4efbfdSBarry Smith 0, 30566c0721eeSBarry Smith MatGetArray_SeqAIJ, 30576c0721eeSBarry Smith MatRestoreArray_SeqAIJ, 3058d519adbfSMatthew Knepley /*34*/ MatDuplicate_SeqAIJ, 3059cb5b572fSBarry Smith 0, 3060cb5b572fSBarry Smith 0, 3061cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3062cb5b572fSBarry Smith 0, 3063d519adbfSMatthew Knepley /*39*/ MatAXPY_SeqAIJ, 3064cb5b572fSBarry Smith MatGetSubMatrices_SeqAIJ, 3065cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3066cb5b572fSBarry Smith 
MatGetValues_SeqAIJ, 3067cb5b572fSBarry Smith MatCopy_SeqAIJ, 3068d519adbfSMatthew Knepley /*44*/ MatGetRowMax_SeqAIJ, 3069cb5b572fSBarry Smith MatScale_SeqAIJ, 3070cb5b572fSBarry Smith 0, 307179299369SBarry Smith MatDiagonalSet_SeqAIJ, 30726e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 3073d519adbfSMatthew Knepley /*49*/ MatSetBlockSize_SeqAIJ, 30743b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 30753b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 30763b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3077a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 3078d519adbfSMatthew Knepley /*54*/ MatFDColoringCreate_SeqAIJ, 3079b9617806SBarry Smith 0, 30800513a670SBarry Smith 0, 3081cda55fadSBarry Smith MatPermute_SeqAIJ, 3082cda55fadSBarry Smith 0, 3083d519adbfSMatthew Knepley /*59*/ 0, 3084b9b97703SBarry Smith MatDestroy_SeqAIJ, 3085b9b97703SBarry Smith MatView_SeqAIJ, 3086357abbc8SBarry Smith 0, 3087ee4f033dSBarry Smith 0, 3088d519adbfSMatthew Knepley /*64*/ 0, 3089ee4f033dSBarry Smith 0, 3090ee4f033dSBarry Smith 0, 3091ee4f033dSBarry Smith 0, 3092ee4f033dSBarry Smith 0, 3093d519adbfSMatthew Knepley /*69*/ MatGetRowMaxAbs_SeqAIJ, 3094c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3095ee4f033dSBarry Smith 0, 3096ee4f033dSBarry Smith MatSetColoring_SeqAIJ, 3097dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 3098ee4f033dSBarry Smith MatSetValuesAdic_SeqAIJ, 3099dcf5cc72SBarry Smith #else 3100dcf5cc72SBarry Smith 0, 3101dcf5cc72SBarry Smith #endif 3102d519adbfSMatthew Knepley /*74*/ MatSetValuesAdifor_SeqAIJ, 31033acb8795SBarry Smith MatFDColoringApply_AIJ, 310497304618SKris Buschelman 0, 310597304618SKris Buschelman 0, 310697304618SKris Buschelman 0, 31076ce1633cSBarry Smith /*79*/ MatFindZeroDiagonals_SeqAIJ, 310897304618SKris Buschelman 0, 310997304618SKris Buschelman 0, 311097304618SKris Buschelman 0, 3111bc011b1eSHong Zhang MatLoad_SeqAIJ, 3112d519adbfSMatthew Knepley /*84*/ MatIsSymmetric_SeqAIJ, 31131cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 31146284ec50SHong Zhang 0, 
31156284ec50SHong Zhang 0, 3116bc011b1eSHong Zhang 0, 3117d519adbfSMatthew Knepley /*89*/ MatMatMult_SeqAIJ_SeqAIJ, 311826be0446SHong Zhang MatMatMultSymbolic_SeqAIJ_SeqAIJ, 311926be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3120d439da42SKris Buschelman MatPtAP_Basic, 31217ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ, 3122d519adbfSMatthew Knepley /*94*/ MatPtAPNumeric_SeqAIJ, 3123bc011b1eSHong Zhang MatMatMultTranspose_SeqAIJ_SeqAIJ, 3124bc011b1eSHong Zhang MatMatMultTransposeSymbolic_SeqAIJ_SeqAIJ, 3125bc011b1eSHong Zhang MatMatMultTransposeNumeric_SeqAIJ_SeqAIJ, 31267ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ_SeqAIJ, 3127d519adbfSMatthew Knepley /*99*/ MatPtAPNumeric_SeqAIJ_SeqAIJ, 3128609c6c4dSKris Buschelman 0, 3129609c6c4dSKris Buschelman 0, 313087d4246cSBarry Smith MatConjugate_SeqAIJ, 313187d4246cSBarry Smith 0, 3132d519adbfSMatthew Knepley /*104*/MatSetValuesRow_SeqAIJ, 313399cafbc1SBarry Smith MatRealPart_SeqAIJ, 3134f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3135f5edf698SHong Zhang 0, 31362bebee5dSHong Zhang 0, 3137cbd44569SHong Zhang /*109*/MatMatSolve_SeqAIJ, 3138985db425SBarry Smith 0, 31392af78befSBarry Smith MatGetRowMin_SeqAIJ, 31402af78befSBarry Smith 0, 3141599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3142d519adbfSMatthew Knepley /*114*/0, 3143599ef60dSHong Zhang 0, 31443c2a7987SHong Zhang 0, 3145fe97e370SBarry Smith 0, 3146fbdbba38SShri Abhyankar 0, 3147fbdbba38SShri Abhyankar /*119*/0, 3148fbdbba38SShri Abhyankar 0, 3149fbdbba38SShri Abhyankar 0, 315082d44351SHong Zhang 0, 3151b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 31520716a85fSBarry Smith /*124*/MatFindNonzeroRows_SeqAIJ, 3153bbead8a2SBarry Smith MatGetColumnNorms_SeqAIJ, 315437868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 315537868618SMatthew G Knepley 0, 315637868618SMatthew G Knepley 0, 315737868618SMatthew G Knepley /*129*/0 31589e29f15eSvictorle }; 315917ab2063SBarry Smith 3160fb2e594dSBarry Smith EXTERN_C_BEGIN 31614a2ae208SSatish Balay #undef 
__FUNCT__ 31624a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices_SeqAIJ" 31637087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3164bef8e0ddSBarry Smith { 3165bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 316697f1f81fSBarry Smith PetscInt i,nz,n; 3167bef8e0ddSBarry Smith 3168bef8e0ddSBarry Smith PetscFunctionBegin; 3169bef8e0ddSBarry Smith 3170bef8e0ddSBarry Smith nz = aij->maxnz; 3171d0f46423SBarry Smith n = mat->rmap->n; 3172bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3173bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3174bef8e0ddSBarry Smith } 3175bef8e0ddSBarry Smith aij->nz = nz; 3176bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3177bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3178bef8e0ddSBarry Smith } 3179bef8e0ddSBarry Smith 3180bef8e0ddSBarry Smith PetscFunctionReturn(0); 3181bef8e0ddSBarry Smith } 3182fb2e594dSBarry Smith EXTERN_C_END 3183bef8e0ddSBarry Smith 31844a2ae208SSatish Balay #undef __FUNCT__ 31854a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices" 3186bef8e0ddSBarry Smith /*@ 3187bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3188bef8e0ddSBarry Smith in the matrix. 3189bef8e0ddSBarry Smith 3190bef8e0ddSBarry Smith Input Parameters: 3191bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3192bef8e0ddSBarry Smith - indices - the column indices 3193bef8e0ddSBarry Smith 319415091d37SBarry Smith Level: advanced 319515091d37SBarry Smith 3196bef8e0ddSBarry Smith Notes: 3197bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3198bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3199bef8e0ddSBarry Smith of the MatSetValues() operation. 
3200bef8e0ddSBarry Smith 3201bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3202d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3203bef8e0ddSBarry Smith 3204bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3205bef8e0ddSBarry Smith 3206b9617806SBarry Smith The indices should start with zero, not one. 3207b9617806SBarry Smith 3208bef8e0ddSBarry Smith @*/ 32097087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3210bef8e0ddSBarry Smith { 32114ac538c5SBarry Smith PetscErrorCode ierr; 3212bef8e0ddSBarry Smith 3213bef8e0ddSBarry Smith PetscFunctionBegin; 32140700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 32154482741eSBarry Smith PetscValidPointer(indices,2); 32164ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt *),(mat,indices));CHKERRQ(ierr); 3217bef8e0ddSBarry Smith PetscFunctionReturn(0); 3218bef8e0ddSBarry Smith } 3219bef8e0ddSBarry Smith 3220be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3221be6bf707SBarry Smith 3222fb2e594dSBarry Smith EXTERN_C_BEGIN 32234a2ae208SSatish Balay #undef __FUNCT__ 32244a2ae208SSatish Balay #define __FUNCT__ "MatStoreValues_SeqAIJ" 32257087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3226be6bf707SBarry Smith { 3227be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 32286849ba73SBarry Smith PetscErrorCode ierr; 3229d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3230be6bf707SBarry Smith 3231be6bf707SBarry Smith PetscFunctionBegin; 3232be6bf707SBarry Smith if (aij->nonew != 1) { 3233e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3234be6bf707SBarry Smith } 3235be6bf707SBarry Smith 3236be6bf707SBarry Smith /* allocate space for values if not already 
there */ 3237be6bf707SBarry Smith if (!aij->saved_values) { 323887828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&aij->saved_values);CHKERRQ(ierr); 32399518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3240be6bf707SBarry Smith } 3241be6bf707SBarry Smith 3242be6bf707SBarry Smith /* copy values over */ 324387828ca2SBarry Smith ierr = PetscMemcpy(aij->saved_values,aij->a,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3244be6bf707SBarry Smith PetscFunctionReturn(0); 3245be6bf707SBarry Smith } 3246fb2e594dSBarry Smith EXTERN_C_END 3247be6bf707SBarry Smith 32484a2ae208SSatish Balay #undef __FUNCT__ 3249b9617806SBarry Smith #define __FUNCT__ "MatStoreValues" 3250be6bf707SBarry Smith /*@ 3251be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3252be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3253be6bf707SBarry Smith nonlinear portion. 3254be6bf707SBarry Smith 3255be6bf707SBarry Smith Collect on Mat 3256be6bf707SBarry Smith 3257be6bf707SBarry Smith Input Parameters: 32580e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3259be6bf707SBarry Smith 326015091d37SBarry Smith Level: advanced 326115091d37SBarry Smith 3262be6bf707SBarry Smith Common Usage, with SNESSolve(): 3263be6bf707SBarry Smith $ Create Jacobian matrix 3264be6bf707SBarry Smith $ Set linear terms into matrix 3265be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3266be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3267be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3268512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3269be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3270be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3271be6bf707SBarry Smith $ In your Jacobian routine 3272be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3273be6bf707SBarry Smith $ Set nonlinear terms in matrix 3274be6bf707SBarry Smith 3275be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3276be6bf707SBarry Smith $ // build linear portion of Jacobian 3277512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3278be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3279be6bf707SBarry Smith $ loop over nonlinear iterations 3280be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3281be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3282be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3283be6bf707SBarry Smith $ Solve linear system with Jacobian 3284be6bf707SBarry Smith $ endloop 3285be6bf707SBarry Smith 3286be6bf707SBarry Smith Notes: 3287be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3288512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3289be6bf707SBarry Smith calling this routine. 3290be6bf707SBarry Smith 32910c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 32920c468ba9SBarry Smith and does not allocated additional space. 
32930c468ba9SBarry Smith 3294be6bf707SBarry Smith .seealso: MatRetrieveValues() 3295be6bf707SBarry Smith 3296be6bf707SBarry Smith @*/ 32977087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3298be6bf707SBarry Smith { 32994ac538c5SBarry Smith PetscErrorCode ierr; 3300be6bf707SBarry Smith 3301be6bf707SBarry Smith PetscFunctionBegin; 33020700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3303e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3304e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 33054ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3306be6bf707SBarry Smith PetscFunctionReturn(0); 3307be6bf707SBarry Smith } 3308be6bf707SBarry Smith 3309fb2e594dSBarry Smith EXTERN_C_BEGIN 33104a2ae208SSatish Balay #undef __FUNCT__ 33114a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues_SeqAIJ" 33127087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3313be6bf707SBarry Smith { 3314be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 33156849ba73SBarry Smith PetscErrorCode ierr; 3316d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3317be6bf707SBarry Smith 3318be6bf707SBarry Smith PetscFunctionBegin; 3319be6bf707SBarry Smith if (aij->nonew != 1) { 3320e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3321be6bf707SBarry Smith } 3322be6bf707SBarry Smith if (!aij->saved_values) { 3323e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3324be6bf707SBarry Smith } 3325be6bf707SBarry Smith /* copy values over */ 332687828ca2SBarry Smith ierr = PetscMemcpy(aij->a,aij->saved_values,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3327be6bf707SBarry Smith PetscFunctionReturn(0); 3328be6bf707SBarry Smith } 
3329fb2e594dSBarry Smith EXTERN_C_END 3330be6bf707SBarry Smith 33314a2ae208SSatish Balay #undef __FUNCT__ 33324a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues" 3333be6bf707SBarry Smith /*@ 3334be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3335be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3336be6bf707SBarry Smith nonlinear portion. 3337be6bf707SBarry Smith 3338be6bf707SBarry Smith Collect on Mat 3339be6bf707SBarry Smith 3340be6bf707SBarry Smith Input Parameters: 3341be6bf707SBarry Smith . mat - the matrix (currently on AIJ matrices support this option) 3342be6bf707SBarry Smith 334315091d37SBarry Smith Level: advanced 334415091d37SBarry Smith 3345be6bf707SBarry Smith .seealso: MatStoreValues() 3346be6bf707SBarry Smith 3347be6bf707SBarry Smith @*/ 33487087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3349be6bf707SBarry Smith { 33504ac538c5SBarry Smith PetscErrorCode ierr; 3351be6bf707SBarry Smith 3352be6bf707SBarry Smith PetscFunctionBegin; 33530700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3354e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3355e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 33564ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3357be6bf707SBarry Smith PetscFunctionReturn(0); 3358be6bf707SBarry Smith } 3359be6bf707SBarry Smith 3360f83d6046SBarry Smith 3361be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 33624a2ae208SSatish Balay #undef __FUNCT__ 33634a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJ" 336417ab2063SBarry Smith /*@C 3365682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 33660d15e28bSLois Curfman McInnes 
(the default parallel PETSc format). For good matrix assembly performance 33676e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 336851c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 33692bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 337017ab2063SBarry Smith 3371db81eaa0SLois Curfman McInnes Collective on MPI_Comm 3372db81eaa0SLois Curfman McInnes 337317ab2063SBarry Smith Input Parameters: 3374db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 337517ab2063SBarry Smith . m - number of rows 337617ab2063SBarry Smith . n - number of columns 337717ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 337851c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 33792bd5e0b2SLois Curfman McInnes (possibly different for each row) or PETSC_NULL 338017ab2063SBarry Smith 338117ab2063SBarry Smith Output Parameter: 3382416022c9SBarry Smith . A - the matrix 338317ab2063SBarry Smith 3384175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3385ae1d86c5SBarry Smith MatXXXXSetPreallocation() paradgm instead of this routine directly. 3386175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3387175b88e8SBarry Smith 3388b259b22eSLois Curfman McInnes Notes: 338949a6f317SBarry Smith If nnz is given then nz is ignored 339049a6f317SBarry Smith 339117ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 339217ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 33930002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 339444cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 
339517ab2063SBarry Smith 339617ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3397a40aa06bSLois Curfman McInnes Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 33983d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 33996da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 340017ab2063SBarry Smith 3401682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 34024fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3403682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 34046c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 34056c7ebb05SLois Curfman McInnes 34066c7ebb05SLois Curfman McInnes Options Database Keys: 3407698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 34089db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 340917ab2063SBarry Smith 3410027ccd11SLois Curfman McInnes Level: intermediate 3411027ccd11SLois Curfman McInnes 341236db0b34SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 341336db0b34SBarry Smith 341417ab2063SBarry Smith @*/ 34157087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 341617ab2063SBarry Smith { 3417dfbe8321SBarry Smith PetscErrorCode ierr; 34186945ee14SBarry Smith 34193a40ed3dSBarry Smith PetscFunctionBegin; 3420f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3421117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3422c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3423d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3424273d9f13SBarry Smith 
PetscFunctionReturn(0); 3425273d9f13SBarry Smith } 3426273d9f13SBarry Smith 34274a2ae208SSatish Balay #undef __FUNCT__ 34284a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetPreallocation" 3429273d9f13SBarry Smith /*@C 3430273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3431273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3432273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3433273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3434273d9f13SBarry Smith 3435273d9f13SBarry Smith Collective on MPI_Comm 3436273d9f13SBarry Smith 3437273d9f13SBarry Smith Input Parameters: 3438117016b1SBarry Smith + B - The matrix-free 3439273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3440273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 3441273d9f13SBarry Smith (possibly different for each row) or PETSC_NULL 3442273d9f13SBarry Smith 3443273d9f13SBarry Smith Notes: 344449a6f317SBarry Smith If nnz is given then nz is ignored 344549a6f317SBarry Smith 3446273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3447273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3448273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3449273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3450273d9f13SBarry Smith 3451273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3452273d9f13SBarry Smith Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 3453273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3454273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 
3455273d9f13SBarry Smith 3456aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3457aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3458aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3459aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3460aa95bbe8SBarry Smith 3461a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3462a96a251dSBarry Smith entries or columns indices 3463a96a251dSBarry Smith 3464273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3465273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3466273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3467273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3468273d9f13SBarry Smith 3469273d9f13SBarry Smith Options Database Keys: 3470698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 3471698d4c6aSKris Buschelman . -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3472273d9f13SBarry Smith - -mat_aij_oneindex - Internally use indexing starting at 1 3473273d9f13SBarry Smith rather than 0. Note that when calling MatSetValues(), 3474273d9f13SBarry Smith the user still MUST index entries starting at 0! 
3475273d9f13SBarry Smith 3476273d9f13SBarry Smith Level: intermediate 3477273d9f13SBarry Smith 3478aa95bbe8SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3479273d9f13SBarry Smith 3480273d9f13SBarry Smith @*/ 34817087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3482273d9f13SBarry Smith { 34834ac538c5SBarry Smith PetscErrorCode ierr; 3484a23d5eceSKris Buschelman 3485a23d5eceSKris Buschelman PetscFunctionBegin; 34864ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3487a23d5eceSKris Buschelman PetscFunctionReturn(0); 3488a23d5eceSKris Buschelman } 3489a23d5eceSKris Buschelman 3490a23d5eceSKris Buschelman EXTERN_C_BEGIN 3491a23d5eceSKris Buschelman #undef __FUNCT__ 3492a23d5eceSKris Buschelman #define __FUNCT__ "MatSeqAIJSetPreallocation_SeqAIJ" 34937087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3494a23d5eceSKris Buschelman { 3495273d9f13SBarry Smith Mat_SeqAIJ *b; 3496ace3abfcSBarry Smith PetscBool skipallocation = PETSC_FALSE; 34976849ba73SBarry Smith PetscErrorCode ierr; 349897f1f81fSBarry Smith PetscInt i; 3499273d9f13SBarry Smith 3500273d9f13SBarry Smith PetscFunctionBegin; 3501d5d45c9bSBarry Smith 3502a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3503c461c341SBarry Smith skipallocation = PETSC_TRUE; 3504c461c341SBarry Smith nz = 0; 3505c461c341SBarry Smith } 3506c461c341SBarry Smith 350726283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->rmap,1);CHKERRQ(ierr); 350826283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->cmap,1);CHKERRQ(ierr); 350926283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 351026283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3511899cda47SBarry Smith 3512435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == 
PETSC_DECIDE) nz = 5; 3513e32f2f54SBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %d",nz); 3514b73539f3SBarry Smith if (nnz) { 3515d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 3516e32f2f54SBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %d value %d",i,nnz[i]); 3517e32f2f54SBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %d value %d rowlength %d",i,nnz[i],B->cmap->n); 3518b73539f3SBarry Smith } 3519b73539f3SBarry Smith } 3520b73539f3SBarry Smith 3521273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3522273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3523273d9f13SBarry Smith 3524ab93d7beSBarry Smith if (!skipallocation) { 35252ee49352SLisandro Dalcin if (!b->imax) { 3526d0f46423SBarry Smith ierr = PetscMalloc2(B->rmap->n,PetscInt,&b->imax,B->rmap->n,PetscInt,&b->ilen);CHKERRQ(ierr); 3527d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,2*B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 35282ee49352SLisandro Dalcin } 3529273d9f13SBarry Smith if (!nnz) { 3530435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3531c62bd62aSJed Brown else if (nz < 0) nz = 1; 3532d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3533d0f46423SBarry Smith nz = nz*B->rmap->n; 3534273d9f13SBarry Smith } else { 3535273d9f13SBarry Smith nz = 0; 3536d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz += nnz[i];} 3537273d9f13SBarry Smith } 3538ab93d7beSBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 3539d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { b->ilen[i] = 0; } 3540ab93d7beSBarry Smith 3541273d9f13SBarry Smith /* allocate the matrix space */ 35422ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3543d0f46423SBarry Smith ierr = PetscMalloc3(nz,PetscScalar,&b->a,nz,PetscInt,&b->j,B->rmap->n+1,PetscInt,&b->i);CHKERRQ(ierr); 3544d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3545bfeeae90SHong Zhang b->i[0] = 0; 3546d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 35475da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 35485da197adSKris Buschelman } 3549273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3550e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3551e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3552c461c341SBarry Smith } else { 3553e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3554e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3555c461c341SBarry Smith } 3556273d9f13SBarry Smith 3557273d9f13SBarry Smith b->nz = 0; 3558273d9f13SBarry Smith b->maxnz = nz; 3559273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 3560273d9f13SBarry Smith PetscFunctionReturn(0); 3561273d9f13SBarry Smith } 3562a23d5eceSKris Buschelman EXTERN_C_END 3563273d9f13SBarry Smith 3564a1661176SMatthew Knepley #undef __FUNCT__ 3565a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR" 356658d36128SBarry Smith /*@ 3567a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 3568a1661176SMatthew Knepley 3569a1661176SMatthew Knepley Input Parameters: 3570a1661176SMatthew Knepley + B - the matrix 3571a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 3572a1661176SMatthew Knepley . 
j - the column indices for each row (starts with zero) these must be sorted for each row 3573a1661176SMatthew Knepley - v - optional values in the matrix 3574a1661176SMatthew Knepley 3575a1661176SMatthew Knepley Level: developer 3576a1661176SMatthew Knepley 357758d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 357858d36128SBarry Smith 3579a1661176SMatthew Knepley .keywords: matrix, aij, compressed row, sparse, sequential 3580a1661176SMatthew Knepley 3581a1661176SMatthew Knepley .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), SeqAIJ 3582a1661176SMatthew Knepley @*/ 3583a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 3584a1661176SMatthew Knepley { 3585a1661176SMatthew Knepley PetscErrorCode ierr; 3586a1661176SMatthew Knepley 3587a1661176SMatthew Knepley PetscFunctionBegin; 35880700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 35894ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 3590a1661176SMatthew Knepley PetscFunctionReturn(0); 3591a1661176SMatthew Knepley } 3592a1661176SMatthew Knepley 3593a1661176SMatthew Knepley EXTERN_C_BEGIN 3594a1661176SMatthew Knepley #undef __FUNCT__ 3595a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR_SeqAIJ" 35967087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 3597a1661176SMatthew Knepley { 3598a1661176SMatthew Knepley PetscInt i; 3599a1661176SMatthew Knepley PetscInt m,n; 3600a1661176SMatthew Knepley PetscInt nz; 3601a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 3602a1661176SMatthew Knepley PetscScalar *values; 3603a1661176SMatthew Knepley PetscErrorCode ierr; 3604a1661176SMatthew 
Knepley 3605a1661176SMatthew Knepley PetscFunctionBegin; 3606a1661176SMatthew Knepley ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 3607a1661176SMatthew Knepley 360865e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 3609a1661176SMatthew Knepley ierr = PetscMalloc((m+1) * sizeof(PetscInt), &nnz);CHKERRQ(ierr); 3610a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3611b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 3612a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 361365e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 3614a1661176SMatthew Knepley nnz[i] = nz; 3615a1661176SMatthew Knepley } 3616a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 3617a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 3618a1661176SMatthew Knepley 3619a1661176SMatthew Knepley if (v) { 3620a1661176SMatthew Knepley values = (PetscScalar*) v; 3621a1661176SMatthew Knepley } else { 36220e83c824SBarry Smith ierr = PetscMalloc(nz_max*sizeof(PetscScalar), &values);CHKERRQ(ierr); 3623a1661176SMatthew Knepley ierr = PetscMemzero(values, nz_max*sizeof(PetscScalar));CHKERRQ(ierr); 3624a1661176SMatthew Knepley } 3625a1661176SMatthew Knepley 3626a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3627b7940d39SSatish Balay nz = Ii[i+1] - Ii[i]; 3628b7940d39SSatish Balay ierr = MatSetValues_SeqAIJ(B, 1, &i, nz, J+Ii[i], values + (v ? 
Ii[i] : 0), INSERT_VALUES);CHKERRQ(ierr); 3629a1661176SMatthew Knepley } 3630a1661176SMatthew Knepley 3631a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3632a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3633a1661176SMatthew Knepley 3634a1661176SMatthew Knepley if (!v) { 3635a1661176SMatthew Knepley ierr = PetscFree(values);CHKERRQ(ierr); 3636a1661176SMatthew Knepley } 3637a1661176SMatthew Knepley PetscFunctionReturn(0); 3638a1661176SMatthew Knepley } 3639a1661176SMatthew Knepley EXTERN_C_END 3640a1661176SMatthew Knepley 3641c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 3642c6db04a5SJed Brown #include <private/petscaxpy.h> 3643170fe5c8SBarry Smith 3644170fe5c8SBarry Smith #undef __FUNCT__ 3645170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultNumeric_SeqDense_SeqAIJ" 3646170fe5c8SBarry Smith /* 3647170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 3648170fe5c8SBarry Smith 3649170fe5c8SBarry Smith n p p 3650170fe5c8SBarry Smith ( ) ( ) ( ) 3651170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 3652170fe5c8SBarry Smith ( ) ( ) ( ) 3653170fe5c8SBarry Smith 3654170fe5c8SBarry Smith */ 3655170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 3656170fe5c8SBarry Smith { 3657170fe5c8SBarry Smith PetscErrorCode ierr; 3658170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 3659170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 3660170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 36611de00fd4SBarry Smith PetscInt i,n,m,q,p; 3662170fe5c8SBarry Smith const PetscInt *ii,*idx; 3663170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 3664170fe5c8SBarry Smith PetscScalar *c,*c_q; 3665170fe5c8SBarry Smith 3666170fe5c8SBarry Smith PetscFunctionBegin; 3667d0f46423SBarry Smith m = A->rmap->n; 3668d0f46423SBarry Smith n = A->cmap->n; 3669d0f46423SBarry Smith p = B->cmap->n; 
3670170fe5c8SBarry Smith a = sub_a->v; 3671170fe5c8SBarry Smith b = sub_b->a; 3672170fe5c8SBarry Smith c = sub_c->v; 3673170fe5c8SBarry Smith ierr = PetscMemzero(c,m*p*sizeof(PetscScalar));CHKERRQ(ierr); 3674170fe5c8SBarry Smith 3675170fe5c8SBarry Smith ii = sub_b->i; 3676170fe5c8SBarry Smith idx = sub_b->j; 3677170fe5c8SBarry Smith for (i=0; i<n; i++) { 3678170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 3679170fe5c8SBarry Smith while (q-->0) { 3680170fe5c8SBarry Smith c_q = c + m*(*idx); 3681170fe5c8SBarry Smith a_q = a + m*i; 3682be7314b0SBarry Smith PetscAXPY(c_q,*b,a_q,m); 3683170fe5c8SBarry Smith idx++; 3684170fe5c8SBarry Smith b++; 3685170fe5c8SBarry Smith } 3686170fe5c8SBarry Smith } 3687170fe5c8SBarry Smith PetscFunctionReturn(0); 3688170fe5c8SBarry Smith } 3689170fe5c8SBarry Smith 3690170fe5c8SBarry Smith #undef __FUNCT__ 3691170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultSymbolic_SeqDense_SeqAIJ" 3692170fe5c8SBarry Smith PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat *C) 3693170fe5c8SBarry Smith { 3694170fe5c8SBarry Smith PetscErrorCode ierr; 3695d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 3696170fe5c8SBarry Smith Mat Cmat; 3697170fe5c8SBarry Smith 3698170fe5c8SBarry Smith PetscFunctionBegin; 3699e32f2f54SBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %d != B->rmap->n %d\n",A->cmap->n,B->rmap->n); 370039804f7cSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,&Cmat);CHKERRQ(ierr); 3701170fe5c8SBarry Smith ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 3702170fe5c8SBarry Smith ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 3703170fe5c8SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 3704170fe5c8SBarry Smith Cmat->assembled = PETSC_TRUE; 3705170fe5c8SBarry Smith *C = Cmat; 3706170fe5c8SBarry Smith PetscFunctionReturn(0); 3707170fe5c8SBarry Smith } 3708170fe5c8SBarry Smith 3709170fe5c8SBarry Smith /* 
----------------------------------------------------------------*/
#undef __FUNCT__
#define __FUNCT__ "MatMatMult_SeqDense_SeqAIJ"
/*
   MatMatMult_SeqDense_SeqAIJ - product of a SeqDense matrix A with a SeqAIJ matrix B.

   When scall is MAT_INITIAL_MATRIX the result matrix is first created by
   MatMatMultSymbolic_SeqDense_SeqAIJ(); the numeric product is then always computed into *C.
   For any other scall value *C is used as passed in, so it must already be a valid matrix.
*/
PetscErrorCode MatMatMult_SeqDense_SeqAIJ(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (scall == MAT_INITIAL_MATRIX){
    ierr = MatMatMultSymbolic_SeqDense_SeqAIJ(A,B,fill,C);CHKERRQ(ierr);
  }
  ierr = MatMatMultNumeric_SeqDense_SeqAIJ(A,B,*C);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}


/*MC
   MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
   based on compressed sparse row format.

   Options Database Keys:
. -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()

  Level: beginner

.seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType
M*/

/* Factorization and conversion routines defined in other files; most are only declared when the
   corresponding external package was configured (PETSC_HAVE_xxx). */
EXTERN_C_BEGIN
#if defined(PETSC_HAVE_PASTIX)
extern PetscErrorCode MatGetFactor_seqaij_pastix(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128)
extern PetscErrorCode MatGetFactor_seqaij_essl(Mat,MatFactorType,Mat *);
#endif
extern PetscErrorCode  MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*);
extern PetscErrorCode  MatGetFactor_seqaij_petsc(Mat,MatFactorType,Mat*);
extern PetscErrorCode  MatGetFactor_seqaij_bas(Mat,MatFactorType,Mat*);
extern PetscErrorCode  MatGetFactorAvailable_seqaij_petsc(Mat,MatFactorType,PetscBool  *);
#if defined(PETSC_HAVE_MUMPS)
extern PetscErrorCode  MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_SUPERLU)
extern PetscErrorCode  MatGetFactor_seqaij_superlu(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_SUPERLU_DIST)
extern PetscErrorCode MatGetFactor_seqaij_superlu_dist(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_SPOOLES)
extern PetscErrorCode  MatGetFactor_seqaij_spooles(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_UMFPACK)
extern PetscErrorCode  MatGetFactor_seqaij_umfpack(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_CHOLMOD)
extern PetscErrorCode  MatGetFactor_seqaij_cholmod(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_LUSOL)
extern PetscErrorCode  MatGetFactor_seqaij_lusol(Mat,MatFactorType,Mat*);
#endif
#if defined(PETSC_HAVE_MATLAB_ENGINE)
extern PetscErrorCode  MatGetFactor_seqaij_matlab(Mat,MatFactorType,Mat*);
extern PetscErrorCode  MatlabEnginePut_SeqAIJ(PetscObject,void*);
extern PetscErrorCode  MatlabEngineGet_SeqAIJ(PetscObject,void*);
#endif
EXTERN_C_END

EXTERN_C_BEGIN
#undef __FUNCT__
#define __FUNCT__ "MatCreate_SeqAIJ"
/*
   MatCreate_SeqAIJ - constructor for the MATSEQAIJ type.

   Fails with PETSC_ERR_ARG_OUTOFRANGE unless the communicator of B has size 1.  Otherwise it
   allocates the Mat_SeqAIJ data structure, installs the MatOps_Values operation table, sets the
   default field values below, composes the type-specific functions on B by name, and finishes by
   calling MatCreate_SeqAIJ_Inode().
*/
PetscErrorCode  MatCreate_SeqAIJ(Mat B)
{
  Mat_SeqAIJ     *b;
  PetscErrorCode ierr;
  PetscMPIInt    size;

  PetscFunctionBegin;
  ierr = MPI_Comm_size(((PetscObject)B)->comm,&size);CHKERRQ(ierr);
  if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1");

  ierr = PetscNewLog(B,Mat_SeqAIJ,&b);CHKERRQ(ierr);
  B->data             = (void*)b;
  ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr);
  /* defaults: no cached work data, row-oriented input, new nonzeros allowed (nonew = 0) */
  b->row              = 0;
  b->col              = 0;
  b->icol             = 0;
  b->reallocs         = 0;
  b->ignorezeroentries = PETSC_FALSE;
  b->roworiented       = PETSC_TRUE;
  b->nonew             = 0;
  b->diag              = 0;
  b->solve_work        = 0;
  B->spptr             = 0;
  b->saved_values      = 0;
  b->idiag             = 0;
  b->mdiag             = 0;
  b->ssor_work         = 0;
  b->omega             = 1.0;
  b->fshift            = 0.0;
  b->idiagvalid        = PETSC_FALSE;
  b->ibdiagvalid       = PETSC_FALSE;
  b->keepnonzeropattern    = PETSC_FALSE;
  b->xtoy              = 0;
  b->XtoY              = 0;
  B->same_nonzero          = PETSC_FALSE;

  ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr);
  /* factorization back ends that exist only when the external package was configured */
#if defined(PETSC_HAVE_MATLAB_ENGINE)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_matlab_C","MatGetFactor_seqaij_matlab",MatGetFactor_seqaij_matlab);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEnginePut_C","MatlabEnginePut_SeqAIJ",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEngineGet_C","MatlabEngineGet_SeqAIJ",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_PASTIX)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_pastix_C","MatGetFactor_seqaij_pastix",MatGetFactor_seqaij_pastix);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_essl_C","MatGetFactor_seqaij_essl",MatGetFactor_seqaij_essl);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_SUPERLU)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_C","MatGetFactor_seqaij_superlu",MatGetFactor_seqaij_superlu);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_SUPERLU_DIST)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_dist_C","MatGetFactor_seqaij_superlu_dist",MatGetFactor_seqaij_superlu_dist);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_SPOOLES)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_spooles_C","MatGetFactor_seqaij_spooles",MatGetFactor_seqaij_spooles);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_MUMPS)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_mumps_C","MatGetFactor_aij_mumps",MatGetFactor_aij_mumps);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_UMFPACK)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_umfpack_C","MatGetFactor_seqaij_umfpack",MatGetFactor_seqaij_umfpack);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_CHOLMOD)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_cholmod_C","MatGetFactor_seqaij_cholmod",MatGetFactor_seqaij_cholmod);CHKERRQ(ierr);
#endif
#if defined(PETSC_HAVE_LUSOL)
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_lusol_C","MatGetFactor_seqaij_lusol",MatGetFactor_seqaij_lusol);CHKERRQ(ierr);
#endif
  /* functions that are always composed on a SeqAIJ matrix */
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_petsc_C","MatGetFactor_seqaij_petsc",MatGetFactor_seqaij_petsc);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactorAvailable_petsc_C","MatGetFactorAvailable_seqaij_petsc",MatGetFactorAvailable_seqaij_petsc);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_bas_C","MatGetFactor_seqaij_bas",MatGetFactor_seqaij_bas);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetColumnIndices_C","MatSeqAIJSetColumnIndices_SeqAIJ",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatStoreValues_C","MatStoreValues_SeqAIJ",MatStoreValues_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatRetrieveValues_C","MatRetrieveValues_SeqAIJ",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqsbaij_C","MatConvert_SeqAIJ_SeqSBAIJ",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqbaij_C","MatConvert_SeqAIJ_SeqBAIJ",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijperm_C","MatConvert_SeqAIJ_SeqAIJPERM",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C","MatConvert_SeqAIJ_SeqAIJCRL",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsTranspose_C","MatIsTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr);
  /* NOTE(review): the name string says MatIsHermitianTranspose_SeqAIJ but the function pointer
     passed is MatIsTranspose_SeqAIJ -- confirm whether that is intended for complex scalars */
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsHermitianTranspose_C","MatIsHermitianTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocation_C","MatSeqAIJSetPreallocation_SeqAIJ",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C","MatSeqAIJSetPreallocationCSR_SeqAIJ",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatReorderForNonzeroDiagonal_C","MatReorderForNonzeroDiagonal_SeqAIJ",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMult_seqdense_seqaij_C","MatMatMult_SeqDense_SeqAIJ",MatMatMult_SeqDense_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C","MatMatMultSymbolic_SeqDense_SeqAIJ",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr);
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C","MatMatMultNumeric_SeqDense_SeqAIJ",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr);
  ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr);
  /* NOTE(review): the type name was already set to MATSEQAIJ above; presumably this second call
     is redundant unless MatCreate_SeqAIJ_Inode() changes the name -- confirm */
  ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
EXTERN_C_END
387117ab2063SBarry Smith 3872ff34cdc8SBarry Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 387351d315f7SKerry Stevens EXTERN_C_BEGIN 387451d315f7SKerry Stevens #undef __FUNCT__ 38757d6a0e61SBarry Smith #define __FUNCT__ "MatCreate_SeqAIJPThread" 38767d6a0e61SBarry Smith PetscErrorCode MatCreate_SeqAIJPThread(Mat B) 387751d315f7SKerry Stevens { 387851d315f7SKerry Stevens PetscErrorCode ierr; 387951d315f7SKerry Stevens 388051d315f7SKerry Stevens PetscFunctionBegin; 388151d315f7SKerry Stevens ierr = MatCreate_SeqAIJ(B); 388251d315f7SKerry Stevens ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 38837d6a0e61SBarry Smith B->ops->mult = MatMult_SeqAIJPThread; 38847d6a0e61SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJPTHREAD);CHKERRQ(ierr); 388551d315f7SKerry Stevens PetscFunctionReturn(0); 388651d315f7SKerry Stevens } 388751d315f7SKerry Stevens EXTERN_C_END 3888ba61063dSBarry Smith #endif 388951d315f7SKerry Stevens 38904a2ae208SSatish Balay #undef __FUNCT__ 3891b24902e0SBarry Smith #define __FUNCT__ "MatDuplicateNoCreate_SeqAIJ" 3892b24902e0SBarry Smith /* 3893b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 3894b24902e0SBarry Smith */ 3895ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 389617ab2063SBarry Smith { 3897416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 38986849ba73SBarry Smith PetscErrorCode ierr; 3899d0f46423SBarry Smith PetscInt i,m = A->rmap->n; 390017ab2063SBarry Smith 39013a40ed3dSBarry Smith PetscFunctionBegin; 3902273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 3903273d9f13SBarry Smith 3904d5f3da31SBarry Smith C->factortype = A->factortype; 3905416022c9SBarry Smith c->row = 0; 3906416022c9SBarry Smith c->col = 0; 390782bf6240SBarry Smith c->icol = 0; 39086ad4291fSHong Zhang c->reallocs = 0; 390917ab2063SBarry Smith 39106ad4291fSHong Zhang 
C->assembled = PETSC_TRUE; 391117ab2063SBarry Smith 3912aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 3913aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 3914eec197d1SBarry Smith 391533b91e9fSSatish Balay ierr = PetscMalloc2(m,PetscInt,&c->imax,m,PetscInt,&c->ilen);CHKERRQ(ierr); 39169518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 391717ab2063SBarry Smith for (i=0; i<m; i++) { 3918416022c9SBarry Smith c->imax[i] = a->imax[i]; 3919416022c9SBarry Smith c->ilen[i] = a->ilen[i]; 392017ab2063SBarry Smith } 392117ab2063SBarry Smith 392217ab2063SBarry Smith /* allocate the matrix space */ 3923f77e22a1SHong Zhang if (mallocmatspace){ 3924a96a251dSBarry Smith ierr = PetscMalloc3(a->i[m],PetscScalar,&c->a,a->i[m],PetscInt,&c->j,m+1,PetscInt,&c->i);CHKERRQ(ierr); 39259518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 3926f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 392797f1f81fSBarry Smith ierr = PetscMemcpy(c->i,a->i,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 392817ab2063SBarry Smith if (m > 0) { 392997f1f81fSBarry Smith ierr = PetscMemcpy(c->j,a->j,(a->i[m])*sizeof(PetscInt));CHKERRQ(ierr); 3930be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 3931bfeeae90SHong Zhang ierr = PetscMemcpy(c->a,a->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 3932be6bf707SBarry Smith } else { 3933bfeeae90SHong Zhang ierr = PetscMemzero(c->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 393417ab2063SBarry Smith } 393508480c60SBarry Smith } 3936f77e22a1SHong Zhang } 393717ab2063SBarry Smith 39386ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 3939416022c9SBarry Smith c->roworiented = a->roworiented; 3940416022c9SBarry Smith c->nonew = a->nonew; 3941416022c9SBarry Smith if (a->diag) { 394297f1f81fSBarry Smith ierr = 
PetscMalloc((m+1)*sizeof(PetscInt),&c->diag);CHKERRQ(ierr); 394352e6d16bSBarry Smith ierr = PetscLogObjectMemory(C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 394417ab2063SBarry Smith for (i=0; i<m; i++) { 3945416022c9SBarry Smith c->diag[i] = a->diag[i]; 394617ab2063SBarry Smith } 39473a40ed3dSBarry Smith } else c->diag = 0; 39486ad4291fSHong Zhang c->solve_work = 0; 39496ad4291fSHong Zhang c->saved_values = 0; 39506ad4291fSHong Zhang c->idiag = 0; 395171f1c65dSBarry Smith c->ssor_work = 0; 3952a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 3953e6b907acSBarry Smith c->free_a = PETSC_TRUE; 3954e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 39556ad4291fSHong Zhang c->xtoy = 0; 39566ad4291fSHong Zhang c->XtoY = 0; 39576ad4291fSHong Zhang 3958416022c9SBarry Smith c->nz = a->nz; 39598ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 3960273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 3961754ec7b1SSatish Balay 39626ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 39636ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 3964cd6b891eSBarry Smith c->compressedrow.check = a->compressedrow.check; 3965cd6b891eSBarry Smith if (a->compressedrow.use){ 39666ad4291fSHong Zhang i = a->compressedrow.nrows; 39670e83c824SBarry Smith ierr = PetscMalloc2(i+1,PetscInt,&c->compressedrow.i,i,PetscInt,&c->compressedrow.rindex);CHKERRQ(ierr); 39686ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.i,a->compressedrow.i,(i+1)*sizeof(PetscInt));CHKERRQ(ierr); 39696ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.rindex,a->compressedrow.rindex,i*sizeof(PetscInt));CHKERRQ(ierr); 397027ea64f8SHong Zhang } else { 397127ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 397227ea64f8SHong Zhang c->compressedrow.i = PETSC_NULL; 397327ea64f8SHong Zhang c->compressedrow.rindex = PETSC_NULL; 39746ad4291fSHong Zhang } 397588e51ccdSHong Zhang C->same_nonzero = A->same_nonzero; 39764108e4d5SBarry Smith 
ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 39774846f1f5SKris Buschelman 39787adad957SLisandro Dalcin ierr = PetscFListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 39793a40ed3dSBarry Smith PetscFunctionReturn(0); 398017ab2063SBarry Smith } 398117ab2063SBarry Smith 39824a2ae208SSatish Balay #undef __FUNCT__ 3983b24902e0SBarry Smith #define __FUNCT__ "MatDuplicate_SeqAIJ" 3984b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 3985b24902e0SBarry Smith { 3986b24902e0SBarry Smith PetscErrorCode ierr; 3987b24902e0SBarry Smith 3988b24902e0SBarry Smith PetscFunctionBegin; 3989b24902e0SBarry Smith ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 39904b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 3991b24902e0SBarry Smith ierr = MatSetType(*B,MATSEQAIJ);CHKERRQ(ierr); 3992f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 3993b24902e0SBarry Smith PetscFunctionReturn(0); 3994b24902e0SBarry Smith } 3995b24902e0SBarry Smith 3996b24902e0SBarry Smith #undef __FUNCT__ 39974a2ae208SSatish Balay #define __FUNCT__ "MatLoad_SeqAIJ" 3998112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 3999fbdbba38SShri Abhyankar { 4000fbdbba38SShri Abhyankar Mat_SeqAIJ *a; 4001fbdbba38SShri Abhyankar PetscErrorCode ierr; 4002fbdbba38SShri Abhyankar PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N,rows,cols; 4003fbdbba38SShri Abhyankar int fd; 4004fbdbba38SShri Abhyankar PetscMPIInt size; 4005fbdbba38SShri Abhyankar MPI_Comm comm; 4006bbead8a2SBarry Smith PetscInt bs = 1; 4007fbdbba38SShri Abhyankar 4008fbdbba38SShri Abhyankar PetscFunctionBegin; 4009fbdbba38SShri Abhyankar ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 4010fbdbba38SShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 4011fbdbba38SShri Abhyankar if (size > 1) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"view must have one processor"); 4012bbead8a2SBarry Smith 4013bbead8a2SBarry Smith ierr = PetscOptionsBegin(comm,PETSC_NULL,"Options for loading SEQAIJ matrix","Mat");CHKERRQ(ierr); 4014bbead8a2SBarry Smith ierr = PetscOptionsInt("-matload_block_size","Set the blocksize used to store the matrix","MatLoad",bs,&bs,PETSC_NULL);CHKERRQ(ierr); 4015bbead8a2SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 4016bbead8a2SBarry Smith 4017fbdbba38SShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 4018fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 4019fbdbba38SShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 4020fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 4021fbdbba38SShri Abhyankar 4022bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 4023fbdbba38SShri Abhyankar 4024fbdbba38SShri Abhyankar /* read in row lengths */ 4025fbdbba38SShri Abhyankar ierr = PetscMalloc(M*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 4026fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 4027fbdbba38SShri Abhyankar 4028fbdbba38SShri Abhyankar /* check if sum of rowlengths is same as nz */ 4029fbdbba38SShri Abhyankar for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 4030fbdbba38SShri Abhyankar if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. 
no-nonzeros = %d, sum-row-lengths = %d\n",nz,sum); 4031fbdbba38SShri Abhyankar 4032fbdbba38SShri Abhyankar /* set global size if not set already*/ 4033f501eaabSShri Abhyankar if (newMat->rmap->n < 0 && newMat->rmap->N < 0 && newMat->cmap->n < 0 && newMat->cmap->N < 0) { 4034fbdbba38SShri Abhyankar ierr = MatSetSizes(newMat,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 4035aabbc4fbSShri Abhyankar } else { 4036fbdbba38SShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 4037fbdbba38SShri Abhyankar ierr = MatGetSize(newMat,&rows,&cols);CHKERRQ(ierr); 40384c5b953cSHong Zhang if (rows < 0 && cols < 0){ /* user might provide local size instead of global size */ 40394c5b953cSHong Zhang ierr = MatGetLocalSize(newMat,&rows,&cols);CHKERRQ(ierr); 40404c5b953cSHong Zhang } 4041f501eaabSShri Abhyankar if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 4042aabbc4fbSShri Abhyankar } 4043fbdbba38SShri Abhyankar ierr = MatSeqAIJSetPreallocation_SeqAIJ(newMat,0,rowlengths);CHKERRQ(ierr); 4044fbdbba38SShri Abhyankar a = (Mat_SeqAIJ*)newMat->data; 4045fbdbba38SShri Abhyankar 4046fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->j,nz,PETSC_INT);CHKERRQ(ierr); 4047fbdbba38SShri Abhyankar 4048fbdbba38SShri Abhyankar /* read in nonzero values */ 4049fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 4050fbdbba38SShri Abhyankar 4051fbdbba38SShri Abhyankar /* set matrix "i" values */ 4052fbdbba38SShri Abhyankar a->i[0] = 0; 4053fbdbba38SShri Abhyankar for (i=1; i<= M; i++) { 4054fbdbba38SShri Abhyankar a->i[i] = a->i[i-1] + rowlengths[i-1]; 4055fbdbba38SShri Abhyankar a->ilen[i-1] = rowlengths[i-1]; 4056fbdbba38SShri Abhyankar } 4057fbdbba38SShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 4058fbdbba38SShri Abhyankar 4059fbdbba38SShri Abhyankar ierr = 
MatAssemblyBegin(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4060fbdbba38SShri Abhyankar ierr = MatAssemblyEnd(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4061bbead8a2SBarry Smith if (bs > 1) {ierr = MatSetBlockSize(newMat,bs);CHKERRQ(ierr);} 4062fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4063fbdbba38SShri Abhyankar } 4064fbdbba38SShri Abhyankar 4065fbdbba38SShri Abhyankar #undef __FUNCT__ 4066b9617806SBarry Smith #define __FUNCT__ "MatEqual_SeqAIJ" 4067ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 40687264ac53SSatish Balay { 40697264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data,*b = (Mat_SeqAIJ *)B->data; 4070dfbe8321SBarry Smith PetscErrorCode ierr; 4071eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4072eeffb40dSHong Zhang PetscInt k; 4073eeffb40dSHong Zhang #endif 40747264ac53SSatish Balay 40753a40ed3dSBarry Smith PetscFunctionBegin; 4076bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4077d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4078ca44d042SBarry Smith *flg = PETSC_FALSE; 4079ca44d042SBarry Smith PetscFunctionReturn(0); 4080bcd2baecSBarry Smith } 40817264ac53SSatish Balay 40827264ac53SSatish Balay /* if the a->i are the same */ 4083d0f46423SBarry Smith ierr = PetscMemcmp(a->i,b->i,(A->rmap->n+1)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4084abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 40857264ac53SSatish Balay 40867264ac53SSatish Balay /* if a->j are the same */ 408797f1f81fSBarry Smith ierr = PetscMemcmp(a->j,b->j,(a->nz)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4088abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4089bcd2baecSBarry Smith 4090bcd2baecSBarry Smith /* if a->a are the same */ 4091eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4092eeffb40dSHong Zhang for (k=0; k<a->nz; k++){ 4093eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != 
PetscImaginaryPart(b->a[k])){ 4094eeffb40dSHong Zhang *flg = PETSC_FALSE; 40953a40ed3dSBarry Smith PetscFunctionReturn(0); 4096eeffb40dSHong Zhang } 4097eeffb40dSHong Zhang } 4098eeffb40dSHong Zhang #else 4099eeffb40dSHong Zhang ierr = PetscMemcmp(a->a,b->a,(a->nz)*sizeof(PetscScalar),flg);CHKERRQ(ierr); 4100eeffb40dSHong Zhang #endif 4101eeffb40dSHong Zhang PetscFunctionReturn(0); 41027264ac53SSatish Balay } 410336db0b34SBarry Smith 41044a2ae208SSatish Balay #undef __FUNCT__ 41054a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJWithArrays" 410605869f15SSatish Balay /*@ 410736db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 410836db0b34SBarry Smith provided by the user. 410936db0b34SBarry Smith 4110c75a6043SHong Zhang Collective on MPI_Comm 411136db0b34SBarry Smith 411236db0b34SBarry Smith Input Parameters: 411336db0b34SBarry Smith + comm - must be an MPI communicator of size 1 411436db0b34SBarry Smith . m - number of rows 411536db0b34SBarry Smith . n - number of columns 411636db0b34SBarry Smith . i - row indices 411736db0b34SBarry Smith . j - column indices 411836db0b34SBarry Smith - a - matrix values 411936db0b34SBarry Smith 412036db0b34SBarry Smith Output Parameter: 412136db0b34SBarry Smith . mat - the matrix 412236db0b34SBarry Smith 412336db0b34SBarry Smith Level: intermediate 412436db0b34SBarry Smith 412536db0b34SBarry Smith Notes: 41260551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4127292fb18eSBarry Smith once the matrix is destroyed and not before 412836db0b34SBarry Smith 412936db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 
413036db0b34SBarry Smith 4131bfeeae90SHong Zhang The i and j indices are 0 based 413236db0b34SBarry Smith 4133a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4134a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 4135a4552177SSatish Balay as shown: 4136a4552177SSatish Balay 4137a4552177SSatish Balay 1 0 0 4138a4552177SSatish Balay 2 0 3 4139a4552177SSatish Balay 4 5 6 4140a4552177SSatish Balay 4141a4552177SSatish Balay i = {0,1,3,6} [size = nrow+1 = 3+1] 41429985e31cSBarry Smith j = {0,0,2,0,1,2} [size = nz = 6]; values must be sorted for each row 4143a4552177SSatish Balay v = {1,2,3,4,5,6} [size = nz = 6] 4144a4552177SSatish Balay 41459985e31cSBarry Smith 41462fb0ec9aSBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 414736db0b34SBarry Smith 414836db0b34SBarry Smith @*/ 41497087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt* i,PetscInt*j,PetscScalar *a,Mat *mat) 415036db0b34SBarry Smith { 4151dfbe8321SBarry Smith PetscErrorCode ierr; 4152cbcfb4deSHong Zhang PetscInt ii; 415336db0b34SBarry Smith Mat_SeqAIJ *aij; 4154cbcfb4deSHong Zhang #if defined(PETSC_USE_DEBUG) 4155cbcfb4deSHong Zhang PetscInt jj; 4156cbcfb4deSHong Zhang #endif 415736db0b34SBarry Smith 415836db0b34SBarry Smith PetscFunctionBegin; 4159a96a251dSBarry Smith if (i[0]) { 4160e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 416136db0b34SBarry Smith } 4162f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4163f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4164ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4165ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4166ab93d7beSBarry Smith aij = 
(Mat_SeqAIJ*)(*mat)->data; 4167ab93d7beSBarry Smith ierr = PetscMalloc2(m,PetscInt,&aij->imax,m,PetscInt,&aij->ilen);CHKERRQ(ierr); 4168ab93d7beSBarry Smith 416936db0b34SBarry Smith aij->i = i; 417036db0b34SBarry Smith aij->j = j; 417136db0b34SBarry Smith aij->a = a; 417236db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 417336db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4174e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4175e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 417636db0b34SBarry Smith 417736db0b34SBarry Smith for (ii=0; ii<m; ii++) { 417836db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 41792515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 4180e32f2f54SBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %d length = %d",ii,i[ii+1] - i[ii]); 41819985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4182e32f2f54SBarry Smith if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4183e32f2f54SBarry Smith if (j[jj] == j[jj]-1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 41849985e31cSBarry Smith } 418536db0b34SBarry Smith #endif 418636db0b34SBarry Smith } 41872515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 418836db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 4189e32f2f54SBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %d index = %d",ii,j[ii]); 4190e32f2f54SBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %d index = %d",ii,j[ii]); 419136db0b34SBarry Smith } 419236db0b34SBarry Smith #endif 419336db0b34SBarry Smith 
4194b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4195b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 419636db0b34SBarry Smith PetscFunctionReturn(0); 419736db0b34SBarry Smith } 419836db0b34SBarry Smith 4199cc8ba8e1SBarry Smith #undef __FUNCT__ 4200ee4f033dSBarry Smith #define __FUNCT__ "MatSetColoring_SeqAIJ" 4201dfbe8321SBarry Smith PetscErrorCode MatSetColoring_SeqAIJ(Mat A,ISColoring coloring) 4202cc8ba8e1SBarry Smith { 4203dfbe8321SBarry Smith PetscErrorCode ierr; 4204cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 420536db0b34SBarry Smith 4206cc8ba8e1SBarry Smith PetscFunctionBegin; 42078ee2e534SBarry Smith if (coloring->ctype == IS_COLORING_GLOBAL) { 4208cc8ba8e1SBarry Smith ierr = ISColoringReference(coloring);CHKERRQ(ierr); 4209cc8ba8e1SBarry Smith a->coloring = coloring; 421012c595b3SBarry Smith } else if (coloring->ctype == IS_COLORING_GHOSTED) { 421197f1f81fSBarry Smith PetscInt i,*larray; 421212c595b3SBarry Smith ISColoring ocoloring; 421308b6dcc0SBarry Smith ISColoringValue *colors; 421412c595b3SBarry Smith 421512c595b3SBarry Smith /* set coloring for diagonal portion */ 42160e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(PetscInt),&larray);CHKERRQ(ierr); 4217d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 421812c595b3SBarry Smith larray[i] = i; 421912c595b3SBarry Smith } 4220992144d0SBarry Smith ierr = ISGlobalToLocalMappingApply(A->cmap->mapping,IS_GTOLM_MASK,A->cmap->n,larray,PETSC_NULL,larray);CHKERRQ(ierr); 42210e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 4222d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 422312c595b3SBarry Smith colors[i] = coloring->colors[larray[i]]; 422412c595b3SBarry Smith } 422512c595b3SBarry Smith ierr = PetscFree(larray);CHKERRQ(ierr); 4226d0f46423SBarry Smith ierr = ISColoringCreate(PETSC_COMM_SELF,coloring->n,A->cmap->n,colors,&ocoloring);CHKERRQ(ierr); 
422712c595b3SBarry Smith a->coloring = ocoloring; 422812c595b3SBarry Smith } 4229cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4230cc8ba8e1SBarry Smith } 4231cc8ba8e1SBarry Smith 4232dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 4233ee4f033dSBarry Smith EXTERN_C_BEGIN 4234c6db04a5SJed Brown #include <adic/ad_utils.h> 4235ee4f033dSBarry Smith EXTERN_C_END 4236cc8ba8e1SBarry Smith 4237cc8ba8e1SBarry Smith #undef __FUNCT__ 4238ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdic_SeqAIJ" 4239dfbe8321SBarry Smith PetscErrorCode MatSetValuesAdic_SeqAIJ(Mat A,void *advalues) 4240cc8ba8e1SBarry Smith { 4241cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4242d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j,nlen; 42434440f671SBarry Smith PetscScalar *v = a->a,*values = ((PetscScalar*)advalues)+1; 424408b6dcc0SBarry Smith ISColoringValue *color; 4245cc8ba8e1SBarry Smith 4246cc8ba8e1SBarry Smith PetscFunctionBegin; 4247e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 42484440f671SBarry Smith nlen = PetscADGetDerivTypeSize()/sizeof(PetscScalar); 4249cc8ba8e1SBarry Smith color = a->coloring->colors; 4250cc8ba8e1SBarry Smith /* loop over rows */ 4251cc8ba8e1SBarry Smith for (i=0; i<m; i++) { 4252cc8ba8e1SBarry Smith nz = ii[i+1] - ii[i]; 4253cc8ba8e1SBarry Smith /* loop over columns putting computed value into matrix */ 4254cc8ba8e1SBarry Smith for (j=0; j<nz; j++) { 4255cc8ba8e1SBarry Smith *v++ = values[color[*jj++]]; 4256cc8ba8e1SBarry Smith } 42574440f671SBarry Smith values += nlen; /* jump to next row of derivatives */ 4258ee4f033dSBarry Smith } 4259ee4f033dSBarry Smith PetscFunctionReturn(0); 4260ee4f033dSBarry Smith } 4261ee4f033dSBarry Smith #endif 4262ee4f033dSBarry Smith 4263ee4f033dSBarry Smith #undef __FUNCT__ 4264ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdifor_SeqAIJ" 426597f1f81fSBarry Smith PetscErrorCode MatSetValuesAdifor_SeqAIJ(Mat 
A,PetscInt nl,void *advalues) 4266ee4f033dSBarry Smith { 4267ee4f033dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4268d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j; 426954f21887SBarry Smith MatScalar *v = a->a; 427054f21887SBarry Smith PetscScalar *values = (PetscScalar *)advalues; 427108b6dcc0SBarry Smith ISColoringValue *color; 4272ee4f033dSBarry Smith 4273ee4f033dSBarry Smith PetscFunctionBegin; 4274e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 4275ee4f033dSBarry Smith color = a->coloring->colors; 4276ee4f033dSBarry Smith /* loop over rows */ 4277ee4f033dSBarry Smith for (i=0; i<m; i++) { 4278ee4f033dSBarry Smith nz = ii[i+1] - ii[i]; 4279ee4f033dSBarry Smith /* loop over columns putting computed value into matrix */ 4280ee4f033dSBarry Smith for (j=0; j<nz; j++) { 4281ee4f033dSBarry Smith *v++ = values[color[*jj++]]; 4282ee4f033dSBarry Smith } 4283ee4f033dSBarry Smith values += nl; /* jump to next row of derivatives */ 4284cc8ba8e1SBarry Smith } 4285cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4286cc8ba8e1SBarry Smith } 428736db0b34SBarry Smith 428881824310SBarry Smith /* 428981824310SBarry Smith Special version for direct calls from Fortran 429081824310SBarry Smith */ 4291c6db04a5SJed Brown #include <private/fortranimpl.h> 429281824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 429381824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 429481824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 429581824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 429681824310SBarry Smith #endif 429781824310SBarry Smith 429881824310SBarry Smith /* Change these macros so can be used in void function */ 429981824310SBarry Smith #undef CHKERRQ 43007adad957SLisandro Dalcin #define CHKERRQ(ierr) CHKERRABORT(((PetscObject)A)->comm,ierr) 430181824310SBarry Smith #undef SETERRQ2 4302e32f2f54SBarry Smith #define 
SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 430381824310SBarry Smith 430481824310SBarry Smith EXTERN_C_BEGIN 430581824310SBarry Smith #undef __FUNCT__ 430681824310SBarry Smith #define __FUNCT__ "matsetvaluesseqaij_" 43071f6cc5b2SSatish Balay void PETSC_STDCALL matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 430881824310SBarry Smith { 430981824310SBarry Smith Mat A = *AA; 431081824310SBarry Smith PetscInt m = *mm, n = *nn; 431181824310SBarry Smith InsertMode is = *isis; 431281824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 431381824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 431481824310SBarry Smith PetscInt *imax,*ai,*ailen; 431581824310SBarry Smith PetscErrorCode ierr; 431681824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 431754f21887SBarry Smith MatScalar *ap,value,*aa; 4318ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 4319ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 432081824310SBarry Smith 432181824310SBarry Smith PetscFunctionBegin; 4322d9e2c085SLisandro Dalcin ierr = MatPreallocated(A);CHKERRQ(ierr); 432381824310SBarry Smith imax = a->imax; 432481824310SBarry Smith ai = a->i; 432581824310SBarry Smith ailen = a->ilen; 432681824310SBarry Smith aj = a->j; 432781824310SBarry Smith aa = a->a; 432881824310SBarry Smith 432981824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 433081824310SBarry Smith row = im[k]; 433181824310SBarry Smith if (row < 0) continue; 433281824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4333d0f46423SBarry Smith if (row >= A->rmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 433481824310SBarry Smith #endif 433581824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 433681824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 433781824310SBarry Smith low = 0; 433881824310SBarry 
Smith high = nrow; 433981824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 434081824310SBarry Smith if (in[l] < 0) continue; 434181824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4342d0f46423SBarry Smith if (in[l] >= A->cmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 434381824310SBarry Smith #endif 434481824310SBarry Smith col = in[l]; 434581824310SBarry Smith if (roworiented) { 434681824310SBarry Smith value = v[l + k*n]; 434781824310SBarry Smith } else { 434881824310SBarry Smith value = v[k + l*m]; 434981824310SBarry Smith } 435081824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 435181824310SBarry Smith 435281824310SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 435381824310SBarry Smith lastcol = col; 435481824310SBarry Smith while (high-low > 5) { 435581824310SBarry Smith t = (low+high)/2; 435681824310SBarry Smith if (rp[t] > col) high = t; 435781824310SBarry Smith else low = t; 435881824310SBarry Smith } 435981824310SBarry Smith for (i=low; i<high; i++) { 436081824310SBarry Smith if (rp[i] > col) break; 436181824310SBarry Smith if (rp[i] == col) { 436281824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 436381824310SBarry Smith else ap[i] = value; 436481824310SBarry Smith goto noinsert; 436581824310SBarry Smith } 436681824310SBarry Smith } 436781824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 436881824310SBarry Smith if (nonew == 1) goto noinsert; 43697adad957SLisandro Dalcin if (nonew == -1) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 4370fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 437181824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 437281824310SBarry Smith /* shift up all the later entries in this row */ 437381824310SBarry Smith for (ii=N; ii>=i; ii--) { 437481824310SBarry Smith 
rp[ii+1] = rp[ii]; 437581824310SBarry Smith ap[ii+1] = ap[ii]; 437681824310SBarry Smith } 437781824310SBarry Smith rp[i] = col; 437881824310SBarry Smith ap[i] = value; 437981824310SBarry Smith noinsert:; 438081824310SBarry Smith low = i + 1; 438181824310SBarry Smith } 438281824310SBarry Smith ailen[row] = nrow; 438381824310SBarry Smith } 438481824310SBarry Smith A->same_nonzero = PETSC_FALSE; 438581824310SBarry Smith PetscFunctionReturnVoid(); 438681824310SBarry Smith } 438781824310SBarry Smith EXTERN_C_END 438862298a1eSBarry Smith 4389