1b377110cSBarry Smith 2d5d45c9bSBarry Smith /* 33369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 4d5d45c9bSBarry Smith matrix storage format. 5d5d45c9bSBarry Smith */ 63369ce9aSBarry Smith 77c4f633dSBarry Smith 8c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 9c6db04a5SJed Brown #include <petscblaslapack.h> 10c6db04a5SJed Brown #include <petscbt.h> 11d441b888SJed Brown #include <../src/mat/blocktranspose.h> 120716a85fSBarry Smith 130716a85fSBarry Smith #undef __FUNCT__ 140716a85fSBarry Smith #define __FUNCT__ "MatGetColumnNorms_SeqAIJ" 150716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 160716a85fSBarry Smith { 170716a85fSBarry Smith PetscErrorCode ierr; 180716a85fSBarry Smith PetscInt i,m,n; 190716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 200716a85fSBarry Smith 210716a85fSBarry Smith PetscFunctionBegin; 220716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 230716a85fSBarry Smith ierr = PetscMemzero(norms,n*sizeof(PetscReal));CHKERRQ(ierr); 240716a85fSBarry Smith if (type == NORM_2) { 250716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 260716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 270716a85fSBarry Smith } 280716a85fSBarry Smith } else if (type == NORM_1) { 290716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 300716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 310716a85fSBarry Smith } 320716a85fSBarry Smith } else if (type == NORM_INFINITY) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 340716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 370716a85fSBarry Smith 380716a85fSBarry Smith if (type == NORM_2) { 398f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith PetscFunctionReturn(0); 420716a85fSBarry Smith } 430716a85fSBarry Smith 444a2ae208SSatish Balay #undef __FUNCT__ 456ce1633cSBarry Smith #define __FUNCT__ "MatFindZeroDiagonals_SeqAIJ" 466ce1633cSBarry Smith PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 476ce1633cSBarry Smith { 486ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 496ce1633cSBarry Smith const MatScalar *aa = a->a; 506ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 516ce1633cSBarry Smith const PetscInt *jj = a->j,*diag; 526ce1633cSBarry Smith PetscInt *rows; 536ce1633cSBarry Smith PetscErrorCode ierr; 546ce1633cSBarry Smith 556ce1633cSBarry Smith PetscFunctionBegin; 566ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 576ce1633cSBarry Smith diag = a->diag; 586ce1633cSBarry Smith for (i=0; i<m; i++) { 596ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 606ce1633cSBarry Smith cnt++; 616ce1633cSBarry Smith } 626ce1633cSBarry Smith } 636ce1633cSBarry Smith ierr = PetscMalloc(cnt*sizeof(PetscInt),&rows);CHKERRQ(ierr); 646ce1633cSBarry Smith cnt = 0; 656ce1633cSBarry Smith for (i=0; i<m; i++) { 666ce1633cSBarry Smith if ((jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 676ce1633cSBarry Smith rows[cnt++] = i; 686ce1633cSBarry Smith } 696ce1633cSBarry Smith } 706ce1633cSBarry Smith ierr = ISCreateGeneral(((PetscObject)A)->comm,cnt,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 716ce1633cSBarry Smith PetscFunctionReturn(0); 726ce1633cSBarry Smith } 736ce1633cSBarry Smith 746ce1633cSBarry Smith #undef __FUNCT__ 75b3a44c85SBarry Smith #define __FUNCT__ "MatFindNonzeroRows_SeqAIJ" 76b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 77b3a44c85SBarry Smith { 78b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 79b3a44c85SBarry Smith const MatScalar *aa; 80b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 81b3a44c85SBarry Smith const PetscInt *ii; 82b3a44c85SBarry Smith PetscInt n,i,j,*rows; 83b3a44c85SBarry Smith PetscErrorCode ierr; 84b3a44c85SBarry Smith 85b3a44c85SBarry Smith PetscFunctionBegin; 86b3a44c85SBarry Smith *keptrows = 0; 87b3a44c85SBarry Smith ii = a->i; 88b3a44c85SBarry Smith for (i=0; i<m; i++) { 89b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 90b3a44c85SBarry Smith if (!n) { 91b3a44c85SBarry Smith cnt++; 92b3a44c85SBarry Smith goto ok1; 93b3a44c85SBarry Smith } 94b3a44c85SBarry Smith aa = a->a + ii[i]; 95b3a44c85SBarry Smith for (j=0; j<n; j++) { 96b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 97b3a44c85SBarry Smith } 98b3a44c85SBarry Smith cnt++; 99b3a44c85SBarry Smith ok1:; 100b3a44c85SBarry Smith } 101b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 102b3a44c85SBarry Smith ierr = PetscMalloc((A->rmap->n-cnt)*sizeof(PetscInt),&rows);CHKERRQ(ierr); 103b3a44c85SBarry Smith cnt = 0; 104b3a44c85SBarry Smith for (i=0; i<m; i++) { 105b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 106b3a44c85SBarry Smith if (!n) continue; 107b3a44c85SBarry Smith aa = a->a + ii[i]; 108b3a44c85SBarry Smith for (j=0; j<n; j++) { 109b3a44c85SBarry Smith if (aa[j] != 0.0) { 110b3a44c85SBarry Smith rows[cnt++] = i; 111b3a44c85SBarry Smith break; 112b3a44c85SBarry Smith } 113b3a44c85SBarry Smith } 114b3a44c85SBarry Smith } 115b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 116b3a44c85SBarry Smith PetscFunctionReturn(0); 117b3a44c85SBarry Smith } 118b3a44c85SBarry Smith 119b3a44c85SBarry Smith #undef __FUNCT__ 12079299369SBarry Smith #define __FUNCT__ "MatDiagonalSet_SeqAIJ" 1217087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 12279299369SBarry Smith { 12379299369SBarry Smith PetscErrorCode ierr; 12479299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 125d0f46423SBarry Smith PetscInt i,*diag, m = Y->rmap->n; 12654f21887SBarry Smith MatScalar *aa = aij->a; 12754f21887SBarry Smith PetscScalar *v; 128ace3abfcSBarry Smith PetscBool missing; 12979299369SBarry Smith 13079299369SBarry Smith PetscFunctionBegin; 13109f38230SBarry Smith if (Y->assembled) { 13209f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,PETSC_NULL);CHKERRQ(ierr); 13309f38230SBarry Smith if (!missing) { 13479299369SBarry Smith diag = aij->diag; 13579299369SBarry Smith ierr = VecGetArray(D,&v);CHKERRQ(ierr); 13679299369SBarry Smith if (is == INSERT_VALUES) { 13779299369SBarry Smith for (i=0; i<m; i++) { 13879299369SBarry Smith aa[diag[i]] = v[i]; 13979299369SBarry Smith } 14079299369SBarry Smith } else { 14179299369SBarry Smith for (i=0; i<m; i++) { 14279299369SBarry Smith aa[diag[i]] += v[i]; 14379299369SBarry Smith } 14479299369SBarry Smith } 14579299369SBarry Smith ierr = VecRestoreArray(D,&v);CHKERRQ(ierr); 14679299369SBarry Smith PetscFunctionReturn(0); 14779299369SBarry Smith } 14886c113feSBarry Smith aij->idiagvalid = PETSC_FALSE; 14986c113feSBarry Smith aij->ibdiagvalid = PETSC_FALSE; 15009f38230SBarry Smith } 15109f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 15209f38230SBarry Smith PetscFunctionReturn(0); 15309f38230SBarry Smith } 15479299369SBarry Smith 15579299369SBarry Smith #undef __FUNCT__ 1564a2ae208SSatish Balay #define __FUNCT__ "MatGetRowIJ_SeqAIJ" 157ace3abfcSBarry Smith PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 15817ab2063SBarry Smith { 159416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 160dfbe8321SBarry Smith PetscErrorCode ierr; 16197f1f81fSBarry Smith PetscInt i,ishift; 16217ab2063SBarry Smith 1633a40ed3dSBarry Smith PetscFunctionBegin; 164d0f46423SBarry Smith *m = A->rmap->n; 1653a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 166bfeeae90SHong Zhang ishift = 0; 16753e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 168d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,ishift,oshift,ia,ja);CHKERRQ(ierr); 169bfeeae90SHong Zhang } else if (oshift == 1) { 170d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 1713b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 172d0f46423SBarry Smith ierr = PetscMalloc((A->rmap->n+1)*sizeof(PetscInt),ia);CHKERRQ(ierr); 173d0f46423SBarry Smith for (i=0; i<A->rmap->n+1; i++) (*ia)[i] = a->i[i] + 1; 174ecc77c7aSBarry Smith if (ja) { 17597f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),ja);CHKERRQ(ierr); 1763b2fbd54SBarry Smith for (i=0; i<nz; i++) (*ja)[i] = a->j[i] + 1; 177ecc77c7aSBarry Smith } 1786945ee14SBarry Smith } else { 179ecc77c7aSBarry Smith *ia = a->i; 180ecc77c7aSBarry Smith if (ja) *ja = a->j; 181a2ce50c7SBarry Smith } 1823a40ed3dSBarry Smith PetscFunctionReturn(0); 183a2744918SBarry Smith } 184a2744918SBarry Smith 1854a2ae208SSatish Balay #undef __FUNCT__ 1864a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRowIJ_SeqAIJ" 187ace3abfcSBarry Smith PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 1886945ee14SBarry Smith { 189dfbe8321SBarry Smith PetscErrorCode ierr; 1906945ee14SBarry Smith 1913a40ed3dSBarry Smith PetscFunctionBegin; 1923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 193bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 194606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 195ecc77c7aSBarry Smith if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 196bcd2baecSBarry Smith } 1973a40ed3dSBarry Smith PetscFunctionReturn(0); 19817ab2063SBarry Smith } 19917ab2063SBarry Smith 2004a2ae208SSatish Balay #undef __FUNCT__ 2014a2ae208SSatish Balay #define __FUNCT__ "MatGetColumnIJ_SeqAIJ" 202ace3abfcSBarry Smith PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2033b2fbd54SBarry Smith { 2043b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 205dfbe8321SBarry Smith PetscErrorCode ierr; 206d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 20797f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2083b2fbd54SBarry Smith 2093a40ed3dSBarry Smith PetscFunctionBegin; 210899cda47SBarry Smith *nn = n; 2113a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2123b2fbd54SBarry Smith if (symmetric) { 213d0f46423SBarry Smith ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,0,oshift,ia,ja);CHKERRQ(ierr); 2143b2fbd54SBarry Smith } else { 21597f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&collengths);CHKERRQ(ierr); 21697f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 21797f1f81fSBarry Smith ierr = PetscMalloc((n+1)*sizeof(PetscInt),&cia);CHKERRQ(ierr); 21897f1f81fSBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscInt),&cja);CHKERRQ(ierr); 2193b2fbd54SBarry Smith jj = a->j; 2203b2fbd54SBarry Smith for (i=0; i<nz; i++) { 221bfeeae90SHong Zhang collengths[jj[i]]++; 2223b2fbd54SBarry Smith } 2233b2fbd54SBarry Smith cia[0] = oshift; 2243b2fbd54SBarry Smith for (i=0; i<n; i++) { 2253b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2263b2fbd54SBarry Smith } 22797f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 2283b2fbd54SBarry Smith jj = a->j; 229a93ec695SBarry Smith for (row=0; row<m; row++) { 230a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 231a93ec695SBarry Smith for (i=0; i<mr; i++) { 232bfeeae90SHong Zhang col = *jj++; 2333b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2343b2fbd54SBarry Smith } 2353b2fbd54SBarry Smith } 236606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 2373b2fbd54SBarry Smith *ia = cia; *ja = cja; 2383b2fbd54SBarry Smith } 2393a40ed3dSBarry Smith PetscFunctionReturn(0); 2403b2fbd54SBarry Smith } 2413b2fbd54SBarry Smith 2424a2ae208SSatish Balay #undef __FUNCT__ 2434a2ae208SSatish Balay #define __FUNCT__ "MatRestoreColumnIJ_SeqAIJ" 244ace3abfcSBarry Smith PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,PetscInt *ia[],PetscInt *ja[],PetscBool *done) 2453b2fbd54SBarry Smith { 246dfbe8321SBarry Smith PetscErrorCode ierr; 247606d414cSSatish Balay 2483a40ed3dSBarry Smith PetscFunctionBegin; 2493a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2503b2fbd54SBarry Smith 251606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 252606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 2533b2fbd54SBarry Smith 2543a40ed3dSBarry Smith PetscFunctionReturn(0); 2553b2fbd54SBarry Smith } 2563b2fbd54SBarry Smith 25787d4246cSBarry Smith #undef __FUNCT__ 25887d4246cSBarry Smith #define __FUNCT__ "MatSetValuesRow_SeqAIJ" 25987d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 26087d4246cSBarry Smith { 26187d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 26287d4246cSBarry Smith PetscInt *ai = a->i; 26387d4246cSBarry Smith PetscErrorCode ierr; 26487d4246cSBarry Smith 26587d4246cSBarry Smith PetscFunctionBegin; 26687d4246cSBarry Smith ierr = PetscMemcpy(a->a+ai[row],v,(ai[row+1]-ai[row])*sizeof(PetscScalar));CHKERRQ(ierr); 26787d4246cSBarry Smith PetscFunctionReturn(0); 26887d4246cSBarry Smith } 26987d4246cSBarry Smith 2704a2ae208SSatish Balay #undef __FUNCT__ 2714a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqAIJ" 27297f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 27317ab2063SBarry Smith { 274416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 275e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 27697f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 2776849ba73SBarry Smith PetscErrorCode ierr; 278e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 27954f21887SBarry Smith MatScalar *ap,value,*aa = a->a; 280ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 281ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 28217ab2063SBarry Smith 2833a40ed3dSBarry Smith PetscFunctionBegin; 28471fd2e92SBarry Smith if (v) PetscValidScalarPointer(v,6); 28517ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 286416022c9SBarry Smith row = im[k]; 2875ef9f2a5SBarry Smith if (row < 0) continue; 2882515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 289e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 2903b2fbd54SBarry Smith #endif 291bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 29217ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 293416022c9SBarry Smith low = 0; 294c71e6ed7SBarry Smith high = nrow; 29517ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 2965ef9f2a5SBarry Smith if (in[l] < 0) continue; 2972515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 298e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 2993b2fbd54SBarry Smith #endif 300bfeeae90SHong Zhang col = in[l]; 30116371a99SBarry Smith if (v) { 3024b0e389bSBarry Smith if (roworiented) { 3035ef9f2a5SBarry Smith value = v[l + k*n]; 304bef8e0ddSBarry Smith } else { 3054b0e389bSBarry Smith value = v[k + l*m]; 3064b0e389bSBarry Smith } 30716371a99SBarry Smith } else { 30875567043SBarry Smith value = 0.; 30916371a99SBarry Smith } 310abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 31136db0b34SBarry Smith 3127cd84e04SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 313e2ee6c50SBarry Smith lastcol = col; 314416022c9SBarry Smith while (high-low > 5) { 315416022c9SBarry Smith t = (low+high)/2; 316416022c9SBarry Smith if (rp[t] > col) high = t; 317416022c9SBarry Smith else low = t; 31817ab2063SBarry Smith } 319416022c9SBarry Smith for (i=low; i<high; i++) { 32017ab2063SBarry Smith if (rp[i] > col) break; 32117ab2063SBarry Smith if (rp[i] == col) { 322416022c9SBarry Smith if (is == ADD_VALUES) ap[i] += value; 32317ab2063SBarry Smith else ap[i] = value; 324e44c0bd4SBarry Smith low = i + 1; 32517ab2063SBarry Smith goto noinsert; 32617ab2063SBarry Smith } 32717ab2063SBarry Smith } 328abc0a331SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 329c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 330e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 331fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 332c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 333416022c9SBarry Smith /* shift up all the later entries in this row */ 334416022c9SBarry Smith for (ii=N; ii>=i; ii--) { 33517ab2063SBarry Smith rp[ii+1] = rp[ii]; 33617ab2063SBarry Smith ap[ii+1] = ap[ii]; 33717ab2063SBarry Smith } 33817ab2063SBarry Smith rp[i] = col; 33917ab2063SBarry Smith ap[i] = value; 340416022c9SBarry Smith low = i + 1; 341e44c0bd4SBarry Smith noinsert:; 34217ab2063SBarry Smith } 34317ab2063SBarry Smith ailen[row] = nrow; 34417ab2063SBarry Smith } 34588e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 3463a40ed3dSBarry Smith PetscFunctionReturn(0); 34717ab2063SBarry Smith } 34817ab2063SBarry Smith 34981824310SBarry Smith 3504a2ae208SSatish Balay #undef __FUNCT__ 3514a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqAIJ" 352a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 3537eb43aa7SLois Curfman McInnes { 3547eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35597f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 35697f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 35754f21887SBarry Smith MatScalar *ap,*aa = a->a; 3587eb43aa7SLois Curfman McInnes 3593a40ed3dSBarry Smith PetscFunctionBegin; 3607eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 3617eb43aa7SLois Curfman McInnes row = im[k]; 362e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 363e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 364bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 3657eb43aa7SLois Curfman McInnes nrow = ailen[row]; 3667eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 367e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 368e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 369bfeeae90SHong Zhang col = in[l] ; 3707eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 3717eb43aa7SLois Curfman McInnes while (high-low > 5) { 3727eb43aa7SLois Curfman McInnes t = (low+high)/2; 3737eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 3747eb43aa7SLois Curfman McInnes else low = t; 3757eb43aa7SLois Curfman McInnes } 3767eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 3777eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 3787eb43aa7SLois Curfman McInnes if (rp[i] == col) { 379b49de8d1SLois Curfman McInnes *v++ = ap[i]; 3807eb43aa7SLois Curfman McInnes goto finished; 3817eb43aa7SLois Curfman McInnes } 3827eb43aa7SLois Curfman McInnes } 38397e567efSBarry Smith *v++ = 0.0; 3847eb43aa7SLois Curfman McInnes finished:; 3857eb43aa7SLois Curfman McInnes } 3867eb43aa7SLois Curfman McInnes } 3873a40ed3dSBarry Smith PetscFunctionReturn(0); 3887eb43aa7SLois Curfman McInnes } 3897eb43aa7SLois Curfman McInnes 39017ab2063SBarry Smith 3914a2ae208SSatish Balay #undef __FUNCT__ 3924a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Binary" 393dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer) 39417ab2063SBarry Smith { 395416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3966849ba73SBarry Smith PetscErrorCode ierr; 3976f69ff64SBarry Smith PetscInt i,*col_lens; 3986f69ff64SBarry Smith int fd; 39917ab2063SBarry Smith 4003a40ed3dSBarry Smith PetscFunctionBegin; 401b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 402d0f46423SBarry Smith ierr = PetscMalloc((4+A->rmap->n)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 4030700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 404d0f46423SBarry Smith col_lens[1] = A->rmap->n; 405d0f46423SBarry Smith col_lens[2] = A->cmap->n; 406416022c9SBarry Smith col_lens[3] = a->nz; 407416022c9SBarry Smith 408416022c9SBarry Smith /* store lengths of each row and write (including header) to file */ 409d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 410416022c9SBarry Smith col_lens[4+i] = a->i[i+1] - a->i[i]; 41117ab2063SBarry Smith } 412d0f46423SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+A->rmap->n,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 413606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 414416022c9SBarry Smith 415416022c9SBarry Smith /* store column indices (zero start index) */ 4166f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 417416022c9SBarry Smith 418416022c9SBarry Smith /* store nonzero values */ 4196f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 4203a40ed3dSBarry Smith PetscFunctionReturn(0); 42117ab2063SBarry Smith } 422416022c9SBarry Smith 42309573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 424cd155464SBarry Smith 4254a2ae208SSatish Balay #undef __FUNCT__ 4264a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_ASCII" 427dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 428416022c9SBarry Smith { 429416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 430dfbe8321SBarry Smith PetscErrorCode ierr; 431d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,shift=0; 432e060cb09SBarry Smith const char *name; 433f3ef73ceSBarry Smith PetscViewerFormat format; 43417ab2063SBarry Smith 4353a40ed3dSBarry Smith PetscFunctionBegin; 436b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 43771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 43897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 439d0f46423SBarry Smith if ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-!shift)) { 440d00d2cf4SBarry Smith nofinalvalue = 1; 441d00d2cf4SBarry Smith } 442d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 443d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 44477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 44577431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 446b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 44717ab2063SBarry Smith 44817ab2063SBarry Smith for (i=0; i<m; i++) { 449416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 450aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 45177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e + %18.16ei \n",i+1,a->j[j]+!shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 45217ab2063SBarry Smith #else 45377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+!shift,a->a[j]);CHKERRQ(ierr); 45417ab2063SBarry Smith #endif 45517ab2063SBarry Smith } 45617ab2063SBarry Smith } 457d00d2cf4SBarry Smith if (nofinalvalue) { 458d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 459d00d2cf4SBarry Smith } 460317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 461fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 462d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 46368369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 464cd155464SBarry Smith PetscFunctionReturn(0); 465fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 466d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4677566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 46844cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 46977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 47044cd7ae7SLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 471aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 47236db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 473a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47436db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 475a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 47636db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 477a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 4786831982aSBarry Smith } 47944cd7ae7SLois Curfman McInnes #else 480a83599f4SBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr);} 48144cd7ae7SLois Curfman McInnes #endif 48244cd7ae7SLois Curfman McInnes } 483b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 48444cd7ae7SLois Curfman McInnes } 485d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 486fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 48797f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 488d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4897566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 49097f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&sptr);CHKERRQ(ierr); 491496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 492496be53dSLois Curfman McInnes sptr[i] = nzd+1; 493496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 494496be53dSLois Curfman McInnes if (a->j[j] >= i) { 495aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 49636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 497496be53dSLois Curfman McInnes #else 498496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 499496be53dSLois Curfman McInnes #endif 500496be53dSLois Curfman McInnes } 501496be53dSLois Curfman McInnes } 502496be53dSLois Curfman McInnes } 5032e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 50477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 5052e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 50677431f27SBarry Smith if (i+4<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr);} 50777431f27SBarry Smith else if (i+3<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr);} 50877431f27SBarry Smith else if (i+2<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr);} 50977431f27SBarry Smith else if (i+1<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr);} 51077431f27SBarry Smith else if (i<m) {ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr);} 51177431f27SBarry Smith else {ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr);} 512496be53dSLois Curfman McInnes } 513b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 514606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 515496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 516496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 51777431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 518496be53dSLois Curfman McInnes } 519b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 520496be53dSLois Curfman McInnes } 521b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 522496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 523496be53dSLois Curfman McInnes for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 524496be53dSLois Curfman McInnes if (a->j[j] >= i) { 525aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 52636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 527b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5286831982aSBarry Smith } 529496be53dSLois Curfman McInnes #else 530b0a32e0cSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",a->a[j]);CHKERRQ(ierr);} 531496be53dSLois Curfman McInnes #endif 532496be53dSLois Curfman McInnes } 533496be53dSLois Curfman McInnes } 534b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 535496be53dSLois Curfman McInnes } 536d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 537fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 53897f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 53987828ca2SBarry Smith PetscScalar value; 54002594712SBarry Smith 541d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5427566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 54302594712SBarry Smith for (i=0; i<m; i++) { 54402594712SBarry Smith jcnt = 0; 545d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 546e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 54702594712SBarry Smith value = a->a[cnt++]; 548e24b481bSBarry Smith jcnt++; 54902594712SBarry Smith } else { 55002594712SBarry Smith value = 0.0; 55102594712SBarry Smith } 552aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 553b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",PetscRealPart(value),PetscImaginaryPart(value));CHKERRQ(ierr); 55402594712SBarry Smith #else 555b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",value);CHKERRQ(ierr); 55602594712SBarry Smith #endif 55702594712SBarry Smith } 558b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 55902594712SBarry Smith } 560d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5613c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 562d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5637566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 5643c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5653c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%%matrix complex general\n");CHKERRQ(ierr); 5663c215bfdSMatthew Knepley #else 5673c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%%matrix real general\n");CHKERRQ(ierr); 5683c215bfdSMatthew Knepley #endif 569d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 5703c215bfdSMatthew Knepley for (i=0; i<m; i++) { 5713c215bfdSMatthew Knepley for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 5723c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 5733c215bfdSMatthew Knepley if (PetscImaginaryPart(a->a[j]) > 0.0) { 5743c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5753c215bfdSMatthew Knepley } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 5763c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G -%G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 5773c215bfdSMatthew Knepley } else { 5783c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D, %G\n", i+shift,a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 5793c215bfdSMatthew Knepley } 5803c215bfdSMatthew Knepley #else 5813c215bfdSMatthew Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %G\n", i+shift, a->j[j]+shift, a->a[j]);CHKERRQ(ierr); 5823c215bfdSMatthew Knepley #endif 5833c215bfdSMatthew Knepley } 5843c215bfdSMatthew Knepley } 585d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5863a40ed3dSBarry Smith } else { 587d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5887566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 589d5f3da31SBarry Smith if (A->factortype){ 59016cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 59116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 59216cd7e1dSShri Abhyankar /* L part */ 59316cd7e1dSShri Abhyankar for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 59416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 59516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 59616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 59816cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 59916cd7e1dSShri Abhyankar } else { 60016cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 60116cd7e1dSShri Abhyankar } 60216cd7e1dSShri Abhyankar #else 60316cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 60416cd7e1dSShri Abhyankar #endif 60516cd7e1dSShri Abhyankar } 60616cd7e1dSShri Abhyankar /* diagonal */ 60716cd7e1dSShri Abhyankar j = a->diag[i]; 60816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 60916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 6102c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 61116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 6122c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(1.0/a->a[j]),-PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 61316cd7e1dSShri Abhyankar } else { 6142c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 61516cd7e1dSShri Abhyankar } 61616cd7e1dSShri Abhyankar #else 6172c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,1.0/a->a[j]);CHKERRQ(ierr); 61816cd7e1dSShri Abhyankar #endif 61916cd7e1dSShri Abhyankar 62016cd7e1dSShri Abhyankar /* U part */ 62116cd7e1dSShri Abhyankar for (j=a->diag[i+1]+1+shift; j<a->diag[i]+shift; j++) { 62216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 62316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 62416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 62616cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 62716cd7e1dSShri Abhyankar } else { 62816cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 62916cd7e1dSShri Abhyankar } 63016cd7e1dSShri Abhyankar #else 63116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 63216cd7e1dSShri Abhyankar #endif 63316cd7e1dSShri Abhyankar } 63416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 63516cd7e1dSShri Abhyankar } 63616cd7e1dSShri Abhyankar } else { 63717ab2063SBarry Smith for (i=0; i<m; i++) { 63877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 639416022c9SBarry Smith for (j=a->i[i]+shift; j<a->i[i+1]+shift; j++) { 640aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 64136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 642a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 64336db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 644a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G - %G i)",a->j[j]+shift,PetscRealPart(a->a[j]),-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 6453a40ed3dSBarry Smith } else { 646a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,PetscRealPart(a->a[j]));CHKERRQ(ierr); 64717ab2063SBarry Smith } 64817ab2063SBarry Smith #else 649a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",a->j[j]+shift,a->a[j]);CHKERRQ(ierr); 65017ab2063SBarry Smith #endif 65117ab2063SBarry Smith } 652b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 65317ab2063SBarry Smith } 65416cd7e1dSShri Abhyankar } 655d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 65617ab2063SBarry Smith } 657b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 6583a40ed3dSBarry Smith PetscFunctionReturn(0); 659416022c9SBarry Smith } 660416022c9SBarry Smith 6614a2ae208SSatish Balay #undef __FUNCT__ 6624a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw_Zoom" 663dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 664416022c9SBarry Smith { 665480ef9eaSBarry Smith Mat A = (Mat) Aa; 666416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 667dfbe8321SBarry Smith PetscErrorCode ierr; 668d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,color; 66936db0b34SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,maxv = 0.0; 670b0a32e0cSBarry Smith PetscViewer viewer; 671f3ef73ceSBarry Smith PetscViewerFormat format; 672cddf8d76SBarry Smith 6733a40ed3dSBarry Smith PetscFunctionBegin; 674480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 675b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 67619bcc07fSBarry Smith 677b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 678416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 6790513a670SBarry Smith 680fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 6810513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 682b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 683416022c9SBarry Smith for (i=0; i<m; i++) { 684cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 685bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 686bfeeae90SHong Zhang x_l = a->j[j] ; x_r = x_l + 1.0; 687aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 68836db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 689cddf8d76SBarry Smith #else 690cddf8d76SBarry Smith if (a->a[j] >= 0.) continue; 691cddf8d76SBarry Smith #endif 692b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 693cddf8d76SBarry Smith } 694cddf8d76SBarry Smith } 695b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 696cddf8d76SBarry Smith for (i=0; i<m; i++) { 697cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 698bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 699bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 700cddf8d76SBarry Smith if (a->a[j] != 0.) continue; 701b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 702cddf8d76SBarry Smith } 703cddf8d76SBarry Smith } 704b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 705cddf8d76SBarry Smith for (i=0; i<m; i++) { 706cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 707bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 708bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 709aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 71036db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 711cddf8d76SBarry Smith #else 712cddf8d76SBarry Smith if (a->a[j] <= 0.) continue; 713cddf8d76SBarry Smith #endif 714b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 715416022c9SBarry Smith } 716416022c9SBarry Smith } 7170513a670SBarry Smith } else { 7180513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 7190513a670SBarry Smith /* first determine max of all nonzero values */ 72097f1f81fSBarry Smith PetscInt nz = a->nz,count; 721b0a32e0cSBarry Smith PetscDraw popup; 72236db0b34SBarry Smith PetscReal scale; 7230513a670SBarry Smith 7240513a670SBarry Smith for (i=0; i<nz; i++) { 7250513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 7260513a670SBarry Smith } 727b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 728b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 729b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 7300513a670SBarry Smith count = 0; 7310513a670SBarry Smith for (i=0; i<m; i++) { 7320513a670SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 733bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 734bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 73597f1f81fSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (PetscInt)(scale*PetscAbsScalar(a->a[count])); 736b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 7370513a670SBarry Smith count++; 7380513a670SBarry Smith } 7390513a670SBarry Smith } 7400513a670SBarry Smith } 741480ef9eaSBarry Smith PetscFunctionReturn(0); 742480ef9eaSBarry Smith } 743cddf8d76SBarry Smith 7444a2ae208SSatish Balay #undef __FUNCT__ 7454a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ_Draw" 746dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 747480ef9eaSBarry Smith { 748dfbe8321SBarry Smith PetscErrorCode ierr; 749b0a32e0cSBarry Smith PetscDraw draw; 75036db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 751ace3abfcSBarry Smith PetscBool isnull; 752480ef9eaSBarry Smith 753480ef9eaSBarry Smith PetscFunctionBegin; 754b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 755b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 756480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 757480ef9eaSBarry Smith 758480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 759d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 760480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 761b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 762b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 763480ef9eaSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 7643a40ed3dSBarry Smith PetscFunctionReturn(0); 765416022c9SBarry Smith } 766416022c9SBarry Smith 7674a2ae208SSatish Balay #undef __FUNCT__ 7684a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqAIJ" 769dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 770416022c9SBarry Smith { 771dfbe8321SBarry Smith PetscErrorCode ierr; 772ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 773416022c9SBarry Smith 7743a40ed3dSBarry Smith PetscFunctionBegin; 7752692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 7762692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 7772692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 778c45a1595SBarry Smith if (iascii) { 7793a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 7800f5bd95cSBarry Smith } else if (isbinary) { 7813a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 7820f5bd95cSBarry Smith } else if (isdraw) { 7833a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 784913ac41fSBarry Smith } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Viewer type %s not supported by SeqAIJ matrices",((PetscObject)viewer)->type_name); 7854108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 7863a40ed3dSBarry Smith PetscFunctionReturn(0); 78717ab2063SBarry Smith } 78819bcc07fSBarry Smith 7894a2ae208SSatish Balay #undef __FUNCT__ 7904a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyEnd_SeqAIJ" 791dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 79217ab2063SBarry Smith { 793416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7946849ba73SBarry Smith PetscErrorCode ierr; 79597f1f81fSBarry Smith PetscInt fshift = 0,i,j,*ai = a->i,*aj = a->j,*imax = a->imax; 796d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 79754f21887SBarry Smith MatScalar *aa = a->a,*ap; 7983447b6efSHong Zhang PetscReal ratio=0.6; 79917ab2063SBarry Smith 8003a40ed3dSBarry Smith PetscFunctionBegin; 8013a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 80217ab2063SBarry Smith 80343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 80417ab2063SBarry Smith for (i=1; i<m; i++) { 805416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 80617ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 80794a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 80817ab2063SBarry Smith if (fshift) { 809bfeeae90SHong Zhang ip = aj + ai[i] ; 810bfeeae90SHong Zhang ap = aa + ai[i] ; 81117ab2063SBarry Smith N = ailen[i]; 81217ab2063SBarry Smith for (j=0; j<N; j++) { 81317ab2063SBarry Smith ip[j-fshift] = ip[j]; 81417ab2063SBarry Smith ap[j-fshift] = ap[j]; 81517ab2063SBarry Smith } 81617ab2063SBarry Smith } 81717ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 81817ab2063SBarry Smith } 81917ab2063SBarry Smith if (m) { 82017ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 82117ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 82217ab2063SBarry Smith } 82317ab2063SBarry Smith /* reset ilen and imax for each row */ 82417ab2063SBarry Smith for (i=0; i<m; i++) { 82517ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 82617ab2063SBarry Smith } 827bfeeae90SHong Zhang a->nz = ai[m]; 82865e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 82917ab2063SBarry Smith 83009f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 831d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 832ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 833ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 8348e58a170SBarry Smith A->info.mallocs += a->reallocs; 835dd5f02e7SSatish Balay a->reallocs = 0; 8364e220ebcSLois Curfman McInnes A->info.nz_unneeded = (double)fshift; 83736db0b34SBarry Smith a->rmax = rmax; 8384e220ebcSLois Curfman McInnes 839cd6b891eSBarry Smith ierr = MatCheckCompressedRow(A,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 84088e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 84171c2f376SKris Buschelman 8424108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 84371f1c65dSBarry Smith 84471f1c65dSBarry Smith a->idiagvalid = PETSC_FALSE; 845bbead8a2SBarry Smith a->ibdiagvalid = PETSC_FALSE; 8463a40ed3dSBarry Smith PetscFunctionReturn(0); 84717ab2063SBarry Smith } 84817ab2063SBarry Smith 8494a2ae208SSatish Balay #undef __FUNCT__ 85099cafbc1SBarry Smith #define __FUNCT__ "MatRealPart_SeqAIJ" 85199cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 85299cafbc1SBarry Smith { 85399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 85499cafbc1SBarry Smith PetscInt i,nz = a->nz; 85554f21887SBarry Smith MatScalar *aa = a->a; 85699cafbc1SBarry Smith 85799cafbc1SBarry Smith PetscFunctionBegin; 85899cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 85986c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 86086c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 86199cafbc1SBarry Smith PetscFunctionReturn(0); 86299cafbc1SBarry Smith } 86399cafbc1SBarry Smith 86499cafbc1SBarry Smith #undef __FUNCT__ 86599cafbc1SBarry Smith #define __FUNCT__ "MatImaginaryPart_SeqAIJ" 86699cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 86799cafbc1SBarry Smith { 86899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 86999cafbc1SBarry Smith PetscInt i,nz = a->nz; 87054f21887SBarry Smith MatScalar *aa = a->a; 87199cafbc1SBarry Smith 87299cafbc1SBarry Smith PetscFunctionBegin; 87399cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 87486c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 87586c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 87699cafbc1SBarry Smith PetscFunctionReturn(0); 87799cafbc1SBarry Smith } 87899cafbc1SBarry Smith 87999cafbc1SBarry Smith #undef __FUNCT__ 8804a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqAIJ" 881dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 88217ab2063SBarry Smith { 883416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 884dfbe8321SBarry Smith PetscErrorCode ierr; 8853a40ed3dSBarry Smith 8863a40ed3dSBarry Smith PetscFunctionBegin; 887d0f46423SBarry Smith ierr = PetscMemzero(a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 88886c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 88986c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 8903a40ed3dSBarry Smith PetscFunctionReturn(0); 89117ab2063SBarry Smith } 892416022c9SBarry Smith 8934a2ae208SSatish Balay #undef __FUNCT__ 8944a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_SeqAIJ" 895dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 89617ab2063SBarry Smith { 897416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 898dfbe8321SBarry Smith PetscErrorCode ierr; 899d5d45c9bSBarry Smith 9003a40ed3dSBarry Smith PetscFunctionBegin; 901aa482453SBarry Smith #if defined(PETSC_USE_LOG) 902d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 90317ab2063SBarry Smith #endif 904e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 9056bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 9066bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 90705b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 908d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 90905b42c5fSBarry Smith ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr); 91071f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 91105b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 9126bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 91305b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 9146bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 91505b42c5fSBarry Smith ierr = PetscFree(a->xtoy);CHKERRQ(ierr); 9166bf464f9SBarry Smith ierr = MatDestroy(&a->XtoY);CHKERRQ(ierr); 917cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 9180b7e3e3dSHong Zhang ierr = PetscFree(a->matmult_abdense);CHKERRQ(ierr); 919a30b2313SHong Zhang 9204108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 921bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 922901853e0SKris Buschelman 923dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 924901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetColumnIndices_C","",PETSC_NULL);CHKERRQ(ierr); 925901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatStoreValues_C","",PETSC_NULL);CHKERRQ(ierr); 926901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatRetrieveValues_C","",PETSC_NULL);CHKERRQ(ierr); 927901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqsbaij_C","",PETSC_NULL);CHKERRQ(ierr); 928901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqbaij_C","",PETSC_NULL);CHKERRQ(ierr); 9295a11e1b2SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatConvert_seqaij_seqaijperm_C","",PETSC_NULL);CHKERRQ(ierr); 930901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatIsTranspose_C","",PETSC_NULL);CHKERRQ(ierr); 931901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 932a1661176SMatthew Knepley ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C","",PETSC_NULL);CHKERRQ(ierr); 933901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatReorderForNonzeroDiagonal_C","",PETSC_NULL);CHKERRQ(ierr); 9343a40ed3dSBarry Smith PetscFunctionReturn(0); 93517ab2063SBarry Smith } 93617ab2063SBarry Smith 9374a2ae208SSatish Balay #undef __FUNCT__ 9384a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqAIJ" 939ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 94017ab2063SBarry Smith { 941416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 9424846f1f5SKris Buschelman PetscErrorCode ierr; 9433a40ed3dSBarry Smith 9443a40ed3dSBarry Smith PetscFunctionBegin; 945a65d3064SKris Buschelman switch (op) { 946a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 9474e0d8c25SBarry Smith a->roworiented = flg; 948a65d3064SKris Buschelman break; 949a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 950a9817697SBarry Smith a->keepnonzeropattern = flg; 951a65d3064SKris Buschelman break; 952512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 953512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 954a65d3064SKris Buschelman break; 955a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 9564e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 957a65d3064SKris Buschelman break; 958a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 9594e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 960a65d3064SKris Buschelman break; 96128b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 96228b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 96328b2fa4aSMatthew Knepley break; 964a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 9654e0d8c25SBarry Smith a->ignorezeroentries = flg; 9660df259c2SBarry Smith break; 967cd6b891eSBarry Smith case MAT_CHECK_COMPRESSED_ROW: 968cd6b891eSBarry Smith a->compressedrow.check = flg; 969d487561eSHong Zhang break; 9703d472b54SHong Zhang case MAT_SPD: 9713d472b54SHong Zhang A->spd_set = PETSC_TRUE; 9723d472b54SHong Zhang A->spd = flg; 9733d472b54SHong Zhang if (flg) { 9743d472b54SHong Zhang A->symmetric = PETSC_TRUE; 9753d472b54SHong Zhang A->structurally_symmetric = PETSC_TRUE; 9763d472b54SHong Zhang A->symmetric_set = PETSC_TRUE; 9773d472b54SHong Zhang A->structurally_symmetric_set = PETSC_TRUE; 9783d472b54SHong Zhang } 9793d472b54SHong Zhang break; 980b1646e73SJed Brown case MAT_SYMMETRIC: 981b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 982b1646e73SJed Brown case MAT_HERMITIAN: 983b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 9844e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 985a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 986a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 987290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 988a65d3064SKris Buschelman break; 989b87ac2d8SJed Brown case MAT_USE_INODES: 990b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 991b87ac2d8SJed Brown break; 992a65d3064SKris Buschelman default: 993e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 994a65d3064SKris Buschelman } 9954108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 9963a40ed3dSBarry Smith PetscFunctionReturn(0); 99717ab2063SBarry Smith } 99817ab2063SBarry Smith 9994a2ae208SSatish Balay #undef __FUNCT__ 10004a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqAIJ" 1001dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 100217ab2063SBarry Smith { 1003416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10046849ba73SBarry Smith PetscErrorCode ierr; 1005d3e70bfaSHong Zhang PetscInt i,j,n,*ai=a->i,*aj=a->j,nz; 100635e7444dSHong Zhang PetscScalar *aa=a->a,*x,zero=0.0; 100717ab2063SBarry Smith 10083a40ed3dSBarry Smith PetscFunctionBegin; 1009d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1010e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 101135e7444dSHong Zhang 1012d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU){ 1013d3e70bfaSHong Zhang PetscInt *diag=a->diag; 101435e7444dSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 10152c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 101635e7444dSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 101735e7444dSHong Zhang PetscFunctionReturn(0); 101835e7444dSHong Zhang } 101935e7444dSHong Zhang 10202dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 10211ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 102235e7444dSHong Zhang for (i=0; i<n; i++) { 102335e7444dSHong Zhang nz = ai[i+1] - ai[i]; 10242f5a7c2eSBarry Smith if (!nz) x[i] = 0.0; 102535e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++){ 102635e7444dSHong Zhang if (aj[j] == i) { 102735e7444dSHong Zhang x[i] = aa[j]; 102817ab2063SBarry Smith break; 102917ab2063SBarry Smith } 103017ab2063SBarry Smith } 103117ab2063SBarry Smith } 10321ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 10333a40ed3dSBarry Smith PetscFunctionReturn(0); 103417ab2063SBarry Smith } 103517ab2063SBarry Smith 1036c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 10374a2ae208SSatish Balay #undef __FUNCT__ 10384a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqAIJ" 1039dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 104017ab2063SBarry Smith { 1041416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10425c897100SBarry Smith PetscScalar *x,*y; 1043dfbe8321SBarry Smith PetscErrorCode ierr; 1044d0f46423SBarry Smith PetscInt m = A->rmap->n; 10455c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1046a77337e4SBarry Smith MatScalar *v; 1047a77337e4SBarry Smith PetscScalar alpha; 104804fbf559SBarry Smith PetscInt n,i,j,*idx,*ii,*ridx=PETSC_NULL; 10493447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1050ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 10515c897100SBarry Smith #endif 105217ab2063SBarry Smith 10533a40ed3dSBarry Smith PetscFunctionBegin; 10542e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 10551ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 10561ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 10575c897100SBarry Smith 10585c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1059bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 10605c897100SBarry Smith #else 10613447b6efSHong Zhang if (usecprow){ 10623447b6efSHong Zhang m = cprow.nrows; 10633447b6efSHong Zhang ii = cprow.i; 10647b2bb3b9SHong Zhang ridx = cprow.rindex; 10653447b6efSHong Zhang } else { 10663447b6efSHong Zhang ii = a->i; 10673447b6efSHong Zhang } 106817ab2063SBarry Smith for (i=0; i<m; i++) { 10693447b6efSHong Zhang idx = a->j + ii[i] ; 10703447b6efSHong Zhang v = a->a + ii[i] ; 10713447b6efSHong Zhang n = ii[i+1] - ii[i]; 10723447b6efSHong Zhang if (usecprow){ 10737b2bb3b9SHong Zhang alpha = x[ridx[i]]; 10743447b6efSHong Zhang } else { 107517ab2063SBarry Smith alpha = x[i]; 10763447b6efSHong Zhang } 107704fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 107817ab2063SBarry Smith } 10795c897100SBarry Smith #endif 1080dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 10811ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 10821ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 10833a40ed3dSBarry Smith PetscFunctionReturn(0); 108417ab2063SBarry Smith } 108517ab2063SBarry Smith 10864a2ae208SSatish Balay #undef __FUNCT__ 10875c897100SBarry Smith #define __FUNCT__ "MatMultTranspose_SeqAIJ" 1088dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 10895c897100SBarry Smith { 1090dfbe8321SBarry Smith PetscErrorCode ierr; 10915c897100SBarry Smith 10925c897100SBarry Smith PetscFunctionBegin; 1093170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 10945c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 10955c897100SBarry Smith PetscFunctionReturn(0); 10965c897100SBarry Smith } 10975c897100SBarry Smith 1098c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 10995c897100SBarry Smith #undef __FUNCT__ 11004a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqAIJ" 1101dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 110217ab2063SBarry Smith { 1103416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1104d9fead3dSBarry Smith PetscScalar *y; 110554f21887SBarry Smith const PetscScalar *x; 110654f21887SBarry Smith const MatScalar *aa; 1107dfbe8321SBarry Smith PetscErrorCode ierr; 1108003131ecSBarry Smith PetscInt m=A->rmap->n; 1109003131ecSBarry Smith const PetscInt *aj,*ii,*ridx=PETSC_NULL; 11108aee2decSHong Zhang PetscInt n,i,nonzerorow=0; 1111362ced78SSatish Balay PetscScalar sum; 1112ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 111317ab2063SBarry Smith 1114b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 111597952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1116fee21e36SBarry Smith #endif 1117fee21e36SBarry Smith 11183a40ed3dSBarry Smith PetscFunctionBegin; 11193649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 11201ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 112197952fefSHong Zhang aj = a->j; 112297952fefSHong Zhang aa = a->a; 1123416022c9SBarry Smith ii = a->i; 11244eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 112597952fefSHong Zhang m = a->compressedrow.nrows; 112697952fefSHong Zhang ii = a->compressedrow.i; 112797952fefSHong Zhang ridx = a->compressedrow.rindex; 112897952fefSHong Zhang for (i=0; i<m; i++){ 112997952fefSHong Zhang n = ii[i+1] - ii[i]; 113097952fefSHong Zhang aj = a->j + ii[i]; 113197952fefSHong Zhang aa = a->a + ii[i]; 113297952fefSHong Zhang sum = 0.0; 1133a46b3154SVictor Eijkhout nonzerorow += (n>0); 1134003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1135003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 113697952fefSHong Zhang y[*ridx++] = sum; 113797952fefSHong Zhang } 113897952fefSHong Zhang } else { /* do not use compressed row format */ 1139b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 1140b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1141b05257ddSBarry Smith #else 114217ab2063SBarry Smith for (i=0; i<m; i++) { 1143003131ecSBarry Smith n = ii[i+1] - ii[i]; 1144003131ecSBarry Smith aj = a->j + ii[i]; 1145003131ecSBarry Smith aa = a->a + ii[i]; 114617ab2063SBarry Smith sum = 0.0; 1147a46b3154SVictor Eijkhout nonzerorow += (n>0); 1148003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 114917ab2063SBarry Smith y[i] = sum; 115017ab2063SBarry Smith } 11518d195f9aSBarry Smith #endif 1152b05257ddSBarry Smith } 1153dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 11543649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 11551ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 11563a40ed3dSBarry Smith PetscFunctionReturn(0); 115717ab2063SBarry Smith } 115817ab2063SBarry Smith 115963db405bSBarry Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 116063db405bSBarry Smith 11610c74a584SJed Brown /* ******************* */ 1162700485ddSSatish Balay #if defined(PETSC_HAVE_PTHREADCLASSES) 1163cfcfc605SKerry Stevens extern PetscBool PetscUseThreadPool; 1164fdfc40dbSShri Abhyankar #if defined(PETSC_HAVE_CPU_SET_T) 1165cfcfc605SKerry Stevens void* DoCoreAffinity(void); 1166fdfc40dbSShri Abhyankar #endif 1167cfcfc605SKerry Stevens 11680ca81413SKerry Stevens typedef struct { 11690ca81413SKerry Stevens const MatScalar* matdata; 11700ca81413SKerry Stevens const PetscScalar* vecdata; 11710ca81413SKerry Stevens PetscScalar* vecout; 11720ca81413SKerry Stevens const PetscInt* colindnz; 11730ca81413SKerry Stevens const PetscInt* rownumnz; 11740ca81413SKerry Stevens PetscInt numrows; 11750ca81413SKerry Stevens const PetscInt* specidx; 11760ca81413SKerry Stevens PetscInt nzr; 11770ca81413SKerry Stevens } MatMult_KernelData; 11780ca81413SKerry Stevens 11790ca81413SKerry Stevens void* MatMult_Kernel(void *arg) 11800ca81413SKerry Stevens { 1181cfcfc605SKerry Stevens if(PetscUseThreadPool==PETSC_FALSE) { 1182fdfc40dbSShri Abhyankar #if defined(PETSC_HAVE_CPU_SET_T) 1183cfcfc605SKerry Stevens DoCoreAffinity(); 1184fdfc40dbSShri Abhyankar #endif 1185cfcfc605SKerry Stevens } 11860ca81413SKerry Stevens MatMult_KernelData *data = (MatMult_KernelData*)arg; 11870ca81413SKerry Stevens PetscScalar sum; 11880ca81413SKerry Stevens const MatScalar *aabase = data->matdata,*aa; 11890ca81413SKerry Stevens const PetscScalar *x = data->vecdata; 11900ca81413SKerry Stevens PetscScalar *y = data->vecout; 11910ca81413SKerry Stevens const PetscInt *ajbase = data->colindnz,*aj; 11920ca81413SKerry Stevens const PetscInt *ii = data->rownumnz; 11930ca81413SKerry Stevens PetscInt m = data->numrows; 11940ca81413SKerry Stevens const PetscInt *ridx = data->specidx; 11950ca81413SKerry Stevens PetscInt i,n,nonzerorow = 0; 11960ca81413SKerry Stevens 11970ca81413SKerry Stevens if(ridx!=NULL) { 11980ca81413SKerry Stevens for (i=0; i<m; i++){ 11990ca81413SKerry Stevens n = ii[i+1] - ii[i]; 12000ca81413SKerry Stevens aj = ajbase + ii[i]; 12010ca81413SKerry Stevens aa = aabase + ii[i]; 12020ca81413SKerry Stevens sum = 0.0; 1203cfcfc605SKerry Stevens if(n>0) { 120451d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 120551d315f7SKerry Stevens nonzerorow++; 1206cfcfc605SKerry Stevens } 12070ca81413SKerry Stevens y[*ridx++] = sum; 12080ca81413SKerry Stevens } 12090ca81413SKerry Stevens } 12100ca81413SKerry Stevens else { 121151d315f7SKerry Stevens PetscInt ibase = data->nzr; 12120ca81413SKerry Stevens for (i=0; i<m; i++) { 12130ca81413SKerry Stevens n = ii[i+1] - ii[i]; 12140ca81413SKerry Stevens aj = ajbase + ii[i]; 12150ca81413SKerry Stevens aa = aabase + ii[i]; 12160ca81413SKerry Stevens sum = 0.0; 1217cfcfc605SKerry Stevens if(n>0) { 121851d315f7SKerry Stevens PetscSparseDensePlusDot(sum,x,aa,aj,n); 121951d315f7SKerry Stevens nonzerorow++; 1220cfcfc605SKerry Stevens } 122151d315f7SKerry Stevens y[i+ibase] = sum; 12220ca81413SKerry Stevens } 12230ca81413SKerry Stevens } 12240ca81413SKerry Stevens data->nzr = nonzerorow; 12250ca81413SKerry Stevens return NULL; 12260ca81413SKerry Stevens } 1227700485ddSSatish Balay #endif 12280ca81413SKerry Stevens 12290ca81413SKerry Stevens extern PetscMPIInt PetscMaxThreads; 12304b83fb64SBarry Smith extern PetscErrorCode (*MainJob)(void* (*pFunc)(void*),void**,PetscInt); 123151d315f7SKerry Stevens 12320ca81413SKerry Stevens #undef __FUNCT__ 12337d6a0e61SBarry Smith #define __FUNCT__ "MatMult_SeqAIJPThread" 12347d6a0e61SBarry Smith PetscErrorCode MatMult_SeqAIJPThread(Mat A,Vec xx,Vec yy) 12350ca81413SKerry Stevens { 12360ca81413SKerry Stevens Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12370ca81413SKerry Stevens PetscScalar *y; 12380ca81413SKerry Stevens const PetscScalar *x; 12390ca81413SKerry Stevens PetscErrorCode ierr; 12400ca81413SKerry Stevens PetscInt m=A->rmap->n,nonzerorow=0; 12410ca81413SKerry Stevens PetscBool usecprow=a->compressedrow.use; 12420ca81413SKerry Stevens 12430ca81413SKerry Stevens #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 12440ca81413SKerry Stevens #pragma disjoint(*x,*y,*aa) 12450ca81413SKerry Stevens #endif 12460ca81413SKerry Stevens 12470ca81413SKerry Stevens PetscFunctionBegin; 12480ca81413SKerry Stevens ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 12490ca81413SKerry Stevens ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 12500ca81413SKerry Stevens 12510ca81413SKerry Stevens if(usecprow) { 12520ca81413SKerry Stevens PetscInt NumPerThread,iindex; 12530ca81413SKerry Stevens const MatScalar *aa = a->a; 12540ca81413SKerry Stevens const PetscInt *aj = a->j,*ii = a->compressedrow.i,*ridx=a->compressedrow.rindex; 12550ca81413SKerry Stevens PetscInt i,iStartVal,iEndVal,iStartIndex,iEndIndex; 12560c74a584SJed Brown const PetscInt iNumThreads = PetscMaxThreads; /* this number could be different */ 1257cfcfc605SKerry Stevens MatMult_KernelData* kerneldatap = (MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 1258cfcfc605SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 12590ca81413SKerry Stevens 12600ca81413SKerry Stevens m = a->compressedrow.nrows; 12610ca81413SKerry Stevens NumPerThread = ii[m]/iNumThreads; 12620ca81413SKerry Stevens iindex = 0; 12630ca81413SKerry Stevens for(i=0; i<iNumThreads;i++) { 12640ca81413SKerry Stevens iStartIndex = iindex; 12650ca81413SKerry Stevens iStartVal = ii[iStartIndex]; 12660ca81413SKerry Stevens iEndVal = iStartVal; 12670c74a584SJed Brown /* determine number of rows to process */ 12680ca81413SKerry Stevens while(iEndVal-iStartVal<NumPerThread) { 12690ca81413SKerry Stevens iindex++; 12700ca81413SKerry Stevens iEndVal = ii[iindex]; 12710ca81413SKerry Stevens } 12720c74a584SJed Brown /* determine whether to go back 1 */ 12730ca81413SKerry Stevens if(iEndVal-iStartVal-NumPerThread>NumPerThread-(ii[iindex-1]-iStartVal)) { 12740ca81413SKerry Stevens iindex--; 12750ca81413SKerry Stevens iEndVal = ii[iindex]; 12760ca81413SKerry Stevens } 12770ca81413SKerry Stevens iEndIndex = iindex; 1278cfcfc605SKerry Stevens kerneldatap[i].matdata = aa; 12790ca81413SKerry Stevens kerneldatap[i].vecdata = x; 12800ca81413SKerry Stevens kerneldatap[i].vecout = y; 12810ca81413SKerry Stevens kerneldatap[i].colindnz = aj; 12820ca81413SKerry Stevens kerneldatap[i].rownumnz = ii + iStartIndex; 12830ca81413SKerry Stevens kerneldatap[i].numrows = iEndIndex - iStartIndex + 1; 12840ca81413SKerry Stevens kerneldatap[i].specidx = ridx + iStartVal; 12850ca81413SKerry Stevens kerneldatap[i].nzr = 0; 1286cfcfc605SKerry Stevens pdata[i] = &kerneldatap[i]; 12870ca81413SKerry Stevens iindex++; 12880ca81413SKerry Stevens } 1289cfcfc605SKerry Stevens ierr = MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 1290cfcfc605SKerry Stevens /* collect results */ 129151d315f7SKerry Stevens for(i=0; i<iNumThreads; i++) { 1292cfcfc605SKerry Stevens nonzerorow += kerneldatap[i].nzr; 129351d315f7SKerry Stevens } 1294cfcfc605SKerry Stevens free(kerneldatap); 1295cfcfc605SKerry Stevens free(pdata); 129651d315f7SKerry Stevens } 129751d315f7SKerry Stevens else { 129851d315f7SKerry Stevens #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 129951d315f7SKerry Stevens fortranmultaij_(&m,x,a->i,a->j,a->a,y); 130051d315f7SKerry Stevens #else 130151d315f7SKerry Stevens PetscInt i,iindex; 130251d315f7SKerry Stevens const MatScalar *aa = a->a; 130351d315f7SKerry Stevens const PetscInt *aj = a->j,*ii = a->i; 13040c74a584SJed Brown const PetscInt iNumThreads = PetscMaxThreads; /* this number could be different */ 130551d315f7SKerry Stevens PetscInt Q = m/iNumThreads; 130651d315f7SKerry Stevens PetscInt R = m-Q*iNumThreads; 130751d315f7SKerry Stevens PetscBool S; 130851d315f7SKerry Stevens 130951d315f7SKerry Stevens MatMult_KernelData* kerneldatap = (MatMult_KernelData*)malloc(iNumThreads*sizeof(MatMult_KernelData)); 131051d315f7SKerry Stevens MatMult_KernelData** pdata = (MatMult_KernelData**)malloc(iNumThreads*sizeof(MatMult_KernelData*)); 131151d315f7SKerry Stevens 131251d315f7SKerry Stevens iindex = 0; 131351d315f7SKerry Stevens for(i=0; i<iNumThreads;i++) { 1314b50af74fSBarry Smith S = (PetscBool)(i<R); 131551d315f7SKerry Stevens kerneldatap[i].matdata = aa; 131651d315f7SKerry Stevens kerneldatap[i].vecdata = x; 131751d315f7SKerry Stevens kerneldatap[i].vecout = y; 131851d315f7SKerry Stevens kerneldatap[i].colindnz = aj; 131951d315f7SKerry Stevens kerneldatap[i].rownumnz = ii + iindex; 132051d315f7SKerry Stevens kerneldatap[i].numrows = S?Q+1:Q; 132151d315f7SKerry Stevens kerneldatap[i].specidx = PETSC_NULL; 13220c74a584SJed Brown kerneldatap[i].nzr = iindex; /* serves as the 'base' row (needed to access correctly into output vector y) */ 132351d315f7SKerry Stevens pdata[i] = &kerneldatap[i]; 132451d315f7SKerry Stevens iindex += kerneldatap[i].numrows; 132551d315f7SKerry Stevens } 13260ca81413SKerry Stevens MainJob(MatMult_Kernel,(void**)pdata,iNumThreads); 13270c74a584SJed Brown /* collect results */ 13280ca81413SKerry Stevens for(i=0; i<iNumThreads; i++) { 13290ca81413SKerry Stevens nonzerorow += kerneldatap[i].nzr; 13300ca81413SKerry Stevens } 133151d315f7SKerry Stevens free(kerneldatap); 133251d315f7SKerry Stevens free(pdata); 13330ca81413SKerry Stevens #endif 13340ca81413SKerry Stevens } 13350ca81413SKerry Stevens 13360ca81413SKerry Stevens ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 13370ca81413SKerry Stevens ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13380ca81413SKerry Stevens ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13390ca81413SKerry Stevens PetscFunctionReturn(0); 13400ca81413SKerry Stevens } 13410c74a584SJed Brown /* ******************* */ 1342ba61063dSBarry Smith #endif 13430ca81413SKerry Stevens 1344c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 13454a2ae208SSatish Balay #undef __FUNCT__ 13464a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqAIJ" 1347dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 134817ab2063SBarry Smith { 1349416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1350f15663dcSBarry Smith PetscScalar *y,*z; 1351f15663dcSBarry Smith const PetscScalar *x; 135254f21887SBarry Smith const MatScalar *aa; 1353dfbe8321SBarry Smith PetscErrorCode ierr; 1354d0f46423SBarry Smith PetscInt m = A->rmap->n,*aj,*ii; 1355f15663dcSBarry Smith PetscInt n,i,*ridx=PETSC_NULL; 1356362ced78SSatish Balay PetscScalar sum; 1357ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 13589ea0dfa2SSatish Balay 13593a40ed3dSBarry Smith PetscFunctionBegin; 1360f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13611ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13622e8a6d31SBarry Smith if (zz != yy) { 13631ebc52fbSHong Zhang ierr = VecGetArray(zz,&z);CHKERRQ(ierr); 13642e8a6d31SBarry Smith } else { 13652e8a6d31SBarry Smith z = y; 13662e8a6d31SBarry Smith } 1367bfeeae90SHong Zhang 136897952fefSHong Zhang aj = a->j; 136997952fefSHong Zhang aa = a->a; 1370cddf8d76SBarry Smith ii = a->i; 13714eb6d288SHong Zhang if (usecprow){ /* use compressed row format */ 13724eb6d288SHong Zhang if (zz != yy){ 13734eb6d288SHong Zhang ierr = PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 13744eb6d288SHong Zhang } 137597952fefSHong Zhang m = a->compressedrow.nrows; 137697952fefSHong Zhang ii = a->compressedrow.i; 137797952fefSHong Zhang ridx = a->compressedrow.rindex; 137897952fefSHong Zhang for (i=0; i<m; i++){ 137997952fefSHong Zhang n = ii[i+1] - ii[i]; 138097952fefSHong Zhang aj = a->j + ii[i]; 138197952fefSHong Zhang aa = a->a + ii[i]; 138297952fefSHong Zhang sum = y[*ridx]; 1383f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 138497952fefSHong Zhang z[*ridx++] = sum; 138597952fefSHong Zhang } 138697952fefSHong Zhang } else { /* do not use compressed row format */ 1387f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 1388f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1389f15663dcSBarry Smith #else 139017ab2063SBarry Smith for (i=0; i<m; i++) { 1391f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1392f15663dcSBarry Smith aj = a->j + ii[i]; 1393f15663dcSBarry Smith aa = a->a + ii[i]; 139417ab2063SBarry Smith sum = y[i]; 1395f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 139617ab2063SBarry Smith z[i] = sum; 139717ab2063SBarry Smith } 139802ab625aSSatish Balay #endif 1399f15663dcSBarry Smith } 1400dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1401f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 14021ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 14032e8a6d31SBarry Smith if (zz != yy) { 14041ebc52fbSHong Zhang ierr = VecRestoreArray(zz,&z);CHKERRQ(ierr); 14052e8a6d31SBarry Smith } 14068154be41SBarry Smith #if defined(PETSC_HAVE_CUSP) 14076b375ea7SVictor Minden /* 1408918e98c3SVictor Minden ierr = VecView(xx,0);CHKERRQ(ierr); 1409918e98c3SVictor Minden ierr = VecView(zz,0);CHKERRQ(ierr); 1410918e98c3SVictor Minden ierr = MatView(A,0);CHKERRQ(ierr); 14116b375ea7SVictor Minden */ 1412918e98c3SVictor Minden #endif 14133a40ed3dSBarry Smith PetscFunctionReturn(0); 141417ab2063SBarry Smith } 141517ab2063SBarry Smith 141617ab2063SBarry Smith /* 141717ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 141817ab2063SBarry Smith */ 14194a2ae208SSatish Balay #undef __FUNCT__ 14204a2ae208SSatish Balay #define __FUNCT__ "MatMarkDiagonal_SeqAIJ" 1421dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 142217ab2063SBarry Smith { 1423416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14246849ba73SBarry Smith PetscErrorCode ierr; 1425d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 142617ab2063SBarry Smith 14273a40ed3dSBarry Smith PetscFunctionBegin; 142809f38230SBarry Smith if (!a->diag) { 142909f38230SBarry Smith ierr = PetscMalloc(m*sizeof(PetscInt),&a->diag);CHKERRQ(ierr); 14309518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(A, m*sizeof(PetscInt));CHKERRQ(ierr); 143109f38230SBarry Smith } 1432d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 143309f38230SBarry Smith a->diag[i] = a->i[i+1]; 1434bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1435bfeeae90SHong Zhang if (a->j[j] == i) { 143609f38230SBarry Smith a->diag[i] = j; 143717ab2063SBarry Smith break; 143817ab2063SBarry Smith } 143917ab2063SBarry Smith } 144017ab2063SBarry Smith } 14413a40ed3dSBarry Smith PetscFunctionReturn(0); 144217ab2063SBarry Smith } 144317ab2063SBarry Smith 1444be5855fcSBarry Smith /* 1445be5855fcSBarry Smith Checks for missing diagonals 1446be5855fcSBarry Smith */ 14474a2ae208SSatish Balay #undef __FUNCT__ 14484a2ae208SSatish Balay #define __FUNCT__ "MatMissingDiagonal_SeqAIJ" 1449ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1450be5855fcSBarry Smith { 1451be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 145297f1f81fSBarry Smith PetscInt *diag,*jj = a->j,i; 1453be5855fcSBarry Smith 1454be5855fcSBarry Smith PetscFunctionBegin; 145509f38230SBarry Smith *missing = PETSC_FALSE; 1456d0f46423SBarry Smith if (A->rmap->n > 0 && !jj) { 145709f38230SBarry Smith *missing = PETSC_TRUE; 145809f38230SBarry Smith if (d) *d = 0; 145909f38230SBarry Smith PetscInfo(A,"Matrix has no entries therefor is missing diagonal"); 146009f38230SBarry Smith } else { 1461f1e2ffcdSBarry Smith diag = a->diag; 1462d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1463bfeeae90SHong Zhang if (jj[diag[i]] != i) { 146409f38230SBarry Smith *missing = PETSC_TRUE; 146509f38230SBarry Smith if (d) *d = i; 146609f38230SBarry Smith PetscInfo1(A,"Matrix is missing diagonal number %D",i); 146709f38230SBarry Smith } 1468be5855fcSBarry Smith } 1469be5855fcSBarry Smith } 1470be5855fcSBarry Smith PetscFunctionReturn(0); 1471be5855fcSBarry Smith } 1472be5855fcSBarry Smith 147371f1c65dSBarry Smith EXTERN_C_BEGIN 147471f1c65dSBarry Smith #undef __FUNCT__ 147571f1c65dSBarry Smith #define __FUNCT__ "MatInvertDiagonal_SeqAIJ" 14767087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 147771f1c65dSBarry Smith { 147871f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 147971f1c65dSBarry Smith PetscErrorCode ierr; 1480d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 148154f21887SBarry Smith MatScalar *v = a->a; 148254f21887SBarry Smith PetscScalar *idiag,*mdiag; 148371f1c65dSBarry Smith 148471f1c65dSBarry Smith PetscFunctionBegin; 148571f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 148671f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 148771f1c65dSBarry Smith diag = a->diag; 148871f1c65dSBarry Smith if (!a->idiag) { 148971f1c65dSBarry Smith ierr = PetscMalloc3(m,PetscScalar,&a->idiag,m,PetscScalar,&a->mdiag,m,PetscScalar,&a->ssor_work);CHKERRQ(ierr); 149071f1c65dSBarry Smith ierr = PetscLogObjectMemory(A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 149171f1c65dSBarry Smith v = a->a; 149271f1c65dSBarry Smith } 149371f1c65dSBarry Smith mdiag = a->mdiag; 149471f1c65dSBarry Smith idiag = a->idiag; 149571f1c65dSBarry Smith 1496028cd4eaSSatish Balay if (omega == 1.0 && !PetscAbsScalar(fshift)) { 149771f1c65dSBarry Smith for (i=0; i<m; i++) { 149871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1499e32f2f54SBarry Smith if (!PetscAbsScalar(mdiag[i])) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 150071f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 150171f1c65dSBarry Smith } 150271f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 150371f1c65dSBarry Smith } else { 150471f1c65dSBarry Smith for (i=0; i<m; i++) { 150571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 150671f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 150771f1c65dSBarry Smith } 1508dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*m);CHKERRQ(ierr); 150971f1c65dSBarry Smith } 151071f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 151171f1c65dSBarry Smith PetscFunctionReturn(0); 151271f1c65dSBarry Smith } 15135a9745a3SMatthew Knepley EXTERN_C_END 151471f1c65dSBarry Smith 1515c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 15164a2ae208SSatish Balay #undef __FUNCT__ 151741f059aeSBarry Smith #define __FUNCT__ "MatSOR_SeqAIJ" 151841f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 151917ab2063SBarry Smith { 1520416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1521e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 1522e6d1f457SBarry Smith const MatScalar *v = a->a,*idiag=0,*mdiag; 152354f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1524dfbe8321SBarry Smith PetscErrorCode ierr; 1525d0f46423SBarry Smith PetscInt n = A->cmap->n,m = A->rmap->n,i; 152697f1f81fSBarry Smith const PetscInt *idx,*diag; 152717ab2063SBarry Smith 15283a40ed3dSBarry Smith PetscFunctionBegin; 1529b965ef7fSBarry Smith its = its*lits; 153091723122SBarry Smith 153171f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 153271f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 153371f1c65dSBarry Smith a->fshift = fshift; 153471f1c65dSBarry Smith a->omega = omega; 1535ed480e8bSBarry Smith 153671f1c65dSBarry Smith diag = a->diag; 153771f1c65dSBarry Smith t = a->ssor_work; 1538ed480e8bSBarry Smith idiag = a->idiag; 153971f1c65dSBarry Smith mdiag = a->mdiag; 1540ed480e8bSBarry Smith 15411ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 15423649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 154371f1c65dSBarry Smith CHKMEMQ; 1544ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 154517ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 154617ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1547ed480e8bSBarry Smith bs = b; 154817ab2063SBarry Smith for (i=0; i<m; i++) { 154971f1c65dSBarry Smith d = fshift + mdiag[i]; 1550416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1551ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1552ed480e8bSBarry Smith v = a->a + diag[i] + 1; 155317ab2063SBarry Smith sum = b[i]*d/omega; 1554003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 155517ab2063SBarry Smith x[i] = sum; 155617ab2063SBarry Smith } 15571ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 15583649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1559efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 15603a40ed3dSBarry Smith PetscFunctionReturn(0); 156117ab2063SBarry Smith } 1562c783ea89SBarry Smith 156348af12d7SBarry Smith if (flag == SOR_APPLY_LOWER) { 1564e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 15653a40ed3dSBarry Smith } else if (flag & SOR_EISENSTAT) { 156617ab2063SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 1567887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 156817ab2063SBarry Smith 156917ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 157017ab2063SBarry Smith 1571887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 157217ab2063SBarry Smith */ 157317ab2063SBarry Smith scale = (2.0/omega) - 1.0; 157417ab2063SBarry Smith 157517ab2063SBarry Smith /* x = (E + U)^{-1} b */ 157617ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1577416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1578ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1579ed480e8bSBarry Smith v = a->a + diag[i] + 1; 158017ab2063SBarry Smith sum = b[i]; 1581e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1582ed480e8bSBarry Smith x[i] = sum*idiag[i]; 158317ab2063SBarry Smith } 158417ab2063SBarry Smith 158517ab2063SBarry Smith /* t = b - (2*E - D)x */ 1586416022c9SBarry Smith v = a->a; 1587ed480e8bSBarry Smith for (i=0; i<m; i++) { t[i] = b[i] - scale*(v[*diag++])*x[i]; } 158817ab2063SBarry Smith 158917ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1590ed480e8bSBarry Smith ts = t; 1591416022c9SBarry Smith diag = a->diag; 159217ab2063SBarry Smith for (i=0; i<m; i++) { 1593416022c9SBarry Smith n = diag[i] - a->i[i]; 1594ed480e8bSBarry Smith idx = a->j + a->i[i]; 1595ed480e8bSBarry Smith v = a->a + a->i[i]; 159617ab2063SBarry Smith sum = t[i]; 1597003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1598ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1599733d66baSBarry Smith /* x = x + t */ 1600733d66baSBarry Smith x[i] += t[i]; 160117ab2063SBarry Smith } 160217ab2063SBarry Smith 1603dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 16041ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 16053649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 16063a40ed3dSBarry Smith PetscFunctionReturn(0); 160717ab2063SBarry Smith } 160817ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 160917ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 161017ab2063SBarry Smith for (i=0; i<m; i++) { 1611416022c9SBarry Smith n = diag[i] - a->i[i]; 1612ed480e8bSBarry Smith idx = a->j + a->i[i]; 1613ed480e8bSBarry Smith v = a->a + a->i[i]; 161417ab2063SBarry Smith sum = b[i]; 1615e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16165c99c7daSBarry Smith t[i] = sum; 1617ed480e8bSBarry Smith x[i] = sum*idiag[i]; 161817ab2063SBarry Smith } 16195c99c7daSBarry Smith xb = t; 1620efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 16213a40ed3dSBarry Smith } else xb = b; 162217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 162317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1624416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1625ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1626ed480e8bSBarry Smith v = a->a + diag[i] + 1; 162717ab2063SBarry Smith sum = xb[i]; 1628e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 16295c99c7daSBarry Smith if (xb == b) { 1630ed480e8bSBarry Smith x[i] = sum*idiag[i]; 16315c99c7daSBarry Smith } else { 16325c99c7daSBarry Smith x[i] = (1-omega)*x[i] + sum*idiag[i]; 163317ab2063SBarry Smith } 16345c99c7daSBarry Smith } 1635efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 163617ab2063SBarry Smith } 163717ab2063SBarry Smith its--; 163817ab2063SBarry Smith } 163917ab2063SBarry Smith while (its--) { 164017ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 164117ab2063SBarry Smith for (i=0; i<m; i++) { 1642416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1643ed480e8bSBarry Smith idx = a->j + a->i[i]; 1644ed480e8bSBarry Smith v = a->a + a->i[i]; 164517ab2063SBarry Smith sum = b[i]; 1646e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1647ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 164817ab2063SBarry Smith } 16499f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 165017ab2063SBarry Smith } 165117ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 165217ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1653416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1654ed480e8bSBarry Smith idx = a->j + a->i[i]; 1655ed480e8bSBarry Smith v = a->a + a->i[i]; 165617ab2063SBarry Smith sum = b[i]; 1657e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1658ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 165917ab2063SBarry Smith } 16609f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 166117ab2063SBarry Smith } 166217ab2063SBarry Smith } 16631ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 16643649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 166571f1c65dSBarry Smith CHKMEMQ; PetscFunctionReturn(0); 166617ab2063SBarry Smith } 166717ab2063SBarry Smith 16682af78befSBarry Smith 16694a2ae208SSatish Balay #undef __FUNCT__ 16704a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqAIJ" 1671dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 167217ab2063SBarry Smith { 1673416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16744e220ebcSLois Curfman McInnes 16753a40ed3dSBarry Smith PetscFunctionBegin; 16764e220ebcSLois Curfman McInnes info->block_size = 1.0; 16774e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 16784e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 16794e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 16804e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 16818e58a170SBarry Smith info->mallocs = (double)A->info.mallocs; 16827adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 1683d5f3da31SBarry Smith if (A->factortype) { 16844e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 16854e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 16864e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 16874e220ebcSLois Curfman McInnes } else { 16884e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 16894e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 16904e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 16914e220ebcSLois Curfman McInnes } 16923a40ed3dSBarry Smith PetscFunctionReturn(0); 169317ab2063SBarry Smith } 169417ab2063SBarry Smith 16954a2ae208SSatish Balay #undef __FUNCT__ 16964a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqAIJ" 16972b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 169817ab2063SBarry Smith { 1699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17003b98c0a2SBarry Smith PetscInt i,m = A->rmap->n - 1,d = 0; 17016849ba73SBarry Smith PetscErrorCode ierr; 170297b48c8fSBarry Smith const PetscScalar *xx; 170397b48c8fSBarry Smith PetscScalar *bb; 1704ace3abfcSBarry Smith PetscBool missing; 170517ab2063SBarry Smith 17063a40ed3dSBarry Smith PetscFunctionBegin; 170797b48c8fSBarry Smith if (x && b) { 170897b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 170997b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 171097b48c8fSBarry Smith for (i=0; i<N; i++) { 171197b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 171297b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 171397b48c8fSBarry Smith } 171497b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 171597b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 171697b48c8fSBarry Smith } 171797b48c8fSBarry Smith 1718a9817697SBarry Smith if (a->keepnonzeropattern) { 1719f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1720e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1721bfeeae90SHong Zhang ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 1722f1e2ffcdSBarry Smith } 1723f4df32b1SMatthew Knepley if (diag != 0.0) { 172409f38230SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 1725e32f2f54SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 1726f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1727f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 1728f1e2ffcdSBarry Smith } 1729f1e2ffcdSBarry Smith } 173088e51ccdSHong Zhang A->same_nonzero = PETSC_TRUE; 1731f1e2ffcdSBarry Smith } else { 1732f4df32b1SMatthew Knepley if (diag != 0.0) { 173317ab2063SBarry Smith for (i=0; i<N; i++) { 1734e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17357ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 1736416022c9SBarry Smith a->ilen[rows[i]] = 1; 1737f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 1738bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 17397ae801bdSBarry Smith } else { /* in case row was completely empty */ 1740f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 174117ab2063SBarry Smith } 174217ab2063SBarry Smith } 17433a40ed3dSBarry Smith } else { 174417ab2063SBarry Smith for (i=0; i<N; i++) { 1745e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1746416022c9SBarry Smith a->ilen[rows[i]] = 0; 174717ab2063SBarry Smith } 174817ab2063SBarry Smith } 174988e51ccdSHong Zhang A->same_nonzero = PETSC_FALSE; 1750f1e2ffcdSBarry Smith } 175143a90d84SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17523a40ed3dSBarry Smith PetscFunctionReturn(0); 175317ab2063SBarry Smith } 175417ab2063SBarry Smith 17554a2ae208SSatish Balay #undef __FUNCT__ 17566e169961SBarry Smith #define __FUNCT__ "MatZeroRowsColumns_SeqAIJ" 17576e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17586e169961SBarry Smith { 17596e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17606e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 17616e169961SBarry Smith PetscErrorCode ierr; 17622b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 17636e169961SBarry Smith const PetscScalar *xx; 17646e169961SBarry Smith PetscScalar *bb; 17656e169961SBarry Smith 17666e169961SBarry Smith PetscFunctionBegin; 17676e169961SBarry Smith if (x && b) { 17686e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 17696e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17702b40b63fSBarry Smith vecs = PETSC_TRUE; 17716e169961SBarry Smith } 17726e169961SBarry Smith ierr = PetscMalloc(A->rmap->n*sizeof(PetscBool),&zeroed);CHKERRQ(ierr); 17736e169961SBarry Smith ierr = PetscMemzero(zeroed,A->rmap->n*sizeof(PetscBool));CHKERRQ(ierr); 17746e169961SBarry Smith for (i=0; i<N; i++) { 17756e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 17766e169961SBarry Smith ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 17776e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 17786e169961SBarry Smith } 17796e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 17806e169961SBarry Smith if (!zeroed[i]) { 17816e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 17826e169961SBarry Smith if (zeroed[a->j[j]]) { 17832b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 17846e169961SBarry Smith a->a[j] = 0.0; 17856e169961SBarry Smith } 17866e169961SBarry Smith } 17872b40b63fSBarry Smith } else if (vecs) bb[i] = diag*xx[i]; 17886e169961SBarry Smith } 17896e169961SBarry Smith if (x && b) { 17906e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 17916e169961SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 17926e169961SBarry Smith } 17936e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 17946e169961SBarry Smith if (diag != 0.0) { 17956e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 17966e169961SBarry Smith if (missing) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D",d); 17976e169961SBarry Smith for (i=0; i<N; i++) { 17986e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 17996e169961SBarry Smith } 18006e169961SBarry Smith } 18016e169961SBarry Smith A->same_nonzero = PETSC_TRUE; 18026e169961SBarry Smith ierr = MatAssemblyEnd_SeqAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18036e169961SBarry Smith PetscFunctionReturn(0); 18046e169961SBarry Smith } 18056e169961SBarry Smith 18066e169961SBarry Smith #undef __FUNCT__ 18074a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqAIJ" 1808a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 180917ab2063SBarry Smith { 1810416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 181197f1f81fSBarry Smith PetscInt *itmp; 181217ab2063SBarry Smith 18133a40ed3dSBarry Smith PetscFunctionBegin; 1814e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 181517ab2063SBarry Smith 1816416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 1817bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 181817ab2063SBarry Smith if (idx) { 1819bfeeae90SHong Zhang itmp = a->j + a->i[row]; 1820bfeeae90SHong Zhang if (*nz) { 18214e093b46SBarry Smith *idx = itmp; 182217ab2063SBarry Smith } 182317ab2063SBarry Smith else *idx = 0; 182417ab2063SBarry Smith } 18253a40ed3dSBarry Smith PetscFunctionReturn(0); 182617ab2063SBarry Smith } 182717ab2063SBarry Smith 1828bfeeae90SHong Zhang /* remove this function? */ 18294a2ae208SSatish Balay #undef __FUNCT__ 18304a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqAIJ" 1831a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 183217ab2063SBarry Smith { 18333a40ed3dSBarry Smith PetscFunctionBegin; 18343a40ed3dSBarry Smith PetscFunctionReturn(0); 183517ab2063SBarry Smith } 183617ab2063SBarry Smith 18374a2ae208SSatish Balay #undef __FUNCT__ 18384a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqAIJ" 1839dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 184017ab2063SBarry Smith { 1841416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 184254f21887SBarry Smith MatScalar *v = a->a; 184336db0b34SBarry Smith PetscReal sum = 0.0; 18446849ba73SBarry Smith PetscErrorCode ierr; 184597f1f81fSBarry Smith PetscInt i,j; 184617ab2063SBarry Smith 18473a40ed3dSBarry Smith PetscFunctionBegin; 184817ab2063SBarry Smith if (type == NORM_FROBENIUS) { 1849416022c9SBarry Smith for (i=0; i<a->nz; i++) { 1850aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 185136db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 185217ab2063SBarry Smith #else 185317ab2063SBarry Smith sum += (*v)*(*v); v++; 185417ab2063SBarry Smith #endif 185517ab2063SBarry Smith } 18568f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 18573a40ed3dSBarry Smith } else if (type == NORM_1) { 185836db0b34SBarry Smith PetscReal *tmp; 185997f1f81fSBarry Smith PetscInt *jj = a->j; 1860d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscReal),&tmp);CHKERRQ(ierr); 1861d0f46423SBarry Smith ierr = PetscMemzero(tmp,A->cmap->n*sizeof(PetscReal));CHKERRQ(ierr); 1862064f8208SBarry Smith *nrm = 0.0; 1863416022c9SBarry Smith for (j=0; j<a->nz; j++) { 1864bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 186517ab2063SBarry Smith } 1866d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1867064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 186817ab2063SBarry Smith } 1869606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 18703a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1871064f8208SBarry Smith *nrm = 0.0; 1872d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1873bfeeae90SHong Zhang v = a->a + a->i[j]; 187417ab2063SBarry Smith sum = 0.0; 1875416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 1876cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 187717ab2063SBarry Smith } 1878064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 187917ab2063SBarry Smith } 18803a40ed3dSBarry Smith } else { 1881e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 188217ab2063SBarry Smith } 18833a40ed3dSBarry Smith PetscFunctionReturn(0); 188417ab2063SBarry Smith } 188517ab2063SBarry Smith 18864a2ae208SSatish Balay #undef __FUNCT__ 18874a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqAIJ" 1888fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqAIJ(Mat A,MatReuse reuse,Mat *B) 188917ab2063SBarry Smith { 1890416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1891416022c9SBarry Smith Mat C; 18926849ba73SBarry Smith PetscErrorCode ierr; 1893d0f46423SBarry Smith PetscInt i,*aj = a->j,*ai = a->i,m = A->rmap->n,len,*col; 189454f21887SBarry Smith MatScalar *array = a->a; 189517ab2063SBarry Smith 18963a40ed3dSBarry Smith PetscFunctionBegin; 1897e32f2f54SBarry Smith if (reuse == MAT_REUSE_MATRIX && A == *B && m != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Square matrix only for in-place"); 1898fc4dec0aSBarry Smith 1899fc4dec0aSBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B == A) { 1900d0f46423SBarry Smith ierr = PetscMalloc((1+A->cmap->n)*sizeof(PetscInt),&col);CHKERRQ(ierr); 1901d0f46423SBarry Smith ierr = PetscMemzero(col,(1+A->cmap->n)*sizeof(PetscInt));CHKERRQ(ierr); 1902bfeeae90SHong Zhang 1903bfeeae90SHong Zhang for (i=0; i<ai[m]; i++) col[aj[i]] += 1; 19047adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 1905d0f46423SBarry Smith ierr = MatSetSizes(C,A->cmap->n,m,A->cmap->n,m);CHKERRQ(ierr); 19067adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 1907ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,col);CHKERRQ(ierr); 1908606d414cSSatish Balay ierr = PetscFree(col);CHKERRQ(ierr); 1909a541d17aSBarry Smith } else { 1910a541d17aSBarry Smith C = *B; 1911a541d17aSBarry Smith } 1912a541d17aSBarry Smith 191317ab2063SBarry Smith for (i=0; i<m; i++) { 191417ab2063SBarry Smith len = ai[i+1]-ai[i]; 191587d4246cSBarry Smith ierr = MatSetValues_SeqAIJ(C,len,aj,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 1916b9b97703SBarry Smith array += len; 1917b9b97703SBarry Smith aj += len; 191817ab2063SBarry Smith } 19196d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19206d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 192117ab2063SBarry Smith 1922815cbec1SBarry Smith if (reuse == MAT_INITIAL_MATRIX || *B != A) { 1923416022c9SBarry Smith *B = C; 192417ab2063SBarry Smith } else { 1925eb6b5d47SBarry Smith ierr = MatHeaderMerge(A,C);CHKERRQ(ierr); 192617ab2063SBarry Smith } 19273a40ed3dSBarry Smith PetscFunctionReturn(0); 192817ab2063SBarry Smith } 192917ab2063SBarry Smith 1930cd0d46ebSvictorle EXTERN_C_BEGIN 1931cd0d46ebSvictorle #undef __FUNCT__ 19325fbd3699SBarry Smith #define __FUNCT__ "MatIsTranspose_SeqAIJ" 19337087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 1934cd0d46ebSvictorle { 1935cd0d46ebSvictorle Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 193654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 193754f21887SBarry Smith MatScalar *va,*vb; 19386849ba73SBarry Smith PetscErrorCode ierr; 193997f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 1940cd0d46ebSvictorle 1941cd0d46ebSvictorle PetscFunctionBegin; 1942cd0d46ebSvictorle bij = (Mat_SeqAIJ *) B->data; 1943cd0d46ebSvictorle 1944cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 1945cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 19465485867bSBarry Smith if (ma!=nb || na!=mb){ 19475485867bSBarry Smith *f = PETSC_FALSE; 19485485867bSBarry Smith PetscFunctionReturn(0); 19495485867bSBarry Smith } 1950cd0d46ebSvictorle aii = aij->i; bii = bij->i; 1951cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 1952cd0d46ebSvictorle va = aij->a; vb = bij->a; 195397f1f81fSBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 195497f1f81fSBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 1955cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 1956cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 1957cd0d46ebSvictorle 1958cd0d46ebSvictorle *f = PETSC_TRUE; 1959cd0d46ebSvictorle for (i=0; i<ma; i++) { 1960cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 196197f1f81fSBarry Smith PetscInt idc,idr; 19625485867bSBarry Smith PetscScalar vc,vr; 1963cd0d46ebSvictorle /* column/row index/value */ 19645485867bSBarry Smith idc = adx[aptr[i]]; 19655485867bSBarry Smith idr = bdx[bptr[idc]]; 19665485867bSBarry Smith vc = va[aptr[i]]; 19675485867bSBarry Smith vr = vb[bptr[idc]]; 19685485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 19695485867bSBarry Smith *f = PETSC_FALSE; 19705485867bSBarry Smith goto done; 1971cd0d46ebSvictorle } else { 19725485867bSBarry Smith aptr[i]++; 19735485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 1974cd0d46ebSvictorle } 1975cd0d46ebSvictorle } 1976cd0d46ebSvictorle } 1977cd0d46ebSvictorle done: 1978cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 19793aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 1980cd0d46ebSvictorle PetscFunctionReturn(0); 1981cd0d46ebSvictorle } 1982cd0d46ebSvictorle EXTERN_C_END 1983cd0d46ebSvictorle 19841cbb95d3SBarry Smith EXTERN_C_BEGIN 19851cbb95d3SBarry Smith #undef __FUNCT__ 19861cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitianTranspose_SeqAIJ" 19877087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 19881cbb95d3SBarry Smith { 19891cbb95d3SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *) A->data,*bij = (Mat_SeqAIJ*) A->data; 199054f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 199154f21887SBarry Smith MatScalar *va,*vb; 19921cbb95d3SBarry Smith PetscErrorCode ierr; 19931cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 19941cbb95d3SBarry Smith 19951cbb95d3SBarry Smith PetscFunctionBegin; 19961cbb95d3SBarry Smith bij = (Mat_SeqAIJ *) B->data; 19971cbb95d3SBarry Smith 19981cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 19991cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 20001cbb95d3SBarry Smith if (ma!=nb || na!=mb){ 20011cbb95d3SBarry Smith *f = PETSC_FALSE; 20021cbb95d3SBarry Smith PetscFunctionReturn(0); 20031cbb95d3SBarry Smith } 20041cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 20051cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 20061cbb95d3SBarry Smith va = aij->a; vb = bij->a; 20071cbb95d3SBarry Smith ierr = PetscMalloc(ma*sizeof(PetscInt),&aptr);CHKERRQ(ierr); 20081cbb95d3SBarry Smith ierr = PetscMalloc(mb*sizeof(PetscInt),&bptr);CHKERRQ(ierr); 20091cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 20101cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 20111cbb95d3SBarry Smith 20121cbb95d3SBarry Smith *f = PETSC_TRUE; 20131cbb95d3SBarry Smith for (i=0; i<ma; i++) { 20141cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 20151cbb95d3SBarry Smith PetscInt idc,idr; 20161cbb95d3SBarry Smith PetscScalar vc,vr; 20171cbb95d3SBarry Smith /* column/row index/value */ 20181cbb95d3SBarry Smith idc = adx[aptr[i]]; 20191cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 20201cbb95d3SBarry Smith vc = va[aptr[i]]; 20211cbb95d3SBarry Smith vr = vb[bptr[idc]]; 20221cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 20231cbb95d3SBarry Smith *f = PETSC_FALSE; 20241cbb95d3SBarry Smith goto done; 20251cbb95d3SBarry Smith } else { 20261cbb95d3SBarry Smith aptr[i]++; 20271cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 20281cbb95d3SBarry Smith } 20291cbb95d3SBarry Smith } 20301cbb95d3SBarry Smith } 20311cbb95d3SBarry Smith done: 20321cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 20331cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 20341cbb95d3SBarry Smith PetscFunctionReturn(0); 20351cbb95d3SBarry Smith } 20361cbb95d3SBarry Smith EXTERN_C_END 20371cbb95d3SBarry Smith 20389e29f15eSvictorle #undef __FUNCT__ 20399e29f15eSvictorle #define __FUNCT__ "MatIsSymmetric_SeqAIJ" 2040ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20419e29f15eSvictorle { 2042dfbe8321SBarry Smith PetscErrorCode ierr; 20439e29f15eSvictorle PetscFunctionBegin; 20445485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20459e29f15eSvictorle PetscFunctionReturn(0); 20469e29f15eSvictorle } 20479e29f15eSvictorle 20484a2ae208SSatish Balay #undef __FUNCT__ 20491cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitian_SeqAIJ" 2050ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 20511cbb95d3SBarry Smith { 20521cbb95d3SBarry Smith PetscErrorCode ierr; 20531cbb95d3SBarry Smith PetscFunctionBegin; 20541cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 20551cbb95d3SBarry Smith PetscFunctionReturn(0); 20561cbb95d3SBarry Smith } 20571cbb95d3SBarry Smith 20581cbb95d3SBarry Smith #undef __FUNCT__ 20594a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqAIJ" 2060dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 206117ab2063SBarry Smith { 2062416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 206354f21887SBarry Smith PetscScalar *l,*r,x; 206454f21887SBarry Smith MatScalar *v; 2065dfbe8321SBarry Smith PetscErrorCode ierr; 2066d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz,*jj; 206717ab2063SBarry Smith 20683a40ed3dSBarry Smith PetscFunctionBegin; 206917ab2063SBarry Smith if (ll) { 20703ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 20713ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2072e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2073e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 20741ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 2075416022c9SBarry Smith v = a->a; 207617ab2063SBarry Smith for (i=0; i<m; i++) { 207717ab2063SBarry Smith x = l[i]; 2078416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 207917ab2063SBarry Smith for (j=0; j<M; j++) { (*v++) *= x;} 208017ab2063SBarry Smith } 20811ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 2082efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 208317ab2063SBarry Smith } 208417ab2063SBarry Smith if (rr) { 2085e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2086e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 20871ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 2088416022c9SBarry Smith v = a->a; jj = a->j; 208917ab2063SBarry Smith for (i=0; i<nz; i++) { 2090bfeeae90SHong Zhang (*v++) *= r[*jj++]; 209117ab2063SBarry Smith } 20921ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 2093efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 209417ab2063SBarry Smith } 209586c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 209686c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 20973a40ed3dSBarry Smith PetscFunctionReturn(0); 209817ab2063SBarry Smith } 209917ab2063SBarry Smith 21004a2ae208SSatish Balay #undef __FUNCT__ 21014a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqAIJ" 210297f1f81fSBarry Smith PetscErrorCode MatGetSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 210317ab2063SBarry Smith { 2104db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 21056849ba73SBarry Smith PetscErrorCode ierr; 2106d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 210797f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 21085d0c19d7SBarry Smith const PetscInt *irow,*icol; 21095d0c19d7SBarry Smith PetscInt nrows,ncols; 211097f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 211154f21887SBarry Smith MatScalar *a_new,*mat_a; 2112416022c9SBarry Smith Mat C; 2113ace3abfcSBarry Smith PetscBool stride,sorted; 211417ab2063SBarry Smith 21153a40ed3dSBarry Smith PetscFunctionBegin; 211614ca34e6SBarry Smith ierr = ISSorted(isrow,&sorted);CHKERRQ(ierr); 2117e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"ISrow is not sorted"); 211814ca34e6SBarry Smith ierr = ISSorted(iscol,&sorted);CHKERRQ(ierr); 2119e32f2f54SBarry Smith if (!sorted) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"IScol is not sorted"); 212099141d43SSatish Balay 212117ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2122b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2123b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 212417ab2063SBarry Smith 2125fee21e36SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 21260dbe5b1eSSatish Balay ierr = PetscTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2127fee21e36SBarry Smith if (stride && step == 1) { 212802834360SBarry Smith /* special case of contiguous rows */ 21290e83c824SBarry Smith ierr = PetscMalloc2(nrows,PetscInt,&lens,nrows,PetscInt,&starts);CHKERRQ(ierr); 213002834360SBarry Smith /* loop over new rows determining lens and starting points */ 213102834360SBarry Smith for (i=0; i<nrows; i++) { 2132bfeeae90SHong Zhang kstart = ai[irow[i]]; 2133a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 213402834360SBarry Smith for (k=kstart; k<kend; k++) { 2135bfeeae90SHong Zhang if (aj[k] >= first) { 213602834360SBarry Smith starts[i] = k; 213702834360SBarry Smith break; 213802834360SBarry Smith } 213902834360SBarry Smith } 2140a2744918SBarry Smith sum = 0; 214102834360SBarry Smith while (k < kend) { 2142bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2143a2744918SBarry Smith sum++; 214402834360SBarry Smith } 2145a2744918SBarry Smith lens[i] = sum; 214602834360SBarry Smith } 214702834360SBarry Smith /* create submatrix */ 2148cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 214997f1f81fSBarry Smith PetscInt n_cols,n_rows; 215008480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2151e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2152d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 215308480c60SBarry Smith C = *B; 21543a40ed3dSBarry Smith } else { 21557adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2156f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 21577adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2158ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 215908480c60SBarry Smith } 2160db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2161db02288aSLois Curfman McInnes 216202834360SBarry Smith /* loop over rows inserting into submatrix */ 2163db02288aSLois Curfman McInnes a_new = c->a; 2164db02288aSLois Curfman McInnes j_new = c->j; 2165db02288aSLois Curfman McInnes i_new = c->i; 2166bfeeae90SHong Zhang 216702834360SBarry Smith for (i=0; i<nrows; i++) { 2168a2744918SBarry Smith ii = starts[i]; 2169a2744918SBarry Smith lensi = lens[i]; 2170a2744918SBarry Smith for (k=0; k<lensi; k++) { 2171a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 217202834360SBarry Smith } 217387828ca2SBarry Smith ierr = PetscMemcpy(a_new,a->a + starts[i],lensi*sizeof(PetscScalar));CHKERRQ(ierr); 2174a2744918SBarry Smith a_new += lensi; 2175a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2176a2744918SBarry Smith c->ilen[i] = lensi; 217702834360SBarry Smith } 21780e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 21793a40ed3dSBarry Smith } else { 218002834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 21810e83c824SBarry Smith ierr = PetscMalloc(oldcols*sizeof(PetscInt),&smap);CHKERRQ(ierr); 218297f1f81fSBarry Smith ierr = PetscMemzero(smap,oldcols*sizeof(PetscInt));CHKERRQ(ierr); 21830e83c824SBarry Smith ierr = PetscMalloc((1+nrows)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 21844dcab191SBarry Smith for (i=0; i<ncols; i++) { 21854dcab191SBarry Smith #if defined(PETSC_USE_DEBUG) 21864dcab191SBarry Smith if (icol[i] >= oldcols) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D <= A->cmap->n %D",i,icol[i],oldcols); 21874dcab191SBarry Smith #endif 21884dcab191SBarry Smith smap[icol[i]] = i+1; 21894dcab191SBarry Smith } 21904dcab191SBarry Smith 219102834360SBarry Smith /* determine lens of each row */ 219202834360SBarry Smith for (i=0; i<nrows; i++) { 2193bfeeae90SHong Zhang kstart = ai[irow[i]]; 219402834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 219502834360SBarry Smith lens[i] = 0; 219602834360SBarry Smith for (k=kstart; k<kend; k++) { 2197bfeeae90SHong Zhang if (smap[aj[k]]) { 219802834360SBarry Smith lens[i]++; 219902834360SBarry Smith } 220002834360SBarry Smith } 220102834360SBarry Smith } 220217ab2063SBarry Smith /* Create and fill new matrix */ 2203a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2204ace3abfcSBarry Smith PetscBool equal; 22050f5bd95cSBarry Smith 220699141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2207e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2208d0f46423SBarry Smith ierr = PetscMemcmp(c->ilen,lens,(*B)->rmap->n*sizeof(PetscInt),&equal);CHKERRQ(ierr); 22090f5bd95cSBarry Smith if (!equal) { 2210e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 221199141d43SSatish Balay } 2212d0f46423SBarry Smith ierr = PetscMemzero(c->ilen,(*B)->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 221308480c60SBarry Smith C = *B; 22143a40ed3dSBarry Smith } else { 22157adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&C);CHKERRQ(ierr); 2216f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 22177adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2218ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 221908480c60SBarry Smith } 222099141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 222117ab2063SBarry Smith for (i=0; i<nrows; i++) { 222299141d43SSatish Balay row = irow[i]; 2223bfeeae90SHong Zhang kstart = ai[row]; 222499141d43SSatish Balay kend = kstart + a->ilen[row]; 2225bfeeae90SHong Zhang mat_i = c->i[i]; 222699141d43SSatish Balay mat_j = c->j + mat_i; 222799141d43SSatish Balay mat_a = c->a + mat_i; 222899141d43SSatish Balay mat_ilen = c->ilen + i; 222917ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2230bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2231ed480e8bSBarry Smith *mat_j++ = tcol - 1; 223299141d43SSatish Balay *mat_a++ = a->a[k]; 223399141d43SSatish Balay (*mat_ilen)++; 223499141d43SSatish Balay 223517ab2063SBarry Smith } 223617ab2063SBarry Smith } 223717ab2063SBarry Smith } 223802834360SBarry Smith /* Free work space */ 223902834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2240606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2241606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 224202834360SBarry Smith } 22436d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22446d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 224517ab2063SBarry Smith 224617ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2247416022c9SBarry Smith *B = C; 22483a40ed3dSBarry Smith PetscFunctionReturn(0); 224917ab2063SBarry Smith } 225017ab2063SBarry Smith 22511df811f5SHong Zhang #undef __FUNCT__ 225282d44351SHong Zhang #define __FUNCT__ "MatGetMultiProcBlock_SeqAIJ" 225382d44351SHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,Mat* subMat) 225482d44351SHong Zhang { 225582d44351SHong Zhang PetscErrorCode ierr; 225682d44351SHong Zhang Mat B; 225782d44351SHong Zhang 225882d44351SHong Zhang PetscFunctionBegin; 225982d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 226082d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 226182d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 226282d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 226382d44351SHong Zhang *subMat = B; 226482d44351SHong Zhang PetscFunctionReturn(0); 226582d44351SHong Zhang } 226682d44351SHong Zhang 226782d44351SHong Zhang #undef __FUNCT__ 22684a2ae208SSatish Balay #define __FUNCT__ "MatILUFactor_SeqAIJ" 22690481f469SBarry Smith PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2270a871dcd8SBarry Smith { 227163b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2272dfbe8321SBarry Smith PetscErrorCode ierr; 227363b91edcSBarry Smith Mat outA; 2274ace3abfcSBarry Smith PetscBool row_identity,col_identity; 227563b91edcSBarry Smith 22763a40ed3dSBarry Smith PetscFunctionBegin; 2277e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 22781df811f5SHong Zhang 2279b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2280b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2281a871dcd8SBarry Smith 228263b91edcSBarry Smith outA = inA; 2283d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2284c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 22856bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 2286c3122656SLisandro Dalcin a->row = row; 2287c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 22886bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 2289c3122656SLisandro Dalcin a->col = col; 229063b91edcSBarry Smith 229136db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 22926bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 22934c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 229452e6d16bSBarry Smith ierr = PetscLogObjectParent(inA,a->icol);CHKERRQ(ierr); 2295f0ec6fceSSatish Balay 229694a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2297d0f46423SBarry Smith ierr = PetscMalloc((inA->rmap->n+1)*sizeof(PetscScalar),&a->solve_work);CHKERRQ(ierr); 2298d0f46423SBarry Smith ierr = PetscLogObjectMemory(inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 229994a9d846SBarry Smith } 230063b91edcSBarry Smith 2301f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2302137fb511SHong Zhang if (row_identity && col_identity) { 2303ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2304137fb511SHong Zhang } else { 2305719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2306137fb511SHong Zhang } 23073a40ed3dSBarry Smith PetscFunctionReturn(0); 2308a871dcd8SBarry Smith } 2309a871dcd8SBarry Smith 23104a2ae208SSatish Balay #undef __FUNCT__ 23114a2ae208SSatish Balay #define __FUNCT__ "MatScale_SeqAIJ" 2312f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2313f0b747eeSBarry Smith { 2314f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2315f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2316efee365bSSatish Balay PetscErrorCode ierr; 23170805154bSBarry Smith PetscBLASInt one = 1,bnz = PetscBLASIntCast(a->nz); 23183a40ed3dSBarry Smith 23193a40ed3dSBarry Smith PetscFunctionBegin; 2320f4df32b1SMatthew Knepley BLASscal_(&bnz,&oalpha,a->a,&one); 2321efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 232286c113feSBarry Smith a->idiagvalid = PETSC_FALSE; 232386c113feSBarry Smith a->ibdiagvalid = PETSC_FALSE; 23243a40ed3dSBarry Smith PetscFunctionReturn(0); 2325f0b747eeSBarry Smith } 2326f0b747eeSBarry Smith 23274a2ae208SSatish Balay #undef __FUNCT__ 23284a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqAIJ" 232997f1f81fSBarry Smith PetscErrorCode MatGetSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2330cddf8d76SBarry Smith { 2331dfbe8321SBarry Smith PetscErrorCode ierr; 233297f1f81fSBarry Smith PetscInt i; 2333cddf8d76SBarry Smith 23343a40ed3dSBarry Smith PetscFunctionBegin; 2335cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2336b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 2337cddf8d76SBarry Smith } 2338cddf8d76SBarry Smith 2339cddf8d76SBarry Smith for (i=0; i<n; i++) { 23406a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2341cddf8d76SBarry Smith } 23423a40ed3dSBarry Smith PetscFunctionReturn(0); 2343cddf8d76SBarry Smith } 2344cddf8d76SBarry Smith 23454a2ae208SSatish Balay #undef __FUNCT__ 23464a2ae208SSatish Balay #define __FUNCT__ "MatIncreaseOverlap_SeqAIJ" 234797f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 23484dcbc457SBarry Smith { 2349e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23506849ba73SBarry Smith PetscErrorCode ierr; 23515d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 23525d0c19d7SBarry Smith const PetscInt *idx; 235397f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2354f1af5d2fSBarry Smith PetscBT table; 2355bbd702dbSSatish Balay 23563a40ed3dSBarry Smith PetscFunctionBegin; 2357d0f46423SBarry Smith m = A->rmap->n; 2358e4d965acSSatish Balay ai = a->i; 2359bfeeae90SHong Zhang aj = a->j; 23608a047759SSatish Balay 2361e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 236206763907SSatish Balay 236397f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&nidx);CHKERRQ(ierr); 23646831982aSBarry Smith ierr = PetscBTCreate(m,table);CHKERRQ(ierr); 236506763907SSatish Balay 2366e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2367b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2368e4d965acSSatish Balay isz = 0; 23696831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2370e4d965acSSatish Balay 2371e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 23724dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2373b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2374e4d965acSSatish Balay 2375dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2376e4d965acSSatish Balay for (j=0; j<n ; ++j){ 2377f1af5d2fSBarry Smith if(!PetscBTLookupSet(table,idx[j])) { nidx[isz++] = idx[j];} 23784dcbc457SBarry Smith } 237906763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 23806bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2381e4d965acSSatish Balay 238204a348a9SBarry Smith k = 0; 238304a348a9SBarry Smith for (j=0; j<ov; j++){ /* for each overlap */ 238404a348a9SBarry Smith n = isz; 238506763907SSatish Balay for (; k<n ; k++){ /* do only those rows in nidx[k], which are not done yet */ 2386e4d965acSSatish Balay row = nidx[k]; 2387e4d965acSSatish Balay start = ai[row]; 2388e4d965acSSatish Balay end = ai[row+1]; 238904a348a9SBarry Smith for (l = start; l<end ; l++){ 2390efb16452SHong Zhang val = aj[l] ; 2391f1af5d2fSBarry Smith if (!PetscBTLookupSet(table,val)) {nidx[isz++] = val;} 2392e4d965acSSatish Balay } 2393e4d965acSSatish Balay } 2394e4d965acSSatish Balay } 239570b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2396e4d965acSSatish Balay } 23976831982aSBarry Smith ierr = PetscBTDestroy(table);CHKERRQ(ierr); 2398606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 23993a40ed3dSBarry Smith PetscFunctionReturn(0); 24004dcbc457SBarry Smith } 240117ab2063SBarry Smith 24020513a670SBarry Smith /* -------------------------------------------------------------- */ 24034a2ae208SSatish Balay #undef __FUNCT__ 24044a2ae208SSatish Balay #define __FUNCT__ "MatPermute_SeqAIJ" 2405dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 24060513a670SBarry Smith { 24070513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 24086849ba73SBarry Smith PetscErrorCode ierr; 24093b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 24105d0c19d7SBarry Smith const PetscInt *row,*col; 24115d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 241256cd22aeSBarry Smith IS icolp,irowp; 24133b98c0a2SBarry Smith PetscInt *cwork = PETSC_NULL; 24143b98c0a2SBarry Smith PetscScalar *vwork = PETSC_NULL; 24150513a670SBarry Smith 24163a40ed3dSBarry Smith PetscFunctionBegin; 24174c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 241856cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 24194c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 242056cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 24210513a670SBarry Smith 24220513a670SBarry Smith /* determine lengths of permuted rows */ 242397f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&lens);CHKERRQ(ierr); 24240513a670SBarry Smith for (i=0; i<m; i++) { 24250513a670SBarry Smith lens[row[i]] = a->i[i+1] - a->i[i]; 24260513a670SBarry Smith } 24277adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 2428f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 24297adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2430ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2431606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 24320513a670SBarry Smith 243397f1f81fSBarry Smith ierr = PetscMalloc(n*sizeof(PetscInt),&cnew);CHKERRQ(ierr); 24340513a670SBarry Smith for (i=0; i<m; i++) { 243532ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24360513a670SBarry Smith for (j=0; j<nz; j++) { cnew[j] = col[cwork[j]];} 2437cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 243832ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 24390513a670SBarry Smith } 2440606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 24413c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 24420513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 24430513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 244456cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 244556cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 24466bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 24476bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 24483a40ed3dSBarry Smith PetscFunctionReturn(0); 24490513a670SBarry Smith } 24500513a670SBarry Smith 24514a2ae208SSatish Balay #undef __FUNCT__ 24524a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqAIJ" 2453dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2454cb5b572fSBarry Smith { 2455dfbe8321SBarry Smith PetscErrorCode ierr; 2456cb5b572fSBarry Smith 2457cb5b572fSBarry Smith PetscFunctionBegin; 245833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 245933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2460be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2461be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2462be6bf707SBarry Smith 2463700c5bfcSBarry Smith if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 2464d0f46423SBarry Smith ierr = PetscMemcpy(b->a,a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 2465cb5b572fSBarry Smith } else { 2466cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2467cb5b572fSBarry Smith } 2468cb5b572fSBarry Smith PetscFunctionReturn(0); 2469cb5b572fSBarry Smith } 2470cb5b572fSBarry Smith 24714a2ae208SSatish Balay #undef __FUNCT__ 24724a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqAIJ" 2473dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqAIJ(Mat A) 2474273d9f13SBarry Smith { 2475dfbe8321SBarry Smith PetscErrorCode ierr; 2476273d9f13SBarry Smith 2477273d9f13SBarry Smith PetscFunctionBegin; 2478ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2479273d9f13SBarry Smith PetscFunctionReturn(0); 2480273d9f13SBarry Smith } 2481273d9f13SBarry Smith 24824a2ae208SSatish Balay #undef __FUNCT__ 24834a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqAIJ" 2484a77337e4SBarry Smith PetscErrorCode MatGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 24856c0721eeSBarry Smith { 24866c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 24876c0721eeSBarry Smith PetscFunctionBegin; 24886c0721eeSBarry Smith *array = a->a; 24896c0721eeSBarry Smith PetscFunctionReturn(0); 24906c0721eeSBarry Smith } 24916c0721eeSBarry Smith 24924a2ae208SSatish Balay #undef __FUNCT__ 24934a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqAIJ" 2494dfbe8321SBarry Smith PetscErrorCode MatRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 24956c0721eeSBarry Smith { 24966c0721eeSBarry Smith PetscFunctionBegin; 24976c0721eeSBarry Smith PetscFunctionReturn(0); 24986c0721eeSBarry Smith } 2499273d9f13SBarry Smith 2500ee4f033dSBarry Smith #undef __FUNCT__ 2501ee4f033dSBarry Smith #define __FUNCT__ "MatFDColoringApply_SeqAIJ" 2502dfbe8321SBarry Smith PetscErrorCode MatFDColoringApply_SeqAIJ(Mat J,MatFDColoring coloring,Vec x1,MatStructure *flag,void *sctx) 2503ee4f033dSBarry Smith { 25046849ba73SBarry Smith PetscErrorCode (*f)(void*,Vec,Vec,void*) = (PetscErrorCode (*)(void*,Vec,Vec,void *))coloring->f; 25056849ba73SBarry Smith PetscErrorCode ierr; 250697f1f81fSBarry Smith PetscInt k,N,start,end,l,row,col,srow,**vscaleforrow,m1,m2; 2507efb30889SBarry Smith PetscScalar dx,*y,*xx,*w3_array; 250887828ca2SBarry Smith PetscScalar *vscale_array; 2509ee4f033dSBarry Smith PetscReal epsilon = coloring->error_rel,umin = coloring->umin; 2510ee4f033dSBarry Smith Vec w1,w2,w3; 2511ee4f033dSBarry Smith void *fctx = coloring->fctx; 2512ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 2513ee4f033dSBarry Smith 2514ee4f033dSBarry Smith PetscFunctionBegin; 2515ee4f033dSBarry Smith if (!coloring->w1) { 2516ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w1);CHKERRQ(ierr); 251752e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w1);CHKERRQ(ierr); 2518ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w2);CHKERRQ(ierr); 251952e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w2);CHKERRQ(ierr); 2520ee4f033dSBarry Smith ierr = VecDuplicate(x1,&coloring->w3);CHKERRQ(ierr); 252152e6d16bSBarry Smith ierr = PetscLogObjectParent(coloring,coloring->w3);CHKERRQ(ierr); 2522ee4f033dSBarry Smith } 2523ee4f033dSBarry Smith w1 = coloring->w1; w2 = coloring->w2; w3 = coloring->w3; 2524ee4f033dSBarry Smith 2525ee4f033dSBarry Smith ierr = MatSetUnfactored(J);CHKERRQ(ierr); 2526acfcf0e5SJed Brown ierr = PetscOptionsGetBool(((PetscObject)coloring)->prefix,"-mat_fd_coloring_dont_rezero",&flg,PETSC_NULL);CHKERRQ(ierr); 2527ee4f033dSBarry Smith if (flg) { 2528ae15b995SBarry Smith ierr = PetscInfo(coloring,"Not calling MatZeroEntries()\n");CHKERRQ(ierr); 2529ee4f033dSBarry Smith } else { 2530ace3abfcSBarry Smith PetscBool assembled; 25310b9b6f31SBarry Smith ierr = MatAssembled(J,&assembled);CHKERRQ(ierr); 25320b9b6f31SBarry Smith if (assembled) { 2533ee4f033dSBarry Smith ierr = MatZeroEntries(J);CHKERRQ(ierr); 2534ee4f033dSBarry Smith } 25350b9b6f31SBarry Smith } 2536ee4f033dSBarry Smith 2537ee4f033dSBarry Smith ierr = VecGetOwnershipRange(x1,&start,&end);CHKERRQ(ierr); 2538ee4f033dSBarry Smith ierr = VecGetSize(x1,&N);CHKERRQ(ierr); 2539ee4f033dSBarry Smith 2540ee4f033dSBarry Smith /* 2541ee4f033dSBarry Smith This is a horrible, horrible, hack. See DMMGComputeJacobian_Multigrid() it inproperly sets 2542ee4f033dSBarry Smith coloring->F for the coarser grids from the finest 2543ee4f033dSBarry Smith */ 2544ee4f033dSBarry Smith if (coloring->F) { 2545ee4f033dSBarry Smith ierr = VecGetLocalSize(coloring->F,&m1);CHKERRQ(ierr); 2546ee4f033dSBarry Smith ierr = VecGetLocalSize(w1,&m2);CHKERRQ(ierr); 2547ee4f033dSBarry Smith if (m1 != m2) { 2548ee4f033dSBarry Smith coloring->F = 0; 2549ee4f033dSBarry Smith } 2550ee4f033dSBarry Smith } 2551ee4f033dSBarry Smith 2552ee4f033dSBarry Smith if (coloring->F) { 2553ee4f033dSBarry Smith w1 = coloring->F; 2554ee4f033dSBarry Smith coloring->F = 0; 2555ee4f033dSBarry Smith } else { 255666f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2557ee4f033dSBarry Smith ierr = (*f)(sctx,x1,w1,fctx);CHKERRQ(ierr); 255866f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2559ee4f033dSBarry Smith } 2560ee4f033dSBarry Smith 2561ee4f033dSBarry Smith /* 2562ee4f033dSBarry Smith Compute all the scale factors and share with other processors 2563ee4f033dSBarry Smith */ 25641ebc52fbSHong Zhang ierr = VecGetArray(x1,&xx);CHKERRQ(ierr);xx = xx - start; 25651ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr);vscale_array = vscale_array - start; 2566ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 2567ee4f033dSBarry Smith /* 2568ee4f033dSBarry Smith Loop over each column associated with color adding the 2569ee4f033dSBarry Smith perturbation to the vector w3. 2570ee4f033dSBarry Smith */ 2571ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2572ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2573ee4f033dSBarry Smith dx = xx[col]; 2574ee4f033dSBarry Smith if (dx == 0.0) dx = 1.0; 2575ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2576ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2577ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2578ee4f033dSBarry Smith #else 2579ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2580ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2581ee4f033dSBarry Smith #endif 2582ee4f033dSBarry Smith dx *= epsilon; 2583ee4f033dSBarry Smith vscale_array[col] = 1.0/dx; 2584ee4f033dSBarry Smith } 2585ee4f033dSBarry Smith } 25861ebc52fbSHong Zhang vscale_array = vscale_array + start;ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2587ee4f033dSBarry Smith ierr = VecGhostUpdateBegin(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2588ee4f033dSBarry Smith ierr = VecGhostUpdateEnd(coloring->vscale,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2589ee4f033dSBarry Smith 2590ee4f033dSBarry Smith /* ierr = VecView(coloring->vscale,PETSC_VIEWER_STDOUT_WORLD); 2591ee4f033dSBarry Smith ierr = VecView(x1,PETSC_VIEWER_STDOUT_WORLD);*/ 2592ee4f033dSBarry Smith 2593ee4f033dSBarry Smith if (coloring->vscaleforrow) vscaleforrow = coloring->vscaleforrow; 2594ee4f033dSBarry Smith else vscaleforrow = coloring->columnsforrow; 2595ee4f033dSBarry Smith 25961ebc52fbSHong Zhang ierr = VecGetArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 2597ee4f033dSBarry Smith /* 2598ee4f033dSBarry Smith Loop over each color 2599ee4f033dSBarry Smith */ 2600ee4f033dSBarry Smith for (k=0; k<coloring->ncolors; k++) { 260149b058dcSBarry Smith coloring->currentcolor = k; 2602ee4f033dSBarry Smith ierr = VecCopy(x1,w3);CHKERRQ(ierr); 26031ebc52fbSHong Zhang ierr = VecGetArray(w3,&w3_array);CHKERRQ(ierr);w3_array = w3_array - start; 2604ee4f033dSBarry Smith /* 2605ee4f033dSBarry Smith Loop over each column associated with color adding the 2606ee4f033dSBarry Smith perturbation to the vector w3. 2607ee4f033dSBarry Smith */ 2608ee4f033dSBarry Smith for (l=0; l<coloring->ncolumns[k]; l++) { 2609ee4f033dSBarry Smith col = coloring->columns[k][l]; /* column of the matrix we are probing for */ 2610ee4f033dSBarry Smith dx = xx[col]; 26115b8514ebSBarry Smith if (dx == 0.0) dx = 1.0; 2612ee4f033dSBarry Smith #if !defined(PETSC_USE_COMPLEX) 2613ee4f033dSBarry Smith if (dx < umin && dx >= 0.0) dx = umin; 2614ee4f033dSBarry Smith else if (dx < 0.0 && dx > -umin) dx = -umin; 2615ee4f033dSBarry Smith #else 2616ee4f033dSBarry Smith if (PetscAbsScalar(dx) < umin && PetscRealPart(dx) >= 0.0) dx = umin; 2617ee4f033dSBarry Smith else if (PetscRealPart(dx) < 0.0 && PetscAbsScalar(dx) < umin) dx = -umin; 2618ee4f033dSBarry Smith #endif 2619ee4f033dSBarry Smith dx *= epsilon; 2620e32f2f54SBarry Smith if (!PetscAbsScalar(dx)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Computed 0 differencing parameter"); 2621ee4f033dSBarry Smith w3_array[col] += dx; 2622ee4f033dSBarry Smith } 26231ebc52fbSHong Zhang w3_array = w3_array + start; ierr = VecRestoreArray(w3,&w3_array);CHKERRQ(ierr); 2624ee4f033dSBarry Smith 2625ee4f033dSBarry Smith /* 2626ee4f033dSBarry Smith Evaluate function at x1 + dx (here dx is a vector of perturbations) 2627ee4f033dSBarry Smith */ 2628ee4f033dSBarry Smith 262966f9b7ceSBarry Smith ierr = PetscLogEventBegin(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2630ee4f033dSBarry Smith ierr = (*f)(sctx,w3,w2,fctx);CHKERRQ(ierr); 263166f9b7ceSBarry Smith ierr = PetscLogEventEnd(MAT_FDColoringFunction,0,0,0,0);CHKERRQ(ierr); 2632efb30889SBarry Smith ierr = VecAXPY(w2,-1.0,w1);CHKERRQ(ierr); 2633ee4f033dSBarry Smith 2634ee4f033dSBarry Smith /* 2635ee4f033dSBarry Smith Loop over rows of vector, putting results into Jacobian matrix 2636ee4f033dSBarry Smith */ 26371ebc52fbSHong Zhang ierr = VecGetArray(w2,&y);CHKERRQ(ierr); 2638ee4f033dSBarry Smith for (l=0; l<coloring->nrows[k]; l++) { 2639ee4f033dSBarry Smith row = coloring->rows[k][l]; 2640ee4f033dSBarry Smith col = coloring->columnsforrow[k][l]; 2641ee4f033dSBarry Smith y[row] *= vscale_array[vscaleforrow[k][l]]; 2642ee4f033dSBarry Smith srow = row + start; 2643ee4f033dSBarry Smith ierr = MatSetValues_SeqAIJ(J,1,&srow,1,&col,y+row,INSERT_VALUES);CHKERRQ(ierr); 2644ee4f033dSBarry Smith } 26451ebc52fbSHong Zhang ierr = VecRestoreArray(w2,&y);CHKERRQ(ierr); 2646ee4f033dSBarry Smith } 264749b058dcSBarry Smith coloring->currentcolor = k; 26481ebc52fbSHong Zhang ierr = VecRestoreArray(coloring->vscale,&vscale_array);CHKERRQ(ierr); 26491ebc52fbSHong Zhang xx = xx + start; ierr = VecRestoreArray(x1,&xx);CHKERRQ(ierr); 2650ee4f033dSBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2651ee4f033dSBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2652ee4f033dSBarry Smith PetscFunctionReturn(0); 2653ee4f033dSBarry Smith } 2654ee4f033dSBarry Smith 26558229c054SShri Abhyankar /* 26568229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 26578229c054SShri Abhyankar have different nonzero structure. 26588229c054SShri Abhyankar */ 2659ac90fabeSBarry Smith #undef __FUNCT__ 26608229c054SShri Abhyankar #define __FUNCT__ "MatAXPYGetPreallocation_SeqAIJ" 26618229c054SShri Abhyankar PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt* nnz) 2662ec7775f6SShri Abhyankar { 26638229c054SShri Abhyankar PetscInt i,m=Y->rmap->N; 2664ec7775f6SShri Abhyankar Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2665ec7775f6SShri Abhyankar Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2666ec7775f6SShri Abhyankar const PetscInt *xi = x->i,*yi = y->i; 2667ec7775f6SShri Abhyankar 2668ec7775f6SShri Abhyankar PetscFunctionBegin; 2669ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2670ec7775f6SShri Abhyankar for(i=0; i<m; i++) { 26718af7cee1SJed Brown PetscInt j,k,nzx = xi[i+1] - xi[i],nzy = yi[i+1] - yi[i]; 26728af7cee1SJed Brown const PetscInt *xj = x->j+xi[i],*yj = y->j+yi[i]; 26738af7cee1SJed Brown nnz[i] = 0; 26748af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 26758af7cee1SJed Brown for (; k<nzy && yj[k]<xj[j]; k++) nnz[i]++; /* Catch up to X */ 26768af7cee1SJed Brown if (k<nzy && yj[k]==xj[j]) k++; /* Skip duplicate */ 26778af7cee1SJed Brown nnz[i]++; 26788af7cee1SJed Brown } 26798af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2680ec7775f6SShri Abhyankar } 2681ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2682ec7775f6SShri Abhyankar } 2683ec7775f6SShri Abhyankar 2684ec7775f6SShri Abhyankar #undef __FUNCT__ 2685ac90fabeSBarry Smith #define __FUNCT__ "MatAXPY_SeqAIJ" 2686f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2687ac90fabeSBarry Smith { 2688dfbe8321SBarry Smith PetscErrorCode ierr; 268997f1f81fSBarry Smith PetscInt i; 2690ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data,*y = (Mat_SeqAIJ *)Y->data; 26910805154bSBarry Smith PetscBLASInt one=1,bnz = PetscBLASIntCast(x->nz); 2692ac90fabeSBarry Smith 2693ac90fabeSBarry Smith PetscFunctionBegin; 2694ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 2695f4df32b1SMatthew Knepley PetscScalar alpha = a; 2696f4df32b1SMatthew Knepley BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one); 269786c113feSBarry Smith y->idiagvalid = PETSC_FALSE; 269886c113feSBarry Smith y->ibdiagvalid = PETSC_FALSE; 2699c537a176SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2700a30b2313SHong Zhang if (y->xtoy && y->XtoY != X) { 2701a30b2313SHong Zhang ierr = PetscFree(y->xtoy);CHKERRQ(ierr); 27026bf464f9SBarry Smith ierr = MatDestroy(&y->XtoY);CHKERRQ(ierr); 2703a30b2313SHong Zhang } 2704a30b2313SHong Zhang if (!y->xtoy) { /* get xtoy */ 2705d0f46423SBarry Smith ierr = MatAXPYGetxtoy_Private(X->rmap->n,x->i,x->j,PETSC_NULL, y->i,y->j,PETSC_NULL, &y->xtoy);CHKERRQ(ierr); 2706a30b2313SHong Zhang y->XtoY = X; 2707407f6b05SHong Zhang ierr = PetscObjectReference((PetscObject)X);CHKERRQ(ierr); 2708c537a176SHong Zhang } 2709f4df32b1SMatthew Knepley for (i=0; i<x->nz; i++) y->a[y->xtoy[i]] += a*(x->a[i]); 27101e2582c4SBarry Smith ierr = PetscInfo3(Y,"ratio of nnz(X)/nnz(Y): %d/%d = %G\n",x->nz,y->nz,(PetscReal)(x->nz)/y->nz);CHKERRQ(ierr); 2711ac90fabeSBarry Smith } else { 27128229c054SShri Abhyankar Mat B; 27138229c054SShri Abhyankar PetscInt *nnz; 271416b2e9dcSShri Abhyankar ierr = PetscMalloc(Y->rmap->N*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2715ec7775f6SShri Abhyankar ierr = MatCreate(((PetscObject)Y)->comm,&B);CHKERRQ(ierr); 2716bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 27174aa94f47SShri Abhyankar ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 2718176df525SBarry Smith ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr); 27198229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 2720ecd8bba6SJed Brown ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr); 2721ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 2722ec7775f6SShri Abhyankar ierr = MatHeaderReplace(Y,B);CHKERRQ(ierr); 27238229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 2724ac90fabeSBarry Smith } 2725ac90fabeSBarry Smith PetscFunctionReturn(0); 2726ac90fabeSBarry Smith } 2727ac90fabeSBarry Smith 2728521d7252SBarry Smith #undef __FUNCT__ 2729521d7252SBarry Smith #define __FUNCT__ "MatSetBlockSize_SeqAIJ" 2730521d7252SBarry Smith PetscErrorCode MatSetBlockSize_SeqAIJ(Mat A,PetscInt bs) 2731521d7252SBarry Smith { 273241c166b1SJed Brown PetscErrorCode ierr; 273341c166b1SJed Brown 2734521d7252SBarry Smith PetscFunctionBegin; 273541c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->rmap,bs);CHKERRQ(ierr); 273641c166b1SJed Brown ierr = PetscLayoutSetBlockSize(A->cmap,bs);CHKERRQ(ierr); 2737521d7252SBarry Smith PetscFunctionReturn(0); 2738521d7252SBarry Smith } 2739521d7252SBarry Smith 2740354c94deSBarry Smith #undef __FUNCT__ 2741354c94deSBarry Smith #define __FUNCT__ "MatConjugate_SeqAIJ" 27427087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 2743354c94deSBarry Smith { 2744354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2745354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 2746354c94deSBarry Smith PetscInt i,nz; 2747354c94deSBarry Smith PetscScalar *a; 2748354c94deSBarry Smith 2749354c94deSBarry Smith PetscFunctionBegin; 2750354c94deSBarry Smith nz = aij->nz; 2751354c94deSBarry Smith a = aij->a; 2752354c94deSBarry Smith for (i=0; i<nz; i++) { 2753354c94deSBarry Smith a[i] = PetscConj(a[i]); 2754354c94deSBarry Smith } 2755354c94deSBarry Smith #else 2756354c94deSBarry Smith PetscFunctionBegin; 2757354c94deSBarry Smith #endif 2758354c94deSBarry Smith PetscFunctionReturn(0); 2759354c94deSBarry Smith } 2760354c94deSBarry Smith 2761e34fafa9SBarry Smith #undef __FUNCT__ 2762985db425SBarry Smith #define __FUNCT__ "MatGetRowMaxAbs_SeqAIJ" 2763985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2764e34fafa9SBarry Smith { 2765e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2766e34fafa9SBarry Smith PetscErrorCode ierr; 2767d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2768e34fafa9SBarry Smith PetscReal atmp; 2769985db425SBarry Smith PetscScalar *x; 2770e34fafa9SBarry Smith MatScalar *aa; 2771e34fafa9SBarry Smith 2772e34fafa9SBarry Smith PetscFunctionBegin; 2773e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2774e34fafa9SBarry Smith aa = a->a; 2775e34fafa9SBarry Smith ai = a->i; 2776e34fafa9SBarry Smith aj = a->j; 2777e34fafa9SBarry Smith 2778985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2779e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2780e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2781e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2782e34fafa9SBarry Smith for (i=0; i<m; i++) { 2783e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 27849189402eSHong Zhang x[i] = 0.0; 2785e34fafa9SBarry Smith for (j=0; j<ncols; j++){ 2786985db425SBarry Smith atmp = PetscAbsScalar(*aa); 2787985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2788985db425SBarry Smith aa++; aj++; 2789985db425SBarry Smith } 2790985db425SBarry Smith } 2791985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2792985db425SBarry Smith PetscFunctionReturn(0); 2793985db425SBarry Smith } 2794985db425SBarry Smith 2795985db425SBarry Smith #undef __FUNCT__ 2796985db425SBarry Smith #define __FUNCT__ "MatGetRowMax_SeqAIJ" 2797985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2798985db425SBarry Smith { 2799985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2800985db425SBarry Smith PetscErrorCode ierr; 2801d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2802985db425SBarry Smith PetscScalar *x; 2803985db425SBarry Smith MatScalar *aa; 2804985db425SBarry Smith 2805985db425SBarry Smith PetscFunctionBegin; 2806e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2807985db425SBarry Smith aa = a->a; 2808985db425SBarry Smith ai = a->i; 2809985db425SBarry Smith aj = a->j; 2810985db425SBarry Smith 2811985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2812985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2813985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2814e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2815985db425SBarry Smith for (i=0; i<m; i++) { 2816985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2817d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2818985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2819985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 2820985db425SBarry Smith x[i] = 0.0; 2821985db425SBarry Smith if (idx) { 2822985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2823985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 2824985db425SBarry Smith if (aj[j] > j) { 2825985db425SBarry Smith idx[i] = j; 2826985db425SBarry Smith break; 2827985db425SBarry Smith } 2828985db425SBarry Smith } 2829985db425SBarry Smith } 2830985db425SBarry Smith } 2831985db425SBarry Smith for (j=0; j<ncols; j++){ 2832985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2833985db425SBarry Smith aa++; aj++; 2834985db425SBarry Smith } 2835985db425SBarry Smith } 2836985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2837985db425SBarry Smith PetscFunctionReturn(0); 2838985db425SBarry Smith } 2839985db425SBarry Smith 2840985db425SBarry Smith #undef __FUNCT__ 2841c87e5d42SMatthew Knepley #define __FUNCT__ "MatGetRowMinAbs_SeqAIJ" 2842c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2843c87e5d42SMatthew Knepley { 2844c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2845c87e5d42SMatthew Knepley PetscErrorCode ierr; 2846c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2847c87e5d42SMatthew Knepley PetscReal atmp; 2848c87e5d42SMatthew Knepley PetscScalar *x; 2849c87e5d42SMatthew Knepley MatScalar *aa; 2850c87e5d42SMatthew Knepley 2851c87e5d42SMatthew Knepley PetscFunctionBegin; 2852e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2853c87e5d42SMatthew Knepley aa = a->a; 2854c87e5d42SMatthew Knepley ai = a->i; 2855c87e5d42SMatthew Knepley aj = a->j; 2856c87e5d42SMatthew Knepley 2857c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 2858c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2859c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2860e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2861c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 2862c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 2863289a08f5SMatthew Knepley if (ncols) { 2864289a08f5SMatthew Knepley /* Get first nonzero */ 2865289a08f5SMatthew Knepley for(j = 0; j < ncols; j++) { 2866289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 2867289a08f5SMatthew Knepley if (atmp > 1.0e-12) {x[i] = atmp; if (idx) idx[i] = aj[j]; break;} 2868289a08f5SMatthew Knepley } 2869289a08f5SMatthew Knepley if (j == ncols) {x[i] = *aa; if (idx) idx[i] = *aj;} 2870289a08f5SMatthew Knepley } else { 2871289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 2872289a08f5SMatthew Knepley } 2873c87e5d42SMatthew Knepley for(j = 0; j < ncols; j++) { 2874c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 2875289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2876c87e5d42SMatthew Knepley aa++; aj++; 2877c87e5d42SMatthew Knepley } 2878c87e5d42SMatthew Knepley } 2879c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2880c87e5d42SMatthew Knepley PetscFunctionReturn(0); 2881c87e5d42SMatthew Knepley } 2882c87e5d42SMatthew Knepley 2883c87e5d42SMatthew Knepley #undef __FUNCT__ 2884985db425SBarry Smith #define __FUNCT__ "MatGetRowMin_SeqAIJ" 2885985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2886985db425SBarry Smith { 2887985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2888985db425SBarry Smith PetscErrorCode ierr; 2889d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2890985db425SBarry Smith PetscScalar *x; 2891985db425SBarry Smith MatScalar *aa; 2892985db425SBarry Smith 2893985db425SBarry Smith PetscFunctionBegin; 2894e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2895985db425SBarry Smith aa = a->a; 2896985db425SBarry Smith ai = a->i; 2897985db425SBarry Smith aj = a->j; 2898985db425SBarry Smith 2899985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2900985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2901985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2902e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2903985db425SBarry Smith for (i=0; i<m; i++) { 2904985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2905d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2906985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2907985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 2908985db425SBarry Smith x[i] = 0.0; 2909985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 2910985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2911985db425SBarry Smith for (j=0;j<ncols;j++) { 2912985db425SBarry Smith if (aj[j] > j) { 2913985db425SBarry Smith idx[i] = j; 2914985db425SBarry Smith break; 2915985db425SBarry Smith } 2916985db425SBarry Smith } 2917985db425SBarry Smith } 2918985db425SBarry Smith } 2919985db425SBarry Smith for (j=0; j<ncols; j++){ 2920985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2921985db425SBarry Smith aa++; aj++; 2922e34fafa9SBarry Smith } 2923e34fafa9SBarry Smith } 2924e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2925e34fafa9SBarry Smith PetscFunctionReturn(0); 2926e34fafa9SBarry Smith } 2927bbead8a2SBarry Smith 2928bbead8a2SBarry Smith #include <petscblaslapack.h> 2929bbead8a2SBarry Smith #include <../src/mat/blockinvert.h> 2930bbead8a2SBarry Smith 2931bbead8a2SBarry Smith #undef __FUNCT__ 2932bbead8a2SBarry Smith #define __FUNCT__ "MatInvertBlockDiagonal_SeqAIJ" 2933bbead8a2SBarry Smith PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,PetscScalar **values) 2934bbead8a2SBarry Smith { 2935bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 2936bbead8a2SBarry Smith PetscErrorCode ierr; 293734fc4b71SJed Brown PetscInt i,bs = A->rmap->bs,mbs = A->rmap->n/A->rmap->bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 2938bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 2939bbead8a2SBarry Smith PetscReal shift = 0.0; 2940bbead8a2SBarry Smith 2941bbead8a2SBarry Smith PetscFunctionBegin; 29424a0d0026SBarry Smith if (a->ibdiagvalid) { 29434a0d0026SBarry Smith if (values) *values = a->ibdiag; 29444a0d0026SBarry Smith PetscFunctionReturn(0); 29454a0d0026SBarry Smith } 2946bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 2947bbead8a2SBarry Smith if (!a->ibdiag) { 2948bbead8a2SBarry Smith ierr = PetscMalloc(bs2*mbs*sizeof(PetscScalar),&a->ibdiag);CHKERRQ(ierr); 2949bbead8a2SBarry Smith ierr = PetscLogObjectMemory(A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 2950bbead8a2SBarry Smith } 2951bbead8a2SBarry Smith diag = a->ibdiag; 2952bbead8a2SBarry Smith if (values) *values = a->ibdiag; 2953bbead8a2SBarry Smith /* factor and invert each block */ 2954bbead8a2SBarry Smith switch (bs){ 2955bbead8a2SBarry Smith case 1: 2956bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2957bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 2958bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 2959bbead8a2SBarry Smith } 2960bbead8a2SBarry Smith break; 2961bbead8a2SBarry Smith case 2: 2962bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2963bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 2964bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 2965bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_2(diag,shift);CHKERRQ(ierr); 2966d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 2967bbead8a2SBarry Smith diag += 4; 2968bbead8a2SBarry Smith } 2969bbead8a2SBarry Smith break; 2970bbead8a2SBarry Smith case 3: 2971bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2972bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 2973bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 2974bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_3(diag,shift);CHKERRQ(ierr); 2975d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 2976bbead8a2SBarry Smith diag += 9; 2977bbead8a2SBarry Smith } 2978bbead8a2SBarry Smith break; 2979bbead8a2SBarry Smith case 4: 2980bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2981bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 2982bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 2983bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_4(diag,shift);CHKERRQ(ierr); 2984d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 2985bbead8a2SBarry Smith diag += 16; 2986bbead8a2SBarry Smith } 2987bbead8a2SBarry Smith break; 2988bbead8a2SBarry Smith case 5: 2989bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2990bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 2991bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 2992bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_5(diag,ipvt,work,shift);CHKERRQ(ierr); 2993d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 2994bbead8a2SBarry Smith diag += 25; 2995bbead8a2SBarry Smith } 2996bbead8a2SBarry Smith break; 2997bbead8a2SBarry Smith case 6: 2998bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 2999bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 3000bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 3001bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_6(diag,shift);CHKERRQ(ierr); 3002d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 3003bbead8a2SBarry Smith diag += 36; 3004bbead8a2SBarry Smith } 3005bbead8a2SBarry Smith break; 3006bbead8a2SBarry Smith case 7: 3007bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3008bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3009bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3010bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A_7(diag,shift);CHKERRQ(ierr); 3011d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 3012bbead8a2SBarry Smith diag += 49; 3013bbead8a2SBarry Smith } 3014bbead8a2SBarry Smith break; 3015bbead8a2SBarry Smith default: 3016bbead8a2SBarry Smith ierr = PetscMalloc3(bs,MatScalar,&v_work,bs,PetscInt,&v_pivots,bs,PetscInt,&IJ);CHKERRQ(ierr); 3017bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3018bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3019bbead8a2SBarry Smith IJ[j] = bs*i + j; 3020bbead8a2SBarry Smith } 3021bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 3022bbead8a2SBarry Smith ierr = Kernel_A_gets_inverse_A(bs,diag,v_pivots,v_work);CHKERRQ(ierr); 3023d441b888SJed Brown ierr = Kernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr); 3024bbead8a2SBarry Smith diag += bs2; 3025bbead8a2SBarry Smith } 3026bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3027bbead8a2SBarry Smith } 3028bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3029bbead8a2SBarry Smith PetscFunctionReturn(0); 3030bbead8a2SBarry Smith } 3031bbead8a2SBarry Smith 30327087cfbeSBarry Smith extern PetscErrorCode MatFDColoringApply_AIJ(Mat,MatFDColoring,Vec,MatStructure*,void*); 3033682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 30340a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3035cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3036cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3037cb5b572fSBarry Smith MatMult_SeqAIJ, 303897304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 30397c922b88SBarry Smith MatMultTranspose_SeqAIJ, 30407c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3041db4efbfdSBarry Smith 0, 3042db4efbfdSBarry Smith 0, 3043db4efbfdSBarry Smith 0, 3044db4efbfdSBarry Smith /*10*/ 0, 3045cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3046cb5b572fSBarry Smith 0, 304741f059aeSBarry Smith MatSOR_SeqAIJ, 304817ab2063SBarry Smith MatTranspose_SeqAIJ, 304997304618SKris Buschelman /*15*/ MatGetInfo_SeqAIJ, 3050cb5b572fSBarry Smith MatEqual_SeqAIJ, 3051cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3052cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3053cb5b572fSBarry Smith MatNorm_SeqAIJ, 305497304618SKris Buschelman /*20*/ 0, 3055cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3056cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3057cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3058d519adbfSMatthew Knepley /*24*/ MatZeroRows_SeqAIJ, 3059db4efbfdSBarry Smith 0, 3060db4efbfdSBarry Smith 0, 3061db4efbfdSBarry Smith 0, 3062db4efbfdSBarry Smith 0, 3063d519adbfSMatthew Knepley /*29*/ MatSetUpPreallocation_SeqAIJ, 3064db4efbfdSBarry Smith 0, 3065db4efbfdSBarry Smith 0, 30666c0721eeSBarry Smith MatGetArray_SeqAIJ, 30676c0721eeSBarry Smith MatRestoreArray_SeqAIJ, 3068d519adbfSMatthew Knepley /*34*/ MatDuplicate_SeqAIJ, 3069cb5b572fSBarry Smith 0, 3070cb5b572fSBarry Smith 0, 3071cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3072cb5b572fSBarry Smith 0, 3073d519adbfSMatthew Knepley /*39*/ MatAXPY_SeqAIJ, 3074cb5b572fSBarry Smith MatGetSubMatrices_SeqAIJ, 3075cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3076cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3077cb5b572fSBarry Smith MatCopy_SeqAIJ, 3078d519adbfSMatthew Knepley /*44*/ MatGetRowMax_SeqAIJ, 3079cb5b572fSBarry Smith MatScale_SeqAIJ, 3080cb5b572fSBarry Smith 0, 308179299369SBarry Smith MatDiagonalSet_SeqAIJ, 30826e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 3083d519adbfSMatthew Knepley /*49*/ MatSetBlockSize_SeqAIJ, 30843b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 30853b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 30863b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3087a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 3088d519adbfSMatthew Knepley /*54*/ MatFDColoringCreate_SeqAIJ, 3089b9617806SBarry Smith 0, 30900513a670SBarry Smith 0, 3091cda55fadSBarry Smith MatPermute_SeqAIJ, 3092cda55fadSBarry Smith 0, 3093d519adbfSMatthew Knepley /*59*/ 0, 3094b9b97703SBarry Smith MatDestroy_SeqAIJ, 3095b9b97703SBarry Smith MatView_SeqAIJ, 3096357abbc8SBarry Smith 0, 3097ee4f033dSBarry Smith 0, 3098d519adbfSMatthew Knepley /*64*/ 0, 3099ee4f033dSBarry Smith 0, 3100ee4f033dSBarry Smith 0, 3101ee4f033dSBarry Smith 0, 3102ee4f033dSBarry Smith 0, 3103d519adbfSMatthew Knepley /*69*/ MatGetRowMaxAbs_SeqAIJ, 3104c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3105ee4f033dSBarry Smith 0, 3106ee4f033dSBarry Smith MatSetColoring_SeqAIJ, 3107dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 3108ee4f033dSBarry Smith MatSetValuesAdic_SeqAIJ, 3109dcf5cc72SBarry Smith #else 3110dcf5cc72SBarry Smith 0, 3111dcf5cc72SBarry Smith #endif 3112d519adbfSMatthew Knepley /*74*/ MatSetValuesAdifor_SeqAIJ, 31133acb8795SBarry Smith MatFDColoringApply_AIJ, 311497304618SKris Buschelman 0, 311597304618SKris Buschelman 0, 311697304618SKris Buschelman 0, 31176ce1633cSBarry Smith /*79*/ MatFindZeroDiagonals_SeqAIJ, 311897304618SKris Buschelman 0, 311997304618SKris Buschelman 0, 312097304618SKris Buschelman 0, 3121bc011b1eSHong Zhang MatLoad_SeqAIJ, 3122d519adbfSMatthew Knepley /*84*/ MatIsSymmetric_SeqAIJ, 31231cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 31246284ec50SHong Zhang 0, 31256284ec50SHong Zhang 0, 3126bc011b1eSHong Zhang 0, 3127d519adbfSMatthew Knepley /*89*/ MatMatMult_SeqAIJ_SeqAIJ, 312826be0446SHong Zhang MatMatMultSymbolic_SeqAIJ_SeqAIJ, 312926be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3130d439da42SKris Buschelman MatPtAP_Basic, 31317ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ, 3132d519adbfSMatthew Knepley /*94*/ MatPtAPNumeric_SeqAIJ, 31336fc122caSHong Zhang MatMatTransposeMult_SeqAIJ_SeqAIJ, 31346fc122caSHong Zhang MatMatTransposeMultSymbolic_SeqAIJ_SeqAIJ, 31356fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 31367ba1a0bfSKris Buschelman MatPtAPSymbolic_SeqAIJ_SeqAIJ, 3137d519adbfSMatthew Knepley /*99*/ MatPtAPNumeric_SeqAIJ_SeqAIJ, 3138609c6c4dSKris Buschelman 0, 3139609c6c4dSKris Buschelman 0, 314087d4246cSBarry Smith MatConjugate_SeqAIJ, 314187d4246cSBarry Smith 0, 3142d519adbfSMatthew Knepley /*104*/MatSetValuesRow_SeqAIJ, 314399cafbc1SBarry Smith MatRealPart_SeqAIJ, 3144f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3145f5edf698SHong Zhang 0, 31462bebee5dSHong Zhang 0, 3147cbd44569SHong Zhang /*109*/MatMatSolve_SeqAIJ, 3148985db425SBarry Smith 0, 31492af78befSBarry Smith MatGetRowMin_SeqAIJ, 31502af78befSBarry Smith 0, 3151599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3152d519adbfSMatthew Knepley /*114*/0, 3153599ef60dSHong Zhang 0, 31543c2a7987SHong Zhang 0, 3155fe97e370SBarry Smith 0, 3156fbdbba38SShri Abhyankar 0, 3157fbdbba38SShri Abhyankar /*119*/0, 3158fbdbba38SShri Abhyankar 0, 3159fbdbba38SShri Abhyankar 0, 316082d44351SHong Zhang 0, 3161b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 31620716a85fSBarry Smith /*124*/MatFindNonzeroRows_SeqAIJ, 3163bbead8a2SBarry Smith MatGetColumnNorms_SeqAIJ, 316437868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 316537868618SMatthew G Knepley 0, 316637868618SMatthew G Knepley 0, 31675df89d91SHong Zhang /*129*/0, 316875648e8dSHong Zhang MatTransposeMatMult_SeqAIJ_SeqAIJ, 316975648e8dSHong Zhang MatTransposeMatMultSymbolic_SeqAIJ_SeqAIJ, 317075648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3171b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3172b9af6bddSHong Zhang /*134*/MatTransColoringApplySpToDen_SeqAIJ, 31732b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 31742b8ad9a3SHong Zhang MatRARt_SeqAIJ_SeqAIJ, 31752b8ad9a3SHong Zhang MatRARtSymbolic_SeqAIJ_SeqAIJ, 31762b8ad9a3SHong Zhang MatRARtNumeric_SeqAIJ_SeqAIJ 31779e29f15eSvictorle }; 317817ab2063SBarry Smith 3179fb2e594dSBarry Smith EXTERN_C_BEGIN 31804a2ae208SSatish Balay #undef __FUNCT__ 31814a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices_SeqAIJ" 31827087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3183bef8e0ddSBarry Smith { 3184bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 318597f1f81fSBarry Smith PetscInt i,nz,n; 3186bef8e0ddSBarry Smith 3187bef8e0ddSBarry Smith PetscFunctionBegin; 3188bef8e0ddSBarry Smith 3189bef8e0ddSBarry Smith nz = aij->maxnz; 3190d0f46423SBarry Smith n = mat->rmap->n; 3191bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3192bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3193bef8e0ddSBarry Smith } 3194bef8e0ddSBarry Smith aij->nz = nz; 3195bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3196bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3197bef8e0ddSBarry Smith } 3198bef8e0ddSBarry Smith 3199bef8e0ddSBarry Smith PetscFunctionReturn(0); 3200bef8e0ddSBarry Smith } 3201fb2e594dSBarry Smith EXTERN_C_END 3202bef8e0ddSBarry Smith 32034a2ae208SSatish Balay #undef __FUNCT__ 32044a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetColumnIndices" 3205bef8e0ddSBarry Smith /*@ 3206bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3207bef8e0ddSBarry Smith in the matrix. 3208bef8e0ddSBarry Smith 3209bef8e0ddSBarry Smith Input Parameters: 3210bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3211bef8e0ddSBarry Smith - indices - the column indices 3212bef8e0ddSBarry Smith 321315091d37SBarry Smith Level: advanced 321415091d37SBarry Smith 3215bef8e0ddSBarry Smith Notes: 3216bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3217bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3218bef8e0ddSBarry Smith of the MatSetValues() operation. 3219bef8e0ddSBarry Smith 3220bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3221d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3222bef8e0ddSBarry Smith 3223bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3224bef8e0ddSBarry Smith 3225b9617806SBarry Smith The indices should start with zero, not one. 3226b9617806SBarry Smith 3227bef8e0ddSBarry Smith @*/ 32287087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3229bef8e0ddSBarry Smith { 32304ac538c5SBarry Smith PetscErrorCode ierr; 3231bef8e0ddSBarry Smith 3232bef8e0ddSBarry Smith PetscFunctionBegin; 32330700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 32344482741eSBarry Smith PetscValidPointer(indices,2); 32354ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt *),(mat,indices));CHKERRQ(ierr); 3236bef8e0ddSBarry Smith PetscFunctionReturn(0); 3237bef8e0ddSBarry Smith } 3238bef8e0ddSBarry Smith 3239be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3240be6bf707SBarry Smith 3241fb2e594dSBarry Smith EXTERN_C_BEGIN 32424a2ae208SSatish Balay #undef __FUNCT__ 32434a2ae208SSatish Balay #define __FUNCT__ "MatStoreValues_SeqAIJ" 32447087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3245be6bf707SBarry Smith { 3246be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 32476849ba73SBarry Smith PetscErrorCode ierr; 3248d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3249be6bf707SBarry Smith 3250be6bf707SBarry Smith PetscFunctionBegin; 3251be6bf707SBarry Smith if (aij->nonew != 1) { 3252e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3253be6bf707SBarry Smith } 3254be6bf707SBarry Smith 3255be6bf707SBarry Smith /* allocate space for values if not already there */ 3256be6bf707SBarry Smith if (!aij->saved_values) { 325787828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&aij->saved_values);CHKERRQ(ierr); 32589518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3259be6bf707SBarry Smith } 3260be6bf707SBarry Smith 3261be6bf707SBarry Smith /* copy values over */ 326287828ca2SBarry Smith ierr = PetscMemcpy(aij->saved_values,aij->a,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3263be6bf707SBarry Smith PetscFunctionReturn(0); 3264be6bf707SBarry Smith } 3265fb2e594dSBarry Smith EXTERN_C_END 3266be6bf707SBarry Smith 32674a2ae208SSatish Balay #undef __FUNCT__ 3268b9617806SBarry Smith #define __FUNCT__ "MatStoreValues" 3269be6bf707SBarry Smith /*@ 3270be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3271be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3272be6bf707SBarry Smith nonlinear portion. 3273be6bf707SBarry Smith 3274be6bf707SBarry Smith Collect on Mat 3275be6bf707SBarry Smith 3276be6bf707SBarry Smith Input Parameters: 32770e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3278be6bf707SBarry Smith 327915091d37SBarry Smith Level: advanced 328015091d37SBarry Smith 3281be6bf707SBarry Smith Common Usage, with SNESSolve(): 3282be6bf707SBarry Smith $ Create Jacobian matrix 3283be6bf707SBarry Smith $ Set linear terms into matrix 3284be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3285be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3286be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3287512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3288be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3289be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3290be6bf707SBarry Smith $ In your Jacobian routine 3291be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3292be6bf707SBarry Smith $ Set nonlinear terms in matrix 3293be6bf707SBarry Smith 3294be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3295be6bf707SBarry Smith $ // build linear portion of Jacobian 3296512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3297be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3298be6bf707SBarry Smith $ loop over nonlinear iterations 3299be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3300be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3301be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3302be6bf707SBarry Smith $ Solve linear system with Jacobian 3303be6bf707SBarry Smith $ endloop 3304be6bf707SBarry Smith 3305be6bf707SBarry Smith Notes: 3306be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3307512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3308be6bf707SBarry Smith calling this routine. 3309be6bf707SBarry Smith 33100c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 33110c468ba9SBarry Smith and does not allocated additional space. 33120c468ba9SBarry Smith 3313be6bf707SBarry Smith .seealso: MatRetrieveValues() 3314be6bf707SBarry Smith 3315be6bf707SBarry Smith @*/ 33167087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3317be6bf707SBarry Smith { 33184ac538c5SBarry Smith PetscErrorCode ierr; 3319be6bf707SBarry Smith 3320be6bf707SBarry Smith PetscFunctionBegin; 33210700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3322e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3323e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 33244ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3325be6bf707SBarry Smith PetscFunctionReturn(0); 3326be6bf707SBarry Smith } 3327be6bf707SBarry Smith 3328fb2e594dSBarry Smith EXTERN_C_BEGIN 33294a2ae208SSatish Balay #undef __FUNCT__ 33304a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues_SeqAIJ" 33317087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3332be6bf707SBarry Smith { 3333be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 33346849ba73SBarry Smith PetscErrorCode ierr; 3335d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3336be6bf707SBarry Smith 3337be6bf707SBarry Smith PetscFunctionBegin; 3338be6bf707SBarry Smith if (aij->nonew != 1) { 3339e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3340be6bf707SBarry Smith } 3341be6bf707SBarry Smith if (!aij->saved_values) { 3342e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3343be6bf707SBarry Smith } 3344be6bf707SBarry Smith /* copy values over */ 334587828ca2SBarry Smith ierr = PetscMemcpy(aij->a,aij->saved_values,nz*sizeof(PetscScalar));CHKERRQ(ierr); 3346be6bf707SBarry Smith PetscFunctionReturn(0); 3347be6bf707SBarry Smith } 3348fb2e594dSBarry Smith EXTERN_C_END 3349be6bf707SBarry Smith 33504a2ae208SSatish Balay #undef __FUNCT__ 33514a2ae208SSatish Balay #define __FUNCT__ "MatRetrieveValues" 3352be6bf707SBarry Smith /*@ 3353be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3354be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3355be6bf707SBarry Smith nonlinear portion. 3356be6bf707SBarry Smith 3357be6bf707SBarry Smith Collect on Mat 3358be6bf707SBarry Smith 3359be6bf707SBarry Smith Input Parameters: 3360be6bf707SBarry Smith . mat - the matrix (currently on AIJ matrices support this option) 3361be6bf707SBarry Smith 336215091d37SBarry Smith Level: advanced 336315091d37SBarry Smith 3364be6bf707SBarry Smith .seealso: MatStoreValues() 3365be6bf707SBarry Smith 3366be6bf707SBarry Smith @*/ 33677087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3368be6bf707SBarry Smith { 33694ac538c5SBarry Smith PetscErrorCode ierr; 3370be6bf707SBarry Smith 3371be6bf707SBarry Smith PetscFunctionBegin; 33720700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3373e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3374e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 33754ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3376be6bf707SBarry Smith PetscFunctionReturn(0); 3377be6bf707SBarry Smith } 3378be6bf707SBarry Smith 3379f83d6046SBarry Smith 3380be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 33814a2ae208SSatish Balay #undef __FUNCT__ 33824a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJ" 338317ab2063SBarry Smith /*@C 3384682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 33850d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 33866e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 338751c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 33882bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 338917ab2063SBarry Smith 3390db81eaa0SLois Curfman McInnes Collective on MPI_Comm 3391db81eaa0SLois Curfman McInnes 339217ab2063SBarry Smith Input Parameters: 3393db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 339417ab2063SBarry Smith . m - number of rows 339517ab2063SBarry Smith . n - number of columns 339617ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 339751c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 33982bd5e0b2SLois Curfman McInnes (possibly different for each row) or PETSC_NULL 339917ab2063SBarry Smith 340017ab2063SBarry Smith Output Parameter: 3401416022c9SBarry Smith . A - the matrix 340217ab2063SBarry Smith 3403175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3404ae1d86c5SBarry Smith MatXXXXSetPreallocation() paradgm instead of this routine directly. 3405175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3406175b88e8SBarry Smith 3407b259b22eSLois Curfman McInnes Notes: 340849a6f317SBarry Smith If nnz is given then nz is ignored 340949a6f317SBarry Smith 341017ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 341117ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 34120002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 341344cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 341417ab2063SBarry Smith 341517ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3416a40aa06bSLois Curfman McInnes Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 34173d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 34186da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 341917ab2063SBarry Smith 3420682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 34214fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3422682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 34236c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 34246c7ebb05SLois Curfman McInnes 34256c7ebb05SLois Curfman McInnes Options Database Keys: 3426698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 34279db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 342817ab2063SBarry Smith 3429027ccd11SLois Curfman McInnes Level: intermediate 3430027ccd11SLois Curfman McInnes 343136db0b34SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 343236db0b34SBarry Smith 343317ab2063SBarry Smith @*/ 34347087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 343517ab2063SBarry Smith { 3436dfbe8321SBarry Smith PetscErrorCode ierr; 34376945ee14SBarry Smith 34383a40ed3dSBarry Smith PetscFunctionBegin; 3439f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3440117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3441c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3442d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3443273d9f13SBarry Smith PetscFunctionReturn(0); 3444273d9f13SBarry Smith } 3445273d9f13SBarry Smith 34464a2ae208SSatish Balay #undef __FUNCT__ 34474a2ae208SSatish Balay #define __FUNCT__ "MatSeqAIJSetPreallocation" 3448273d9f13SBarry Smith /*@C 3449273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3450273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3451273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3452273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3453273d9f13SBarry Smith 3454273d9f13SBarry Smith Collective on MPI_Comm 3455273d9f13SBarry Smith 3456273d9f13SBarry Smith Input Parameters: 3457117016b1SBarry Smith + B - The matrix-free 3458273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3459273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 3460273d9f13SBarry Smith (possibly different for each row) or PETSC_NULL 3461273d9f13SBarry Smith 3462273d9f13SBarry Smith Notes: 346349a6f317SBarry Smith If nnz is given then nz is ignored 346449a6f317SBarry Smith 3465273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3466273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3467273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3468273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3469273d9f13SBarry Smith 3470273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 3471273d9f13SBarry Smith Set nz=PETSC_DEFAULT and nnz=PETSC_NULL for PETSc to control dynamic memory 3472273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3473273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3474273d9f13SBarry Smith 3475aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3476aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3477aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3478aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3479aa95bbe8SBarry Smith 3480a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3481a96a251dSBarry Smith entries or columns indices 3482a96a251dSBarry Smith 3483273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3484273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3485273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3486273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3487273d9f13SBarry Smith 3488273d9f13SBarry Smith Options Database Keys: 3489698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 3490698d4c6aSKris Buschelman . -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3491273d9f13SBarry Smith - -mat_aij_oneindex - Internally use indexing starting at 1 3492273d9f13SBarry Smith rather than 0. Note that when calling MatSetValues(), 3493273d9f13SBarry Smith the user still MUST index entries starting at 0! 3494273d9f13SBarry Smith 3495273d9f13SBarry Smith Level: intermediate 3496273d9f13SBarry Smith 3497aa95bbe8SBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3498273d9f13SBarry Smith 3499273d9f13SBarry Smith @*/ 35007087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3501273d9f13SBarry Smith { 35024ac538c5SBarry Smith PetscErrorCode ierr; 3503a23d5eceSKris Buschelman 3504a23d5eceSKris Buschelman PetscFunctionBegin; 3505*6ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 3506*6ba663aaSJed Brown PetscValidType(B,1); 35074ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3508a23d5eceSKris Buschelman PetscFunctionReturn(0); 3509a23d5eceSKris Buschelman } 3510a23d5eceSKris Buschelman 3511a23d5eceSKris Buschelman EXTERN_C_BEGIN 3512a23d5eceSKris Buschelman #undef __FUNCT__ 3513a23d5eceSKris Buschelman #define __FUNCT__ "MatSeqAIJSetPreallocation_SeqAIJ" 35147087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3515a23d5eceSKris Buschelman { 3516273d9f13SBarry Smith Mat_SeqAIJ *b; 3517ace3abfcSBarry Smith PetscBool skipallocation = PETSC_FALSE; 35186849ba73SBarry Smith PetscErrorCode ierr; 351997f1f81fSBarry Smith PetscInt i; 3520273d9f13SBarry Smith 3521273d9f13SBarry Smith PetscFunctionBegin; 3522d5d45c9bSBarry Smith 3523a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3524c461c341SBarry Smith skipallocation = PETSC_TRUE; 3525c461c341SBarry Smith nz = 0; 3526c461c341SBarry Smith } 3527c461c341SBarry Smith 352826283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->rmap,1);CHKERRQ(ierr); 352926283091SBarry Smith ierr = PetscLayoutSetBlockSize(B->cmap,1);CHKERRQ(ierr); 353026283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 353126283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3532899cda47SBarry Smith 3533435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 3534e32f2f54SBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %d",nz); 3535b73539f3SBarry Smith if (nnz) { 3536d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 3537e32f2f54SBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %d value %d",i,nnz[i]); 3538e32f2f54SBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %d value %d rowlength %d",i,nnz[i],B->cmap->n); 3539b73539f3SBarry Smith } 3540b73539f3SBarry Smith } 3541b73539f3SBarry Smith 3542273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3543273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3544273d9f13SBarry Smith 3545ab93d7beSBarry Smith if (!skipallocation) { 35462ee49352SLisandro Dalcin if (!b->imax) { 3547d0f46423SBarry Smith ierr = PetscMalloc2(B->rmap->n,PetscInt,&b->imax,B->rmap->n,PetscInt,&b->ilen);CHKERRQ(ierr); 3548d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,2*B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 35492ee49352SLisandro Dalcin } 3550273d9f13SBarry Smith if (!nnz) { 3551435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3552c62bd62aSJed Brown else if (nz < 0) nz = 1; 3553d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3554d0f46423SBarry Smith nz = nz*B->rmap->n; 3555273d9f13SBarry Smith } else { 3556273d9f13SBarry Smith nz = 0; 3557d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz += nnz[i];} 3558273d9f13SBarry Smith } 3559ab93d7beSBarry Smith /* b->ilen will count nonzeros in each row so far. */ 3560d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { b->ilen[i] = 0; } 3561ab93d7beSBarry Smith 3562273d9f13SBarry Smith /* allocate the matrix space */ 35632ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3564d0f46423SBarry Smith ierr = PetscMalloc3(nz,PetscScalar,&b->a,nz,PetscInt,&b->j,B->rmap->n+1,PetscInt,&b->i);CHKERRQ(ierr); 3565d0f46423SBarry Smith ierr = PetscLogObjectMemory(B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3566bfeeae90SHong Zhang b->i[0] = 0; 3567d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 35685da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 35695da197adSKris Buschelman } 3570273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3571e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3572e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3573c461c341SBarry Smith } else { 3574e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3575e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3576c461c341SBarry Smith } 3577273d9f13SBarry Smith 3578273d9f13SBarry Smith b->nz = 0; 3579273d9f13SBarry Smith b->maxnz = nz; 3580273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 3581273d9f13SBarry Smith PetscFunctionReturn(0); 3582273d9f13SBarry Smith } 3583a23d5eceSKris Buschelman EXTERN_C_END 3584273d9f13SBarry Smith 3585a1661176SMatthew Knepley #undef __FUNCT__ 3586a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR" 358758d36128SBarry Smith /*@ 3588a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 3589a1661176SMatthew Knepley 3590a1661176SMatthew Knepley Input Parameters: 3591a1661176SMatthew Knepley + B - the matrix 3592a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 3593a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 3594a1661176SMatthew Knepley - v - optional values in the matrix 3595a1661176SMatthew Knepley 3596a1661176SMatthew Knepley Level: developer 3597a1661176SMatthew Knepley 359858d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 359958d36128SBarry Smith 3600a1661176SMatthew Knepley .keywords: matrix, aij, compressed row, sparse, sequential 3601a1661176SMatthew Knepley 3602a1661176SMatthew Knepley .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), SeqAIJ 3603a1661176SMatthew Knepley @*/ 3604a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 3605a1661176SMatthew Knepley { 3606a1661176SMatthew Knepley PetscErrorCode ierr; 3607a1661176SMatthew Knepley 3608a1661176SMatthew Knepley PetscFunctionBegin; 36090700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 3610*6ba663aaSJed Brown PetscValidType(B,1); 36114ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 3612a1661176SMatthew Knepley PetscFunctionReturn(0); 3613a1661176SMatthew Knepley } 3614a1661176SMatthew Knepley 3615a1661176SMatthew Knepley EXTERN_C_BEGIN 3616a1661176SMatthew Knepley #undef __FUNCT__ 3617a1661176SMatthew Knepley #define __FUNCT__ "MatSeqAIJSetPreallocationCSR_SeqAIJ" 36187087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 3619a1661176SMatthew Knepley { 3620a1661176SMatthew Knepley PetscInt i; 3621a1661176SMatthew Knepley PetscInt m,n; 3622a1661176SMatthew Knepley PetscInt nz; 3623a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 3624a1661176SMatthew Knepley PetscScalar *values; 3625a1661176SMatthew Knepley PetscErrorCode ierr; 3626a1661176SMatthew Knepley 3627a1661176SMatthew Knepley PetscFunctionBegin; 3628a1661176SMatthew Knepley ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 3629a1661176SMatthew Knepley 363065e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 3631a1661176SMatthew Knepley ierr = PetscMalloc((m+1) * sizeof(PetscInt), &nnz);CHKERRQ(ierr); 3632a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3633b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 3634a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 363565e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 3636a1661176SMatthew Knepley nnz[i] = nz; 3637a1661176SMatthew Knepley } 3638a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 3639a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 3640a1661176SMatthew Knepley 3641a1661176SMatthew Knepley if (v) { 3642a1661176SMatthew Knepley values = (PetscScalar*) v; 3643a1661176SMatthew Knepley } else { 36440e83c824SBarry Smith ierr = PetscMalloc(nz_max*sizeof(PetscScalar), &values);CHKERRQ(ierr); 3645a1661176SMatthew Knepley ierr = PetscMemzero(values, nz_max*sizeof(PetscScalar));CHKERRQ(ierr); 3646a1661176SMatthew Knepley } 3647a1661176SMatthew Knepley 3648a1661176SMatthew Knepley for(i = 0; i < m; i++) { 3649b7940d39SSatish Balay nz = Ii[i+1] - Ii[i]; 3650b7940d39SSatish Balay ierr = MatSetValues_SeqAIJ(B, 1, &i, nz, J+Ii[i], values + (v ? Ii[i] : 0), INSERT_VALUES);CHKERRQ(ierr); 3651a1661176SMatthew Knepley } 3652a1661176SMatthew Knepley 3653a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3654a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3655a1661176SMatthew Knepley 3656a1661176SMatthew Knepley if (!v) { 3657a1661176SMatthew Knepley ierr = PetscFree(values);CHKERRQ(ierr); 3658a1661176SMatthew Knepley } 3659a1661176SMatthew Knepley PetscFunctionReturn(0); 3660a1661176SMatthew Knepley } 3661a1661176SMatthew Knepley EXTERN_C_END 3662a1661176SMatthew Knepley 3663c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 3664c6db04a5SJed Brown #include <private/petscaxpy.h> 3665170fe5c8SBarry Smith 3666170fe5c8SBarry Smith #undef __FUNCT__ 3667170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultNumeric_SeqDense_SeqAIJ" 3668170fe5c8SBarry Smith /* 3669170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 3670170fe5c8SBarry Smith 3671170fe5c8SBarry Smith n p p 3672170fe5c8SBarry Smith ( ) ( ) ( ) 3673170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 3674170fe5c8SBarry Smith ( ) ( ) ( ) 3675170fe5c8SBarry Smith 3676170fe5c8SBarry Smith */ 3677170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 3678170fe5c8SBarry Smith { 3679170fe5c8SBarry Smith PetscErrorCode ierr; 3680170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 3681170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 3682170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 36831de00fd4SBarry Smith PetscInt i,n,m,q,p; 3684170fe5c8SBarry Smith const PetscInt *ii,*idx; 3685170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 3686170fe5c8SBarry Smith PetscScalar *c,*c_q; 3687170fe5c8SBarry Smith 3688170fe5c8SBarry Smith PetscFunctionBegin; 3689d0f46423SBarry Smith m = A->rmap->n; 3690d0f46423SBarry Smith n = A->cmap->n; 3691d0f46423SBarry Smith p = B->cmap->n; 3692170fe5c8SBarry Smith a = sub_a->v; 3693170fe5c8SBarry Smith b = sub_b->a; 3694170fe5c8SBarry Smith c = sub_c->v; 3695170fe5c8SBarry Smith ierr = PetscMemzero(c,m*p*sizeof(PetscScalar));CHKERRQ(ierr); 3696170fe5c8SBarry Smith 3697170fe5c8SBarry Smith ii = sub_b->i; 3698170fe5c8SBarry Smith idx = sub_b->j; 3699170fe5c8SBarry Smith for (i=0; i<n; i++) { 3700170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 3701170fe5c8SBarry Smith while (q-->0) { 3702170fe5c8SBarry Smith c_q = c + m*(*idx); 3703170fe5c8SBarry Smith a_q = a + m*i; 3704be7314b0SBarry Smith PetscAXPY(c_q,*b,a_q,m); 3705170fe5c8SBarry Smith idx++; 3706170fe5c8SBarry Smith b++; 3707170fe5c8SBarry Smith } 3708170fe5c8SBarry Smith } 3709170fe5c8SBarry Smith PetscFunctionReturn(0); 3710170fe5c8SBarry Smith } 3711170fe5c8SBarry Smith 3712170fe5c8SBarry Smith #undef __FUNCT__ 3713170fe5c8SBarry Smith #define __FUNCT__ "MatMatMultSymbolic_SeqDense_SeqAIJ" 3714170fe5c8SBarry Smith PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat *C) 3715170fe5c8SBarry Smith { 3716170fe5c8SBarry Smith PetscErrorCode ierr; 3717d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 3718170fe5c8SBarry Smith Mat Cmat; 3719170fe5c8SBarry Smith 3720170fe5c8SBarry Smith PetscFunctionBegin; 3721e32f2f54SBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %d != B->rmap->n %d\n",A->cmap->n,B->rmap->n); 372239804f7cSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,&Cmat);CHKERRQ(ierr); 3723170fe5c8SBarry Smith ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 3724170fe5c8SBarry Smith ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 3725170fe5c8SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 3726170fe5c8SBarry Smith Cmat->assembled = PETSC_TRUE; 37278cdbd757SHong Zhang Cmat->ops->matmult = MatMatMult_SeqDense_SeqAIJ; 3728170fe5c8SBarry Smith *C = Cmat; 3729170fe5c8SBarry Smith PetscFunctionReturn(0); 3730170fe5c8SBarry Smith } 3731170fe5c8SBarry Smith 3732170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 3733170fe5c8SBarry Smith #undef __FUNCT__ 3734170fe5c8SBarry Smith #define __FUNCT__ "MatMatMult_SeqDense_SeqAIJ" 3735170fe5c8SBarry Smith PetscErrorCode MatMatMult_SeqDense_SeqAIJ(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 3736170fe5c8SBarry Smith { 3737170fe5c8SBarry Smith PetscErrorCode ierr; 3738170fe5c8SBarry Smith 3739170fe5c8SBarry Smith PetscFunctionBegin; 3740170fe5c8SBarry Smith if (scall == MAT_INITIAL_MATRIX){ 3741170fe5c8SBarry Smith ierr = MatMatMultSymbolic_SeqDense_SeqAIJ(A,B,fill,C);CHKERRQ(ierr); 3742170fe5c8SBarry Smith } 3743170fe5c8SBarry Smith ierr = MatMatMultNumeric_SeqDense_SeqAIJ(A,B,*C);CHKERRQ(ierr); 3744170fe5c8SBarry Smith PetscFunctionReturn(0); 3745170fe5c8SBarry Smith } 3746170fe5c8SBarry Smith 3747170fe5c8SBarry Smith 37480bad9183SKris Buschelman /*MC 3749fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 37500bad9183SKris Buschelman based on compressed sparse row format. 37510bad9183SKris Buschelman 37520bad9183SKris Buschelman Options Database Keys: 37530bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 37540bad9183SKris Buschelman 37550bad9183SKris Buschelman Level: beginner 37560bad9183SKris Buschelman 3757f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType 37580bad9183SKris Buschelman M*/ 37590bad9183SKris Buschelman 3760a6175056SHong Zhang EXTERN_C_BEGIN 3761b5e56a35SBarry Smith #if defined(PETSC_HAVE_PASTIX) 3762b5e56a35SBarry Smith extern PetscErrorCode MatGetFactor_seqaij_pastix(Mat,MatFactorType,Mat*); 3763b5e56a35SBarry Smith #endif 3764ce63c4c1SBarry Smith #if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128) 3765af1023dbSSatish Balay extern PetscErrorCode MatGetFactor_seqaij_essl(Mat,MatFactorType,Mat *); 3766af1023dbSSatish Balay #endif 37677087cfbeSBarry Smith extern PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 37687087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_petsc(Mat,MatFactorType,Mat*); 37697087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_bas(Mat,MatFactorType,Mat*); 37707087cfbeSBarry Smith extern PetscErrorCode MatGetFactorAvailable_seqaij_petsc(Mat,MatFactorType,PetscBool *); 3771611f576cSBarry Smith #if defined(PETSC_HAVE_MUMPS) 37727087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 3773611f576cSBarry Smith #endif 3774611f576cSBarry Smith #if defined(PETSC_HAVE_SUPERLU) 37757087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_superlu(Mat,MatFactorType,Mat*); 3776611f576cSBarry Smith #endif 3777f3c0ef26SHong Zhang #if defined(PETSC_HAVE_SUPERLU_DIST) 3778f3c0ef26SHong Zhang extern PetscErrorCode MatGetFactor_seqaij_superlu_dist(Mat,MatFactorType,Mat*); 3779f3c0ef26SHong Zhang #endif 3780611f576cSBarry Smith #if defined(PETSC_HAVE_SPOOLES) 37817087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_spooles(Mat,MatFactorType,Mat*); 3782611f576cSBarry Smith #endif 3783eb3b5408SSatish Balay #if defined(PETSC_HAVE_UMFPACK) 37847087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_umfpack(Mat,MatFactorType,Mat*); 3785eb3b5408SSatish Balay #endif 3786586621ddSJed Brown #if defined(PETSC_HAVE_CHOLMOD) 37877087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_cholmod(Mat,MatFactorType,Mat*); 3788586621ddSJed Brown #endif 3789719d5645SBarry Smith #if defined(PETSC_HAVE_LUSOL) 37907087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_lusol(Mat,MatFactorType,Mat*); 3791719d5645SBarry Smith #endif 3792b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 37937087cfbeSBarry Smith extern PetscErrorCode MatGetFactor_seqaij_matlab(Mat,MatFactorType,Mat*); 37947087cfbeSBarry Smith extern PetscErrorCode MatlabEnginePut_SeqAIJ(PetscObject,void*); 37957087cfbeSBarry Smith extern PetscErrorCode MatlabEngineGet_SeqAIJ(PetscObject,void*); 3796b3866ffcSBarry Smith #endif 379717667f90SBarry Smith EXTERN_C_END 379817667f90SBarry Smith 3799c0c8ee5eSDmitry Karpeev 380017667f90SBarry Smith EXTERN_C_BEGIN 38014a2ae208SSatish Balay #undef __FUNCT__ 38024a2ae208SSatish Balay #define __FUNCT__ "MatCreate_SeqAIJ" 38037087cfbeSBarry Smith PetscErrorCode MatCreate_SeqAIJ(Mat B) 3804273d9f13SBarry Smith { 3805273d9f13SBarry Smith Mat_SeqAIJ *b; 3806dfbe8321SBarry Smith PetscErrorCode ierr; 380738baddfdSBarry Smith PetscMPIInt size; 3808273d9f13SBarry Smith 3809273d9f13SBarry Smith PetscFunctionBegin; 38107adad957SLisandro Dalcin ierr = MPI_Comm_size(((PetscObject)B)->comm,&size);CHKERRQ(ierr); 3811e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 3812273d9f13SBarry Smith 381338f2d2fdSLisandro Dalcin ierr = PetscNewLog(B,Mat_SeqAIJ,&b);CHKERRQ(ierr); 3814b0a32e0cSBarry Smith B->data = (void*)b; 3815549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 3816416022c9SBarry Smith b->row = 0; 3817416022c9SBarry Smith b->col = 0; 381882bf6240SBarry Smith b->icol = 0; 3819b810aeb4SBarry Smith b->reallocs = 0; 382036db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 3821f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 3822416022c9SBarry Smith b->nonew = 0; 3823416022c9SBarry Smith b->diag = 0; 3824416022c9SBarry Smith b->solve_work = 0; 38252a1b7f2aSHong Zhang B->spptr = 0; 3826be6bf707SBarry Smith b->saved_values = 0; 3827d7f994e1SBarry Smith b->idiag = 0; 382871f1c65dSBarry Smith b->mdiag = 0; 382971f1c65dSBarry Smith b->ssor_work = 0; 383071f1c65dSBarry Smith b->omega = 1.0; 383171f1c65dSBarry Smith b->fshift = 0.0; 383271f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 3833bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 3834a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 3835a30b2313SHong Zhang b->xtoy = 0; 3836a30b2313SHong Zhang b->XtoY = 0; 383788e51ccdSHong Zhang B->same_nonzero = PETSC_FALSE; 383817ab2063SBarry Smith 383935d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 3840b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 3841700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_matlab_C","MatGetFactor_seqaij_matlab",MatGetFactor_seqaij_matlab);CHKERRQ(ierr); 3842b3866ffcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEnginePut_C","MatlabEnginePut_SeqAIJ",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 3843b3866ffcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"PetscMatlabEngineGet_C","MatlabEngineGet_SeqAIJ",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 3844b3866ffcSBarry Smith #endif 3845b5e56a35SBarry Smith #if defined(PETSC_HAVE_PASTIX) 3846700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_pastix_C","MatGetFactor_seqaij_pastix",MatGetFactor_seqaij_pastix);CHKERRQ(ierr); 3847b5e56a35SBarry Smith #endif 3848ce63c4c1SBarry Smith #if defined(PETSC_HAVE_ESSL) && !defined(PETSC_USE_COMPLEX) && !defined(PETSC_USE_REAL_SINGLE) && !defined(PETSC_USE_REAL___FLOAT128) 3849700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_essl_C","MatGetFactor_seqaij_essl",MatGetFactor_seqaij_essl);CHKERRQ(ierr); 3850719d5645SBarry Smith #endif 3851611f576cSBarry Smith #if defined(PETSC_HAVE_SUPERLU) 3852700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_C","MatGetFactor_seqaij_superlu",MatGetFactor_seqaij_superlu);CHKERRQ(ierr); 3853611f576cSBarry Smith #endif 3854f3c0ef26SHong Zhang #if defined(PETSC_HAVE_SUPERLU_DIST) 3855700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_superlu_dist_C","MatGetFactor_seqaij_superlu_dist",MatGetFactor_seqaij_superlu_dist);CHKERRQ(ierr); 3856f3c0ef26SHong Zhang #endif 3857611f576cSBarry Smith #if defined(PETSC_HAVE_SPOOLES) 3858700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_spooles_C","MatGetFactor_seqaij_spooles",MatGetFactor_seqaij_spooles);CHKERRQ(ierr); 3859611f576cSBarry Smith #endif 3860611f576cSBarry Smith #if defined(PETSC_HAVE_MUMPS) 3861700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_mumps_C","MatGetFactor_aij_mumps",MatGetFactor_aij_mumps);CHKERRQ(ierr); 3862611f576cSBarry Smith #endif 3863eb3b5408SSatish Balay #if defined(PETSC_HAVE_UMFPACK) 3864700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_umfpack_C","MatGetFactor_seqaij_umfpack",MatGetFactor_seqaij_umfpack);CHKERRQ(ierr); 3865eb3b5408SSatish Balay #endif 3866586621ddSJed Brown #if defined(PETSC_HAVE_CHOLMOD) 3867700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_cholmod_C","MatGetFactor_seqaij_cholmod",MatGetFactor_seqaij_cholmod);CHKERRQ(ierr); 3868586621ddSJed Brown #endif 3869719d5645SBarry Smith #if defined(PETSC_HAVE_LUSOL) 3870700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_lusol_C","MatGetFactor_seqaij_lusol",MatGetFactor_seqaij_lusol);CHKERRQ(ierr); 3871719d5645SBarry Smith #endif 3872700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_petsc_C","MatGetFactor_seqaij_petsc",MatGetFactor_seqaij_petsc);CHKERRQ(ierr); 3873700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactorAvailable_petsc_C","MatGetFactorAvailable_seqaij_petsc",MatGetFactorAvailable_seqaij_petsc);CHKERRQ(ierr); 3874700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_bas_C","MatGetFactor_seqaij_bas",MatGetFactor_seqaij_bas);CHKERRQ(ierr); 3875700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetColumnIndices_C","MatSeqAIJSetColumnIndices_SeqAIJ",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 3876700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatStoreValues_C","MatStoreValues_SeqAIJ",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 3877700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatRetrieveValues_C","MatRetrieveValues_SeqAIJ",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 3878700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqsbaij_C","MatConvert_SeqAIJ_SeqSBAIJ",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 3879700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqbaij_C","MatConvert_SeqAIJ_SeqBAIJ",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 3880700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijperm_C","MatConvert_SeqAIJ_SeqAIJPERM",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 3881700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C","MatConvert_SeqAIJ_SeqAIJCRL",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 3882700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsTranspose_C","MatIsTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 3883700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatIsHermitianTranspose_C","MatIsHermitianTranspose_SeqAIJ",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 3884700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocation_C","MatSeqAIJSetPreallocation_SeqAIJ",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 3885700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C","MatSeqAIJSetPreallocationCSR_SeqAIJ",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 3886700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatReorderForNonzeroDiagonal_C","MatReorderForNonzeroDiagonal_SeqAIJ",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 3887700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMult_seqdense_seqaij_C","MatMatMult_SeqDense_SeqAIJ",MatMatMult_SeqDense_SeqAIJ);CHKERRQ(ierr); 3888700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C","MatMatMultSymbolic_SeqDense_SeqAIJ",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr); 3889700c5bfcSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C","MatMatMultNumeric_SeqDense_SeqAIJ",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr); 38904108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 389117667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 38923a40ed3dSBarry Smith PetscFunctionReturn(0); 389317ab2063SBarry Smith } 3894273d9f13SBarry Smith EXTERN_C_END 389517ab2063SBarry Smith 3896ff34cdc8SBarry Smith #if defined(PETSC_HAVE_PTHREADCLASSES) 389751d315f7SKerry Stevens EXTERN_C_BEGIN 389851d315f7SKerry Stevens #undef __FUNCT__ 38997d6a0e61SBarry Smith #define __FUNCT__ "MatCreate_SeqAIJPThread" 39007d6a0e61SBarry Smith PetscErrorCode MatCreate_SeqAIJPThread(Mat B) 390151d315f7SKerry Stevens { 390251d315f7SKerry Stevens PetscErrorCode ierr; 390351d315f7SKerry Stevens 390451d315f7SKerry Stevens PetscFunctionBegin; 390551d315f7SKerry Stevens ierr = MatCreate_SeqAIJ(B); 390651d315f7SKerry Stevens ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 39077d6a0e61SBarry Smith B->ops->mult = MatMult_SeqAIJPThread; 39087d6a0e61SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJPTHREAD);CHKERRQ(ierr); 390951d315f7SKerry Stevens PetscFunctionReturn(0); 391051d315f7SKerry Stevens } 391151d315f7SKerry Stevens EXTERN_C_END 3912ba61063dSBarry Smith #endif 391351d315f7SKerry Stevens 39144a2ae208SSatish Balay #undef __FUNCT__ 3915b24902e0SBarry Smith #define __FUNCT__ "MatDuplicateNoCreate_SeqAIJ" 3916b24902e0SBarry Smith /* 3917b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 3918b24902e0SBarry Smith */ 3919ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 392017ab2063SBarry Smith { 3921416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 39226849ba73SBarry Smith PetscErrorCode ierr; 3923d0f46423SBarry Smith PetscInt i,m = A->rmap->n; 392417ab2063SBarry Smith 39253a40ed3dSBarry Smith PetscFunctionBegin; 3926273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 3927273d9f13SBarry Smith 3928d5f3da31SBarry Smith C->factortype = A->factortype; 3929416022c9SBarry Smith c->row = 0; 3930416022c9SBarry Smith c->col = 0; 393182bf6240SBarry Smith c->icol = 0; 39326ad4291fSHong Zhang c->reallocs = 0; 393317ab2063SBarry Smith 39346ad4291fSHong Zhang C->assembled = PETSC_TRUE; 393517ab2063SBarry Smith 3936aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 3937aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 3938eec197d1SBarry Smith 393933b91e9fSSatish Balay ierr = PetscMalloc2(m,PetscInt,&c->imax,m,PetscInt,&c->ilen);CHKERRQ(ierr); 39409518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 394117ab2063SBarry Smith for (i=0; i<m; i++) { 3942416022c9SBarry Smith c->imax[i] = a->imax[i]; 3943416022c9SBarry Smith c->ilen[i] = a->ilen[i]; 394417ab2063SBarry Smith } 394517ab2063SBarry Smith 394617ab2063SBarry Smith /* allocate the matrix space */ 3947f77e22a1SHong Zhang if (mallocmatspace){ 3948a96a251dSBarry Smith ierr = PetscMalloc3(a->i[m],PetscScalar,&c->a,a->i[m],PetscInt,&c->j,m+1,PetscInt,&c->i);CHKERRQ(ierr); 39499518dbb4SMatthew Knepley ierr = PetscLogObjectMemory(C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 3950f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 395197f1f81fSBarry Smith ierr = PetscMemcpy(c->i,a->i,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 395217ab2063SBarry Smith if (m > 0) { 395397f1f81fSBarry Smith ierr = PetscMemcpy(c->j,a->j,(a->i[m])*sizeof(PetscInt));CHKERRQ(ierr); 3954be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 3955bfeeae90SHong Zhang ierr = PetscMemcpy(c->a,a->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 3956be6bf707SBarry Smith } else { 3957bfeeae90SHong Zhang ierr = PetscMemzero(c->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 395817ab2063SBarry Smith } 395908480c60SBarry Smith } 3960f77e22a1SHong Zhang } 396117ab2063SBarry Smith 39626ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 3963416022c9SBarry Smith c->roworiented = a->roworiented; 3964416022c9SBarry Smith c->nonew = a->nonew; 3965416022c9SBarry Smith if (a->diag) { 396697f1f81fSBarry Smith ierr = PetscMalloc((m+1)*sizeof(PetscInt),&c->diag);CHKERRQ(ierr); 396752e6d16bSBarry Smith ierr = PetscLogObjectMemory(C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 396817ab2063SBarry Smith for (i=0; i<m; i++) { 3969416022c9SBarry Smith c->diag[i] = a->diag[i]; 397017ab2063SBarry Smith } 39713a40ed3dSBarry Smith } else c->diag = 0; 39726ad4291fSHong Zhang c->solve_work = 0; 39736ad4291fSHong Zhang c->saved_values = 0; 39746ad4291fSHong Zhang c->idiag = 0; 397571f1c65dSBarry Smith c->ssor_work = 0; 3976a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 3977e6b907acSBarry Smith c->free_a = PETSC_TRUE; 3978e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 39796ad4291fSHong Zhang c->xtoy = 0; 39806ad4291fSHong Zhang c->XtoY = 0; 39816ad4291fSHong Zhang 3982416022c9SBarry Smith c->nz = a->nz; 39838ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 3984273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 3985754ec7b1SSatish Balay 39866ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 39876ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 3988cd6b891eSBarry Smith c->compressedrow.check = a->compressedrow.check; 3989cd6b891eSBarry Smith if (a->compressedrow.use){ 39906ad4291fSHong Zhang i = a->compressedrow.nrows; 39910e83c824SBarry Smith ierr = PetscMalloc2(i+1,PetscInt,&c->compressedrow.i,i,PetscInt,&c->compressedrow.rindex);CHKERRQ(ierr); 39926ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.i,a->compressedrow.i,(i+1)*sizeof(PetscInt));CHKERRQ(ierr); 39936ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.rindex,a->compressedrow.rindex,i*sizeof(PetscInt));CHKERRQ(ierr); 399427ea64f8SHong Zhang } else { 399527ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 399627ea64f8SHong Zhang c->compressedrow.i = PETSC_NULL; 399727ea64f8SHong Zhang c->compressedrow.rindex = PETSC_NULL; 39986ad4291fSHong Zhang } 399988e51ccdSHong Zhang C->same_nonzero = A->same_nonzero; 40004108e4d5SBarry Smith ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 40014846f1f5SKris Buschelman 40027adad957SLisandro Dalcin ierr = PetscFListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 40033a40ed3dSBarry Smith PetscFunctionReturn(0); 400417ab2063SBarry Smith } 400517ab2063SBarry Smith 40064a2ae208SSatish Balay #undef __FUNCT__ 4007b24902e0SBarry Smith #define __FUNCT__ "MatDuplicate_SeqAIJ" 4008b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4009b24902e0SBarry Smith { 4010b24902e0SBarry Smith PetscErrorCode ierr; 4011b24902e0SBarry Smith 4012b24902e0SBarry Smith PetscFunctionBegin; 4013b24902e0SBarry Smith ierr = MatCreate(((PetscObject)A)->comm,B);CHKERRQ(ierr); 40144b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4015a54f2f98SBarry Smith ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 4016f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 4017b24902e0SBarry Smith PetscFunctionReturn(0); 4018b24902e0SBarry Smith } 4019b24902e0SBarry Smith 4020b24902e0SBarry Smith #undef __FUNCT__ 40214a2ae208SSatish Balay #define __FUNCT__ "MatLoad_SeqAIJ" 4022112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4023fbdbba38SShri Abhyankar { 4024fbdbba38SShri Abhyankar Mat_SeqAIJ *a; 4025fbdbba38SShri Abhyankar PetscErrorCode ierr; 4026fbdbba38SShri Abhyankar PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N,rows,cols; 4027fbdbba38SShri Abhyankar int fd; 4028fbdbba38SShri Abhyankar PetscMPIInt size; 4029fbdbba38SShri Abhyankar MPI_Comm comm; 4030bbead8a2SBarry Smith PetscInt bs = 1; 4031fbdbba38SShri Abhyankar 4032fbdbba38SShri Abhyankar PetscFunctionBegin; 4033fbdbba38SShri Abhyankar ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 4034fbdbba38SShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 4035fbdbba38SShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"view must have one processor"); 4036bbead8a2SBarry Smith 4037bbead8a2SBarry Smith ierr = PetscOptionsBegin(comm,PETSC_NULL,"Options for loading SEQAIJ matrix","Mat");CHKERRQ(ierr); 4038bbead8a2SBarry Smith ierr = PetscOptionsInt("-matload_block_size","Set the blocksize used to store the matrix","MatLoad",bs,&bs,PETSC_NULL);CHKERRQ(ierr); 4039bbead8a2SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 4040bbead8a2SBarry Smith 4041fbdbba38SShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 4042fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 4043fbdbba38SShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 4044fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 4045fbdbba38SShri Abhyankar 4046bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 4047fbdbba38SShri Abhyankar 4048fbdbba38SShri Abhyankar /* read in row lengths */ 4049fbdbba38SShri Abhyankar ierr = PetscMalloc(M*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 4050fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 4051fbdbba38SShri Abhyankar 4052fbdbba38SShri Abhyankar /* check if sum of rowlengths is same as nz */ 4053fbdbba38SShri Abhyankar for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 4054fbdbba38SShri Abhyankar if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. no-nonzeros = %d, sum-row-lengths = %d\n",nz,sum); 4055fbdbba38SShri Abhyankar 4056fbdbba38SShri Abhyankar /* set global size if not set already*/ 4057f501eaabSShri Abhyankar if (newMat->rmap->n < 0 && newMat->rmap->N < 0 && newMat->cmap->n < 0 && newMat->cmap->N < 0) { 4058fbdbba38SShri Abhyankar ierr = MatSetSizes(newMat,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 4059aabbc4fbSShri Abhyankar } else { 4060fbdbba38SShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 4061fbdbba38SShri Abhyankar ierr = MatGetSize(newMat,&rows,&cols);CHKERRQ(ierr); 40624c5b953cSHong Zhang if (rows < 0 && cols < 0){ /* user might provide local size instead of global size */ 40634c5b953cSHong Zhang ierr = MatGetLocalSize(newMat,&rows,&cols);CHKERRQ(ierr); 40644c5b953cSHong Zhang } 4065f501eaabSShri Abhyankar if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 4066aabbc4fbSShri Abhyankar } 4067fbdbba38SShri Abhyankar ierr = MatSeqAIJSetPreallocation_SeqAIJ(newMat,0,rowlengths);CHKERRQ(ierr); 4068fbdbba38SShri Abhyankar a = (Mat_SeqAIJ*)newMat->data; 4069fbdbba38SShri Abhyankar 4070fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->j,nz,PETSC_INT);CHKERRQ(ierr); 4071fbdbba38SShri Abhyankar 4072fbdbba38SShri Abhyankar /* read in nonzero values */ 4073fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 4074fbdbba38SShri Abhyankar 4075fbdbba38SShri Abhyankar /* set matrix "i" values */ 4076fbdbba38SShri Abhyankar a->i[0] = 0; 4077fbdbba38SShri Abhyankar for (i=1; i<= M; i++) { 4078fbdbba38SShri Abhyankar a->i[i] = a->i[i-1] + rowlengths[i-1]; 4079fbdbba38SShri Abhyankar a->ilen[i-1] = rowlengths[i-1]; 4080fbdbba38SShri Abhyankar } 4081fbdbba38SShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 4082fbdbba38SShri Abhyankar 4083fbdbba38SShri Abhyankar ierr = MatAssemblyBegin(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4084fbdbba38SShri Abhyankar ierr = MatAssemblyEnd(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4085bbead8a2SBarry Smith if (bs > 1) {ierr = MatSetBlockSize(newMat,bs);CHKERRQ(ierr);} 4086fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4087fbdbba38SShri Abhyankar } 4088fbdbba38SShri Abhyankar 4089fbdbba38SShri Abhyankar #undef __FUNCT__ 4090b9617806SBarry Smith #define __FUNCT__ "MatEqual_SeqAIJ" 4091ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 40927264ac53SSatish Balay { 40937264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data,*b = (Mat_SeqAIJ *)B->data; 4094dfbe8321SBarry Smith PetscErrorCode ierr; 4095eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4096eeffb40dSHong Zhang PetscInt k; 4097eeffb40dSHong Zhang #endif 40987264ac53SSatish Balay 40993a40ed3dSBarry Smith PetscFunctionBegin; 4100bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4101d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4102ca44d042SBarry Smith *flg = PETSC_FALSE; 4103ca44d042SBarry Smith PetscFunctionReturn(0); 4104bcd2baecSBarry Smith } 41057264ac53SSatish Balay 41067264ac53SSatish Balay /* if the a->i are the same */ 4107d0f46423SBarry Smith ierr = PetscMemcmp(a->i,b->i,(A->rmap->n+1)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4108abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 41097264ac53SSatish Balay 41107264ac53SSatish Balay /* if a->j are the same */ 411197f1f81fSBarry Smith ierr = PetscMemcmp(a->j,b->j,(a->nz)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4112abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4113bcd2baecSBarry Smith 4114bcd2baecSBarry Smith /* if a->a are the same */ 4115eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4116eeffb40dSHong Zhang for (k=0; k<a->nz; k++){ 4117eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])){ 4118eeffb40dSHong Zhang *flg = PETSC_FALSE; 41193a40ed3dSBarry Smith PetscFunctionReturn(0); 4120eeffb40dSHong Zhang } 4121eeffb40dSHong Zhang } 4122eeffb40dSHong Zhang #else 4123eeffb40dSHong Zhang ierr = PetscMemcmp(a->a,b->a,(a->nz)*sizeof(PetscScalar),flg);CHKERRQ(ierr); 4124eeffb40dSHong Zhang #endif 4125eeffb40dSHong Zhang PetscFunctionReturn(0); 41267264ac53SSatish Balay } 412736db0b34SBarry Smith 41284a2ae208SSatish Balay #undef __FUNCT__ 41294a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqAIJWithArrays" 413005869f15SSatish Balay /*@ 413136db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 413236db0b34SBarry Smith provided by the user. 413336db0b34SBarry Smith 4134c75a6043SHong Zhang Collective on MPI_Comm 413536db0b34SBarry Smith 413636db0b34SBarry Smith Input Parameters: 413736db0b34SBarry Smith + comm - must be an MPI communicator of size 1 413836db0b34SBarry Smith . m - number of rows 413936db0b34SBarry Smith . n - number of columns 414036db0b34SBarry Smith . i - row indices 414136db0b34SBarry Smith . j - column indices 414236db0b34SBarry Smith - a - matrix values 414336db0b34SBarry Smith 414436db0b34SBarry Smith Output Parameter: 414536db0b34SBarry Smith . mat - the matrix 414636db0b34SBarry Smith 414736db0b34SBarry Smith Level: intermediate 414836db0b34SBarry Smith 414936db0b34SBarry Smith Notes: 41500551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4151292fb18eSBarry Smith once the matrix is destroyed and not before 415236db0b34SBarry Smith 415336db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 415436db0b34SBarry Smith 4155bfeeae90SHong Zhang The i and j indices are 0 based 415636db0b34SBarry Smith 4157a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4158a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 4159a4552177SSatish Balay as shown: 4160a4552177SSatish Balay 4161a4552177SSatish Balay 1 0 0 4162a4552177SSatish Balay 2 0 3 4163a4552177SSatish Balay 4 5 6 4164a4552177SSatish Balay 4165a4552177SSatish Balay i = {0,1,3,6} [size = nrow+1 = 3+1] 41669985e31cSBarry Smith j = {0,0,2,0,1,2} [size = nz = 6]; values must be sorted for each row 4167a4552177SSatish Balay v = {1,2,3,4,5,6} [size = nz = 6] 4168a4552177SSatish Balay 41699985e31cSBarry Smith 41702fb0ec9aSBarry Smith .seealso: MatCreate(), MatCreateMPIAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 417136db0b34SBarry Smith 417236db0b34SBarry Smith @*/ 41737087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt* i,PetscInt*j,PetscScalar *a,Mat *mat) 417436db0b34SBarry Smith { 4175dfbe8321SBarry Smith PetscErrorCode ierr; 4176cbcfb4deSHong Zhang PetscInt ii; 417736db0b34SBarry Smith Mat_SeqAIJ *aij; 4178cbcfb4deSHong Zhang #if defined(PETSC_USE_DEBUG) 4179cbcfb4deSHong Zhang PetscInt jj; 4180cbcfb4deSHong Zhang #endif 418136db0b34SBarry Smith 418236db0b34SBarry Smith PetscFunctionBegin; 4183a96a251dSBarry Smith if (i[0]) { 4184e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 418536db0b34SBarry Smith } 4186f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4187f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4188ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4189ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4190ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 4191ab93d7beSBarry Smith ierr = PetscMalloc2(m,PetscInt,&aij->imax,m,PetscInt,&aij->ilen);CHKERRQ(ierr); 4192ab93d7beSBarry Smith 419336db0b34SBarry Smith aij->i = i; 419436db0b34SBarry Smith aij->j = j; 419536db0b34SBarry Smith aij->a = a; 419636db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 419736db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4198e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4199e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 420036db0b34SBarry Smith 420136db0b34SBarry Smith for (ii=0; ii<m; ii++) { 420236db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 42032515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 4204e32f2f54SBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %d length = %d",ii,i[ii+1] - i[ii]); 42059985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4206e32f2f54SBarry Smith if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4207e32f2f54SBarry Smith if (j[jj] == j[jj]-1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual colum %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 42089985e31cSBarry Smith } 420936db0b34SBarry Smith #endif 421036db0b34SBarry Smith } 42112515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 421236db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 4213e32f2f54SBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %d index = %d",ii,j[ii]); 4214e32f2f54SBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %d index = %d",ii,j[ii]); 421536db0b34SBarry Smith } 421636db0b34SBarry Smith #endif 421736db0b34SBarry Smith 4218b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4219b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 422036db0b34SBarry Smith PetscFunctionReturn(0); 422136db0b34SBarry Smith } 42228a0b0e6bSVictor Minden #undef __FUNCT__ 42238a0b0e6bSVictor Minden #define __FUNCT__ "MatCreateSeqAIJFromTriple" 422480ef6e79SMatthew G Knepley /*@C 4225d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 42268a0b0e6bSVictor Minden provided by the user. 42278a0b0e6bSVictor Minden 42288a0b0e6bSVictor Minden Collective on MPI_Comm 42298a0b0e6bSVictor Minden 42308a0b0e6bSVictor Minden Input Parameters: 42318a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 42328a0b0e6bSVictor Minden . m - number of rows 42338a0b0e6bSVictor Minden . n - number of columns 42348a0b0e6bSVictor Minden . i - row indices 42358a0b0e6bSVictor Minden . j - column indices 42361230e6d1SVictor Minden . a - matrix values 42371230e6d1SVictor Minden . nz - number of nonzeros 42381230e6d1SVictor Minden - idx - 0 or 1 based 42398a0b0e6bSVictor Minden 42408a0b0e6bSVictor Minden Output Parameter: 42418a0b0e6bSVictor Minden . mat - the matrix 42428a0b0e6bSVictor Minden 42438a0b0e6bSVictor Minden Level: intermediate 42448a0b0e6bSVictor Minden 42458a0b0e6bSVictor Minden Notes: 42468a0b0e6bSVictor Minden The i and j indices are 0 based 42478a0b0e6bSVictor Minden 42488a0b0e6bSVictor Minden The format which is used for the sparse matrix input, is equivalent to a 42498a0b0e6bSVictor Minden row-major ordering.. i.e for the following matrix, the input data expected is 42508a0b0e6bSVictor Minden as shown: 42518a0b0e6bSVictor Minden 42528a0b0e6bSVictor Minden 1 0 0 42538a0b0e6bSVictor Minden 2 0 3 42548a0b0e6bSVictor Minden 4 5 6 42558a0b0e6bSVictor Minden 42568a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 42578a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 42588a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 42598a0b0e6bSVictor Minden 42608a0b0e6bSVictor Minden 42618a0b0e6bSVictor Minden .seealso: MatCreate(), MatCreateMPIAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 42628a0b0e6bSVictor Minden 42638a0b0e6bSVictor Minden @*/ 42641230e6d1SVictor Minden PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt* i,PetscInt*j,PetscScalar *a,Mat *mat,PetscInt nz,PetscBool idx) 42658a0b0e6bSVictor Minden { 42668a0b0e6bSVictor Minden PetscErrorCode ierr; 4267d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 42688a0b0e6bSVictor Minden 42698a0b0e6bSVictor Minden 42708a0b0e6bSVictor Minden PetscFunctionBegin; 4271d021a1c5SVictor Minden ierr = PetscMalloc(m*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 42721230e6d1SVictor Minden ierr = PetscMemzero(nnz,m*sizeof(PetscInt));CHKERRQ(ierr); 42731230e6d1SVictor Minden for (ii = 0; ii < nz; ii++){ 42741230e6d1SVictor Minden nnz[i[ii]] += 1; 42751230e6d1SVictor Minden } 42768a0b0e6bSVictor Minden ierr = MatCreate(comm,mat);CHKERRQ(ierr); 42778a0b0e6bSVictor Minden ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 42788a0b0e6bSVictor Minden ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 42791230e6d1SVictor Minden ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr); 42801230e6d1SVictor Minden for (ii = 0; ii < nz; ii++){ 42811230e6d1SVictor Minden if (idx){ 42821230e6d1SVictor Minden row = i[ii] - 1; 42831230e6d1SVictor Minden col = j[ii] - 1; 42841230e6d1SVictor Minden } else { 42851230e6d1SVictor Minden row = i[ii]; 42861230e6d1SVictor Minden col = j[ii]; 42878a0b0e6bSVictor Minden } 42881230e6d1SVictor Minden ierr = MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr); 42898a0b0e6bSVictor Minden } 42908a0b0e6bSVictor Minden ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 42918a0b0e6bSVictor Minden ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4292d021a1c5SVictor Minden ierr = PetscFree(nnz);CHKERRQ(ierr); 42938a0b0e6bSVictor Minden PetscFunctionReturn(0); 42948a0b0e6bSVictor Minden } 429536db0b34SBarry Smith 4296cc8ba8e1SBarry Smith #undef __FUNCT__ 4297ee4f033dSBarry Smith #define __FUNCT__ "MatSetColoring_SeqAIJ" 4298dfbe8321SBarry Smith PetscErrorCode MatSetColoring_SeqAIJ(Mat A,ISColoring coloring) 4299cc8ba8e1SBarry Smith { 4300dfbe8321SBarry Smith PetscErrorCode ierr; 4301cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 430236db0b34SBarry Smith 4303cc8ba8e1SBarry Smith PetscFunctionBegin; 43048ee2e534SBarry Smith if (coloring->ctype == IS_COLORING_GLOBAL) { 4305cc8ba8e1SBarry Smith ierr = ISColoringReference(coloring);CHKERRQ(ierr); 4306cc8ba8e1SBarry Smith a->coloring = coloring; 430712c595b3SBarry Smith } else if (coloring->ctype == IS_COLORING_GHOSTED) { 430897f1f81fSBarry Smith PetscInt i,*larray; 430912c595b3SBarry Smith ISColoring ocoloring; 431008b6dcc0SBarry Smith ISColoringValue *colors; 431112c595b3SBarry Smith 431212c595b3SBarry Smith /* set coloring for diagonal portion */ 43130e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(PetscInt),&larray);CHKERRQ(ierr); 4314d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 431512c595b3SBarry Smith larray[i] = i; 431612c595b3SBarry Smith } 4317992144d0SBarry Smith ierr = ISGlobalToLocalMappingApply(A->cmap->mapping,IS_GTOLM_MASK,A->cmap->n,larray,PETSC_NULL,larray);CHKERRQ(ierr); 43180e83c824SBarry Smith ierr = PetscMalloc(A->cmap->n*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 4319d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 432012c595b3SBarry Smith colors[i] = coloring->colors[larray[i]]; 432112c595b3SBarry Smith } 432212c595b3SBarry Smith ierr = PetscFree(larray);CHKERRQ(ierr); 4323d0f46423SBarry Smith ierr = ISColoringCreate(PETSC_COMM_SELF,coloring->n,A->cmap->n,colors,&ocoloring);CHKERRQ(ierr); 432412c595b3SBarry Smith a->coloring = ocoloring; 432512c595b3SBarry Smith } 4326cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4327cc8ba8e1SBarry Smith } 4328cc8ba8e1SBarry Smith 4329dcf5cc72SBarry Smith #if defined(PETSC_HAVE_ADIC) 4330ee4f033dSBarry Smith EXTERN_C_BEGIN 4331c6db04a5SJed Brown #include <adic/ad_utils.h> 4332ee4f033dSBarry Smith EXTERN_C_END 4333cc8ba8e1SBarry Smith 4334cc8ba8e1SBarry Smith #undef __FUNCT__ 4335ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdic_SeqAIJ" 4336dfbe8321SBarry Smith PetscErrorCode MatSetValuesAdic_SeqAIJ(Mat A,void *advalues) 4337cc8ba8e1SBarry Smith { 4338cc8ba8e1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4339d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j,nlen; 43404440f671SBarry Smith PetscScalar *v = a->a,*values = ((PetscScalar*)advalues)+1; 434108b6dcc0SBarry Smith ISColoringValue *color; 4342cc8ba8e1SBarry Smith 4343cc8ba8e1SBarry Smith PetscFunctionBegin; 4344e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 43454440f671SBarry Smith nlen = PetscADGetDerivTypeSize()/sizeof(PetscScalar); 4346cc8ba8e1SBarry Smith color = a->coloring->colors; 4347cc8ba8e1SBarry Smith /* loop over rows */ 4348cc8ba8e1SBarry Smith for (i=0; i<m; i++) { 4349cc8ba8e1SBarry Smith nz = ii[i+1] - ii[i]; 4350cc8ba8e1SBarry Smith /* loop over columns putting computed value into matrix */ 4351cc8ba8e1SBarry Smith for (j=0; j<nz; j++) { 4352cc8ba8e1SBarry Smith *v++ = values[color[*jj++]]; 4353cc8ba8e1SBarry Smith } 43544440f671SBarry Smith values += nlen; /* jump to next row of derivatives */ 4355ee4f033dSBarry Smith } 4356ee4f033dSBarry Smith PetscFunctionReturn(0); 4357ee4f033dSBarry Smith } 4358ee4f033dSBarry Smith #endif 4359ee4f033dSBarry Smith 4360ee4f033dSBarry Smith #undef __FUNCT__ 4361ee4f033dSBarry Smith #define __FUNCT__ "MatSetValuesAdifor_SeqAIJ" 436297f1f81fSBarry Smith PetscErrorCode MatSetValuesAdifor_SeqAIJ(Mat A,PetscInt nl,void *advalues) 4363ee4f033dSBarry Smith { 4364ee4f033dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4365d0f46423SBarry Smith PetscInt m = A->rmap->n,*ii = a->i,*jj = a->j,nz,i,j; 436654f21887SBarry Smith MatScalar *v = a->a; 436754f21887SBarry Smith PetscScalar *values = (PetscScalar *)advalues; 436808b6dcc0SBarry Smith ISColoringValue *color; 4369ee4f033dSBarry Smith 4370ee4f033dSBarry Smith PetscFunctionBegin; 4371e32f2f54SBarry Smith if (!a->coloring) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Coloring not set for matrix"); 4372ee4f033dSBarry Smith color = a->coloring->colors; 4373ee4f033dSBarry Smith /* loop over rows */ 4374ee4f033dSBarry Smith for (i=0; i<m; i++) { 4375ee4f033dSBarry Smith nz = ii[i+1] - ii[i]; 4376ee4f033dSBarry Smith /* loop over columns putting computed value into matrix */ 4377ee4f033dSBarry Smith for (j=0; j<nz; j++) { 4378ee4f033dSBarry Smith *v++ = values[color[*jj++]]; 4379ee4f033dSBarry Smith } 4380ee4f033dSBarry Smith values += nl; /* jump to next row of derivatives */ 4381cc8ba8e1SBarry Smith } 4382cc8ba8e1SBarry Smith PetscFunctionReturn(0); 4383cc8ba8e1SBarry Smith } 438436db0b34SBarry Smith 438581824310SBarry Smith /* 438681824310SBarry Smith Special version for direct calls from Fortran 438781824310SBarry Smith */ 4388c6db04a5SJed Brown #include <private/fortranimpl.h> 438981824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 439081824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 439181824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 439281824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 439381824310SBarry Smith #endif 439481824310SBarry Smith 439581824310SBarry Smith /* Change these macros so can be used in void function */ 439681824310SBarry Smith #undef CHKERRQ 43977adad957SLisandro Dalcin #define CHKERRQ(ierr) CHKERRABORT(((PetscObject)A)->comm,ierr) 439881824310SBarry Smith #undef SETERRQ2 4399e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 440081824310SBarry Smith 440181824310SBarry Smith EXTERN_C_BEGIN 440281824310SBarry Smith #undef __FUNCT__ 440381824310SBarry Smith #define __FUNCT__ "matsetvaluesseqaij_" 44041f6cc5b2SSatish Balay void PETSC_STDCALL matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 440581824310SBarry Smith { 440681824310SBarry Smith Mat A = *AA; 440781824310SBarry Smith PetscInt m = *mm, n = *nn; 440881824310SBarry Smith InsertMode is = *isis; 440981824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 441081824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 441181824310SBarry Smith PetscInt *imax,*ai,*ailen; 441281824310SBarry Smith PetscErrorCode ierr; 441381824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 441454f21887SBarry Smith MatScalar *ap,value,*aa; 4415ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 4416ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 441781824310SBarry Smith 441881824310SBarry Smith PetscFunctionBegin; 4419d9e2c085SLisandro Dalcin ierr = MatPreallocated(A);CHKERRQ(ierr); 442081824310SBarry Smith imax = a->imax; 442181824310SBarry Smith ai = a->i; 442281824310SBarry Smith ailen = a->ilen; 442381824310SBarry Smith aj = a->j; 442481824310SBarry Smith aa = a->a; 442581824310SBarry Smith 442681824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 442781824310SBarry Smith row = im[k]; 442881824310SBarry Smith if (row < 0) continue; 442981824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4430d0f46423SBarry Smith if (row >= A->rmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 443181824310SBarry Smith #endif 443281824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 443381824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 443481824310SBarry Smith low = 0; 443581824310SBarry Smith high = nrow; 443681824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 443781824310SBarry Smith if (in[l] < 0) continue; 443881824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4439d0f46423SBarry Smith if (in[l] >= A->cmap->n) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 444081824310SBarry Smith #endif 444181824310SBarry Smith col = in[l]; 444281824310SBarry Smith if (roworiented) { 444381824310SBarry Smith value = v[l + k*n]; 444481824310SBarry Smith } else { 444581824310SBarry Smith value = v[k + l*m]; 444681824310SBarry Smith } 444781824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 444881824310SBarry Smith 444981824310SBarry Smith if (col <= lastcol) low = 0; else high = nrow; 445081824310SBarry Smith lastcol = col; 445181824310SBarry Smith while (high-low > 5) { 445281824310SBarry Smith t = (low+high)/2; 445381824310SBarry Smith if (rp[t] > col) high = t; 445481824310SBarry Smith else low = t; 445581824310SBarry Smith } 445681824310SBarry Smith for (i=low; i<high; i++) { 445781824310SBarry Smith if (rp[i] > col) break; 445881824310SBarry Smith if (rp[i] == col) { 445981824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 446081824310SBarry Smith else ap[i] = value; 446181824310SBarry Smith goto noinsert; 446281824310SBarry Smith } 446381824310SBarry Smith } 446481824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 446581824310SBarry Smith if (nonew == 1) goto noinsert; 44667adad957SLisandro Dalcin if (nonew == -1) SETERRABORT(((PetscObject)A)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 4467fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 446881824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 446981824310SBarry Smith /* shift up all the later entries in this row */ 447081824310SBarry Smith for (ii=N; ii>=i; ii--) { 447181824310SBarry Smith rp[ii+1] = rp[ii]; 447281824310SBarry Smith ap[ii+1] = ap[ii]; 447381824310SBarry Smith } 447481824310SBarry Smith rp[i] = col; 447581824310SBarry Smith ap[i] = value; 447681824310SBarry Smith noinsert:; 447781824310SBarry Smith low = i + 1; 447881824310SBarry Smith } 447981824310SBarry Smith ailen[row] = nrow; 448081824310SBarry Smith } 448181824310SBarry Smith A->same_nonzero = PETSC_FALSE; 448281824310SBarry Smith PetscFunctionReturnVoid(); 448381824310SBarry Smith } 448481824310SBarry Smith EXTERN_C_END 448562298a1eSBarry Smith 4486