1b377110cSBarry Smith 2d5d45c9bSBarry Smith /* 33369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 4d5d45c9bSBarry Smith matrix storage format. 5d5d45c9bSBarry Smith */ 63369ce9aSBarry Smith 77c4f633dSBarry Smith 8c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 9c6db04a5SJed Brown #include <petscblaslapack.h> 10c6db04a5SJed Brown #include <petscbt.h> 11af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 120716a85fSBarry Smith 134099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 144099cc6bSBarry Smith { 154099cc6bSBarry Smith PetscErrorCode ierr; 164099cc6bSBarry Smith PetscBool flg; 174099cc6bSBarry Smith char type[256]; 184099cc6bSBarry Smith 194099cc6bSBarry Smith PetscFunctionBegin; 204099cc6bSBarry Smith ierr = PetscObjectOptionsBegin((PetscObject)A); 214099cc6bSBarry Smith ierr = PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg);CHKERRQ(ierr); 224099cc6bSBarry Smith if (flg) { 234099cc6bSBarry Smith ierr = MatSeqAIJSetType(A,type);CHKERRQ(ierr); 244099cc6bSBarry Smith } 254099cc6bSBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 264099cc6bSBarry Smith PetscFunctionReturn(0); 274099cc6bSBarry Smith } 284099cc6bSBarry Smith 290716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 300716a85fSBarry Smith { 310716a85fSBarry Smith PetscErrorCode ierr; 320716a85fSBarry Smith PetscInt i,m,n; 330716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 340716a85fSBarry Smith 350716a85fSBarry Smith PetscFunctionBegin; 360716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 370716a85fSBarry Smith ierr = PetscMemzero(norms,n*sizeof(PetscReal));CHKERRQ(ierr); 380716a85fSBarry Smith if (type == NORM_2) { 390716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 400716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 
410716a85fSBarry Smith } 420716a85fSBarry Smith } else if (type == NORM_1) { 430716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 440716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 450716a85fSBarry Smith } 460716a85fSBarry Smith } else if (type == NORM_INFINITY) { 470716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 480716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 490716a85fSBarry Smith } 500716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 538f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 540716a85fSBarry Smith } 550716a85fSBarry Smith PetscFunctionReturn(0); 560716a85fSBarry Smith } 570716a85fSBarry Smith 583a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 593a062f41SBarry Smith { 603a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 613a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 623a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 633a062f41SBarry Smith PetscInt *rows; 643a062f41SBarry Smith PetscErrorCode ierr; 653a062f41SBarry Smith 663a062f41SBarry Smith PetscFunctionBegin; 673a062f41SBarry Smith for (i=0; i<m; i++) { 683a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 693a062f41SBarry Smith cnt++; 703a062f41SBarry Smith } 713a062f41SBarry Smith } 723a062f41SBarry Smith ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 733a062f41SBarry Smith cnt = 0; 743a062f41SBarry Smith for (i=0; i<m; i++) { 753a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 763a062f41SBarry Smith rows[cnt] = i; 773a062f41SBarry Smith cnt++; 783a062f41SBarry Smith } 793a062f41SBarry Smith } 803a062f41SBarry Smith ierr = 
ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is);CHKERRQ(ierr); 813a062f41SBarry Smith PetscFunctionReturn(0); 823a062f41SBarry Smith } 833a062f41SBarry Smith 84f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 856ce1633cSBarry Smith { 866ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 876ce1633cSBarry Smith const MatScalar *aa = a->a; 886ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 89b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 906ce1633cSBarry Smith PetscInt *rows; 916ce1633cSBarry Smith PetscErrorCode ierr; 926ce1633cSBarry Smith 936ce1633cSBarry Smith PetscFunctionBegin; 946ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 956ce1633cSBarry Smith diag = a->diag; 966ce1633cSBarry Smith for (i=0; i<m; i++) { 97b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 986ce1633cSBarry Smith cnt++; 996ce1633cSBarry Smith } 1006ce1633cSBarry Smith } 101785e854fSJed Brown ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 1026ce1633cSBarry Smith cnt = 0; 1036ce1633cSBarry Smith for (i=0; i<m; i++) { 104b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1056ce1633cSBarry Smith rows[cnt++] = i; 1066ce1633cSBarry Smith } 1076ce1633cSBarry Smith } 108f1f41ecbSJed Brown *nrows = cnt; 109f1f41ecbSJed Brown *zrows = rows; 110f1f41ecbSJed Brown PetscFunctionReturn(0); 111f1f41ecbSJed Brown } 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 114f1f41ecbSJed Brown { 115f1f41ecbSJed Brown PetscInt nrows,*rows; 116f1f41ecbSJed Brown PetscErrorCode ierr; 117f1f41ecbSJed Brown 118f1f41ecbSJed Brown PetscFunctionBegin; 1190298fd71SBarry Smith *zrows = NULL; 120f1f41ecbSJed Brown ierr = MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows);CHKERRQ(ierr); 121ce94432eSBarry Smith ierr = 
ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 1226ce1633cSBarry Smith PetscFunctionReturn(0); 1236ce1633cSBarry Smith } 1246ce1633cSBarry Smith 125b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 126b3a44c85SBarry Smith { 127b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 128b3a44c85SBarry Smith const MatScalar *aa; 129b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 130b3a44c85SBarry Smith const PetscInt *ii; 131b3a44c85SBarry Smith PetscInt n,i,j,*rows; 132b3a44c85SBarry Smith PetscErrorCode ierr; 133b3a44c85SBarry Smith 134b3a44c85SBarry Smith PetscFunctionBegin; 135b3a44c85SBarry Smith *keptrows = 0; 136b3a44c85SBarry Smith ii = a->i; 137b3a44c85SBarry Smith for (i=0; i<m; i++) { 138b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 139b3a44c85SBarry Smith if (!n) { 140b3a44c85SBarry Smith cnt++; 141b3a44c85SBarry Smith goto ok1; 142b3a44c85SBarry Smith } 143b3a44c85SBarry Smith aa = a->a + ii[i]; 144b3a44c85SBarry Smith for (j=0; j<n; j++) { 145b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 146b3a44c85SBarry Smith } 147b3a44c85SBarry Smith cnt++; 148b3a44c85SBarry Smith ok1:; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 151854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n-cnt,&rows);CHKERRQ(ierr); 152b3a44c85SBarry Smith cnt = 0; 153b3a44c85SBarry Smith for (i=0; i<m; i++) { 154b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 155b3a44c85SBarry Smith if (!n) continue; 156b3a44c85SBarry Smith aa = a->a + ii[i]; 157b3a44c85SBarry Smith for (j=0; j<n; j++) { 158b3a44c85SBarry Smith if (aa[j] != 0.0) { 159b3a44c85SBarry Smith rows[cnt++] = i; 160b3a44c85SBarry Smith break; 161b3a44c85SBarry Smith } 162b3a44c85SBarry Smith } 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 165b3a44c85SBarry Smith PetscFunctionReturn(0); 166b3a44c85SBarry Smith } 
167b3a44c85SBarry Smith 1687087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 16979299369SBarry Smith { 17079299369SBarry Smith PetscErrorCode ierr; 17179299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17299e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17399e65526SBarry Smith const PetscInt *diag; 17454f21887SBarry Smith MatScalar *aa = aij->a; 17599e65526SBarry Smith const PetscScalar *v; 176ace3abfcSBarry Smith PetscBool missing; 17779299369SBarry Smith 17879299369SBarry Smith PetscFunctionBegin; 17909f38230SBarry Smith if (Y->assembled) { 1800298fd71SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,NULL);CHKERRQ(ierr); 18109f38230SBarry Smith if (!missing) { 18279299369SBarry Smith diag = aij->diag; 18399e65526SBarry Smith ierr = VecGetArrayRead(D,&v);CHKERRQ(ierr); 18479299369SBarry Smith if (is == INSERT_VALUES) { 18579299369SBarry Smith for (i=0; i<m; i++) { 18679299369SBarry Smith aa[diag[i]] = v[i]; 18779299369SBarry Smith } 18879299369SBarry Smith } else { 18979299369SBarry Smith for (i=0; i<m; i++) { 19079299369SBarry Smith aa[diag[i]] += v[i]; 19179299369SBarry Smith } 19279299369SBarry Smith } 19399e65526SBarry Smith ierr = VecRestoreArrayRead(D,&v);CHKERRQ(ierr); 19479299369SBarry Smith PetscFunctionReturn(0); 19579299369SBarry Smith } 196acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 19709f38230SBarry Smith } 19809f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 19909f38230SBarry Smith PetscFunctionReturn(0); 20009f38230SBarry Smith } 20179299369SBarry Smith 2021a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 20317ab2063SBarry Smith { 204416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 205dfbe8321SBarry Smith PetscErrorCode ierr; 20697f1f81fSBarry Smith PetscInt i,ishift; 20717ab2063SBarry Smith 
2083a40ed3dSBarry Smith PetscFunctionBegin; 209d0f46423SBarry Smith *m = A->rmap->n; 2103a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 211bfeeae90SHong Zhang ishift = 0; 21253e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2132462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 214bfeeae90SHong Zhang } else if (oshift == 1) { 2151a83f524SJed Brown PetscInt *tia; 216d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2173b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 218854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n+1,&tia);CHKERRQ(ierr); 2191a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2201a83f524SJed Brown *ia = tia; 221ecc77c7aSBarry Smith if (ja) { 2221a83f524SJed Brown PetscInt *tja; 223854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&tja);CHKERRQ(ierr); 2241a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2251a83f524SJed Brown *ja = tja; 226ecc77c7aSBarry Smith } 2276945ee14SBarry Smith } else { 228ecc77c7aSBarry Smith *ia = a->i; 229ecc77c7aSBarry Smith if (ja) *ja = a->j; 230a2ce50c7SBarry Smith } 2313a40ed3dSBarry Smith PetscFunctionReturn(0); 232a2744918SBarry Smith } 233a2744918SBarry Smith 2341a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2356945ee14SBarry Smith { 236dfbe8321SBarry Smith PetscErrorCode ierr; 2376945ee14SBarry Smith 2383a40ed3dSBarry Smith PetscFunctionBegin; 2393a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 240bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 241606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 242ecc77c7aSBarry Smith if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 243bcd2baecSBarry Smith } 2443a40ed3dSBarry Smith PetscFunctionReturn(0); 
24517ab2063SBarry Smith } 24617ab2063SBarry Smith 2471a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2483b2fbd54SBarry Smith { 2493b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 250dfbe8321SBarry Smith PetscErrorCode ierr; 251d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25297f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2533b2fbd54SBarry Smith 2543a40ed3dSBarry Smith PetscFunctionBegin; 255899cda47SBarry Smith *nn = n; 2563a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2573b2fbd54SBarry Smith if (symmetric) { 2582462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 2593b2fbd54SBarry Smith } else { 2601795a4d1SJed Brown ierr = PetscCalloc1(n+1,&collengths);CHKERRQ(ierr); 261854ce69bSBarry Smith ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr); 262854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&cja);CHKERRQ(ierr); 2633b2fbd54SBarry Smith jj = a->j; 2643b2fbd54SBarry Smith for (i=0; i<nz; i++) { 265bfeeae90SHong Zhang collengths[jj[i]]++; 2663b2fbd54SBarry Smith } 2673b2fbd54SBarry Smith cia[0] = oshift; 2683b2fbd54SBarry Smith for (i=0; i<n; i++) { 2693b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2703b2fbd54SBarry Smith } 27197f1f81fSBarry Smith ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 2723b2fbd54SBarry Smith jj = a->j; 273a93ec695SBarry Smith for (row=0; row<m; row++) { 274a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 275a93ec695SBarry Smith for (i=0; i<mr; i++) { 276bfeeae90SHong Zhang col = *jj++; 2772205254eSKarl Rupp 2783b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2793b2fbd54SBarry Smith } 2803b2fbd54SBarry Smith } 281606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 
2823b2fbd54SBarry Smith *ia = cia; *ja = cja; 2833b2fbd54SBarry Smith } 2843a40ed3dSBarry Smith PetscFunctionReturn(0); 2853b2fbd54SBarry Smith } 2863b2fbd54SBarry Smith 2871a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2883b2fbd54SBarry Smith { 289dfbe8321SBarry Smith PetscErrorCode ierr; 290606d414cSSatish Balay 2913a40ed3dSBarry Smith PetscFunctionBegin; 2923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2933b2fbd54SBarry Smith 294606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 295606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 2963a40ed3dSBarry Smith PetscFunctionReturn(0); 2973b2fbd54SBarry Smith } 2983b2fbd54SBarry Smith 2997cee066cSHong Zhang /* 3007cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 302040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3037cee066cSHong Zhang */ 3047cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3057cee066cSHong Zhang { 3067cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3077cee066cSHong Zhang PetscErrorCode ierr; 3087cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 3097cee066cSHong Zhang PetscInt nz = a->i[m],row,*jj,mr,col; 3107cee066cSHong Zhang PetscInt *cspidx; 3117cee066cSHong Zhang 3127cee066cSHong Zhang PetscFunctionBegin; 3137cee066cSHong Zhang *nn = n; 3147cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 315625f6d37SHong Zhang 3161795a4d1SJed Brown ierr = 
PetscCalloc1(n+1,&collengths);CHKERRQ(ierr); 317854ce69bSBarry Smith ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr); 318854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&cja);CHKERRQ(ierr); 319854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&cspidx);CHKERRQ(ierr); 3207cee066cSHong Zhang jj = a->j; 3217cee066cSHong Zhang for (i=0; i<nz; i++) { 3227cee066cSHong Zhang collengths[jj[i]]++; 3237cee066cSHong Zhang } 3247cee066cSHong Zhang cia[0] = oshift; 3257cee066cSHong Zhang for (i=0; i<n; i++) { 3267cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3277cee066cSHong Zhang } 3287cee066cSHong Zhang ierr = PetscMemzero(collengths,n*sizeof(PetscInt));CHKERRQ(ierr); 3297cee066cSHong Zhang jj = a->j; 3307cee066cSHong Zhang for (row=0; row<m; row++) { 3317cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3327cee066cSHong Zhang for (i=0; i<mr; i++) { 3337cee066cSHong Zhang col = *jj++; 3347cee066cSHong Zhang cspidx[cia[col] + collengths[col] - oshift] = a->i[row] + i; /* index of a->j */ 3357cee066cSHong Zhang cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 3367cee066cSHong Zhang } 3377cee066cSHong Zhang } 3387cee066cSHong Zhang ierr = PetscFree(collengths);CHKERRQ(ierr); 3397cee066cSHong Zhang *ia = cia; *ja = cja; 3407cee066cSHong Zhang *spidx = cspidx; 3417cee066cSHong Zhang PetscFunctionReturn(0); 3427cee066cSHong Zhang } 3437cee066cSHong Zhang 3447cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3457cee066cSHong Zhang { 3467cee066cSHong Zhang PetscErrorCode ierr; 3477cee066cSHong Zhang 3487cee066cSHong Zhang PetscFunctionBegin; 3495243ef75SHong Zhang ierr = MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done);CHKERRQ(ierr); 3507cee066cSHong Zhang ierr = PetscFree(*spidx);CHKERRQ(ierr); 3517cee066cSHong Zhang PetscFunctionReturn(0); 3527cee066cSHong Zhang } 3537cee066cSHong 
Zhang 35487d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 35587d4246cSBarry Smith { 35687d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35787d4246cSBarry Smith PetscInt *ai = a->i; 35887d4246cSBarry Smith PetscErrorCode ierr; 35987d4246cSBarry Smith 36087d4246cSBarry Smith PetscFunctionBegin; 36187d4246cSBarry Smith ierr = PetscMemcpy(a->a+ai[row],v,(ai[row+1]-ai[row])*sizeof(PetscScalar));CHKERRQ(ierr); 36287d4246cSBarry Smith PetscFunctionReturn(0); 36387d4246cSBarry Smith } 36487d4246cSBarry Smith 365bd04181cSBarry Smith /* 366bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 367bd04181cSBarry Smith 368bd04181cSBarry Smith - a single row of values is set with each call 369bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 370bd04181cSBarry Smith - the values are always added to the matrix, not set 371bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 372bd04181cSBarry Smith 3731f763a69SBarry Smith This does NOT assume the global column indices are sorted 374bd04181cSBarry Smith 3751f763a69SBarry Smith */ 376bd04181cSBarry Smith 377af0996ceSBarry Smith #include <petsc/private/isimpl.h> 378189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 379189e4007SBarry Smith { 380189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3811f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3821f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 3831f763a69SBarry Smith PetscInt lastcol = -1; 384189e4007SBarry Smith MatScalar *ap,value,*aa = a->a; 385189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 386189e4007SBarry 
Smith 387f38dd0b8SBarry Smith row = ridx[im[0]]; 3881f763a69SBarry Smith rp = aj + ai[row]; 3891f763a69SBarry Smith ap = aa + ai[row]; 3901f763a69SBarry Smith nrow = ailen[row]; 391189e4007SBarry Smith low = 0; 392189e4007SBarry Smith high = nrow; 393189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 394189e4007SBarry Smith col = cidx[in[l]]; 395f38dd0b8SBarry Smith value = v[l]; 396189e4007SBarry Smith 397189e4007SBarry Smith if (col <= lastcol) low = 0; 398189e4007SBarry Smith else high = nrow; 399189e4007SBarry Smith lastcol = col; 400189e4007SBarry Smith while (high-low > 5) { 401189e4007SBarry Smith t = (low+high)/2; 402189e4007SBarry Smith if (rp[t] > col) high = t; 403189e4007SBarry Smith else low = t; 404189e4007SBarry Smith } 405189e4007SBarry Smith for (i=low; i<high; i++) { 406189e4007SBarry Smith if (rp[i] == col) { 4071f763a69SBarry Smith ap[i] += value; 408189e4007SBarry Smith low = i + 1; 4091f763a69SBarry Smith break; 410189e4007SBarry Smith } 411189e4007SBarry Smith } 412189e4007SBarry Smith } 413f38dd0b8SBarry Smith return 0; 414189e4007SBarry Smith } 415189e4007SBarry Smith 41697f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 41717ab2063SBarry Smith { 418416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 419e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 42097f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 4216849ba73SBarry Smith PetscErrorCode ierr; 422e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 423d8cdefa3SHong Zhang MatScalar *ap=NULL,value=0.0,*aa = a->a; 424ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 425ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 42617ab2063SBarry Smith 4273a40ed3dSBarry Smith PetscFunctionBegin; 42817ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added 
rows */ 429416022c9SBarry Smith row = im[k]; 4305ef9f2a5SBarry Smith if (row < 0) continue; 4312515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 432e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 4333b2fbd54SBarry Smith #endif 434720833daSHong Zhang rp = aj + ai[row]; 435876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 43617ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 437416022c9SBarry Smith low = 0; 438c71e6ed7SBarry Smith high = nrow; 43917ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4405ef9f2a5SBarry Smith if (in[l] < 0) continue; 4412515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 442e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 4433b2fbd54SBarry Smith #endif 444bfeeae90SHong Zhang col = in[l]; 445720833daSHong Zhang if (!A->structure_only) { 4464b0e389bSBarry Smith if (roworiented) { 4475ef9f2a5SBarry Smith value = v[l + k*n]; 448bef8e0ddSBarry Smith } else { 4494b0e389bSBarry Smith value = v[k + l*m]; 4504b0e389bSBarry Smith } 451720833daSHong Zhang } else { /* A->structure_only */ 452720833daSHong Zhang value = 1; /* avoid 'continue' below? 
*/ 453720833daSHong Zhang } 454dcd36c23SBarry Smith if ((value == 0.0 && ignorezeroentries) && (is == ADD_VALUES) && row != col) continue; 45536db0b34SBarry Smith 4562205254eSKarl Rupp if (col <= lastcol) low = 0; 4572205254eSKarl Rupp else high = nrow; 458e2ee6c50SBarry Smith lastcol = col; 459416022c9SBarry Smith while (high-low > 5) { 460416022c9SBarry Smith t = (low+high)/2; 461416022c9SBarry Smith if (rp[t] > col) high = t; 462416022c9SBarry Smith else low = t; 46317ab2063SBarry Smith } 464416022c9SBarry Smith for (i=low; i<high; i++) { 46517ab2063SBarry Smith if (rp[i] > col) break; 46617ab2063SBarry Smith if (rp[i] == col) { 467876c6284SHong Zhang if (!A->structure_only) { 468*0c0d7e18SFande Kong if (is == ADD_VALUES) { 469*0c0d7e18SFande Kong ap[i] += value; 470*0c0d7e18SFande Kong (void)PetscLogFlops(1.0); 471*0c0d7e18SFande Kong } 47217ab2063SBarry Smith else ap[i] = value; 473720833daSHong Zhang } 474e44c0bd4SBarry Smith low = i + 1; 47517ab2063SBarry Smith goto noinsert; 47617ab2063SBarry Smith } 47717ab2063SBarry Smith } 478dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 479c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 480e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 481720833daSHong Zhang if (A->structure_only) { 482876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 483720833daSHong Zhang } else { 484fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 485720833daSHong Zhang } 486c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 487416022c9SBarry Smith /* shift up all the later entries in this row */ 488416022c9SBarry Smith for (ii=N; ii>=i; ii--) { 48917ab2063SBarry Smith rp[ii+1] = rp[ii]; 490876c6284SHong Zhang if (!A->structure_only) ap[ii+1] = ap[ii]; 
491720833daSHong Zhang } 49217ab2063SBarry Smith rp[i] = col; 493876c6284SHong Zhang if (!A->structure_only) ap[i] = value; 494416022c9SBarry Smith low = i + 1; 495e56f5c9eSBarry Smith A->nonzerostate++; 496e44c0bd4SBarry Smith noinsert:; 49717ab2063SBarry Smith } 49817ab2063SBarry Smith ailen[row] = nrow; 49917ab2063SBarry Smith } 5003a40ed3dSBarry Smith PetscFunctionReturn(0); 50117ab2063SBarry Smith } 50217ab2063SBarry Smith 50381824310SBarry Smith 504a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 5057eb43aa7SLois Curfman McInnes { 5067eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 50797f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 50897f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 50954f21887SBarry Smith MatScalar *ap,*aa = a->a; 5107eb43aa7SLois Curfman McInnes 5113a40ed3dSBarry Smith PetscFunctionBegin; 5127eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 5137eb43aa7SLois Curfman McInnes row = im[k]; 514e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 515e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 516bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 5177eb43aa7SLois Curfman McInnes nrow = ailen[row]; 5187eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 519e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 520e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 521bfeeae90SHong Zhang col = in[l]; 5227eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 5237eb43aa7SLois 
Curfman McInnes while (high-low > 5) { 5247eb43aa7SLois Curfman McInnes t = (low+high)/2; 5257eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 5267eb43aa7SLois Curfman McInnes else low = t; 5277eb43aa7SLois Curfman McInnes } 5287eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 5297eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 5307eb43aa7SLois Curfman McInnes if (rp[i] == col) { 531b49de8d1SLois Curfman McInnes *v++ = ap[i]; 5327eb43aa7SLois Curfman McInnes goto finished; 5337eb43aa7SLois Curfman McInnes } 5347eb43aa7SLois Curfman McInnes } 53597e567efSBarry Smith *v++ = 0.0; 5367eb43aa7SLois Curfman McInnes finished:; 5377eb43aa7SLois Curfman McInnes } 5387eb43aa7SLois Curfman McInnes } 5393a40ed3dSBarry Smith PetscFunctionReturn(0); 5407eb43aa7SLois Curfman McInnes } 5417eb43aa7SLois Curfman McInnes 54217ab2063SBarry Smith 543dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer) 54417ab2063SBarry Smith { 545416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 5466849ba73SBarry Smith PetscErrorCode ierr; 5476f69ff64SBarry Smith PetscInt i,*col_lens; 5486f69ff64SBarry Smith int fd; 549b37d52dbSMark F. 
Adams FILE *file; 55017ab2063SBarry Smith 5513a40ed3dSBarry Smith PetscFunctionBegin; 552b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 553854ce69bSBarry Smith ierr = PetscMalloc1(4+A->rmap->n,&col_lens);CHKERRQ(ierr); 5542205254eSKarl Rupp 5550700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 556d0f46423SBarry Smith col_lens[1] = A->rmap->n; 557d0f46423SBarry Smith col_lens[2] = A->cmap->n; 558416022c9SBarry Smith col_lens[3] = a->nz; 559416022c9SBarry Smith 560416022c9SBarry Smith /* store lengths of each row and write (including header) to file */ 561d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 562416022c9SBarry Smith col_lens[4+i] = a->i[i+1] - a->i[i]; 56317ab2063SBarry Smith } 564d0f46423SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+A->rmap->n,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 565606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 566416022c9SBarry Smith 567416022c9SBarry Smith /* store column indices (zero start index) */ 5686f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 569416022c9SBarry Smith 570416022c9SBarry Smith /* store nonzero values */ 5716f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 572b37d52dbSMark F. Adams 573b37d52dbSMark F. Adams ierr = PetscViewerBinaryGetInfoPointer(viewer,&file);CHKERRQ(ierr); 574b37d52dbSMark F. Adams if (file) { 57533d57670SJed Brown fprintf(file,"-matload_block_size %d\n",(int)PetscAbs(A->rmap->bs)); 576b37d52dbSMark F. 
Adams } 5773a40ed3dSBarry Smith PetscFunctionReturn(0); 57817ab2063SBarry Smith } 579416022c9SBarry Smith 5807dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 5817dc0baabSHong Zhang { 5827dc0baabSHong Zhang PetscErrorCode ierr; 5837dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 5847dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 5857dc0baabSHong Zhang 5867dc0baabSHong Zhang PetscFunctionBegin; 5877dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 5887dc0baabSHong Zhang for (i=0; i<m; i++) { 5897dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 5907dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 5917dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D) ",a->j[k]);CHKERRQ(ierr); 5927dc0baabSHong Zhang } 5937dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 5947dc0baabSHong Zhang } 5957dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 5967dc0baabSHong Zhang PetscFunctionReturn(0); 5977dc0baabSHong Zhang } 5987dc0baabSHong Zhang 59909573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 600cd155464SBarry Smith 601dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 602416022c9SBarry Smith { 603416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 604dfbe8321SBarry Smith PetscErrorCode ierr; 60560e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 606e060cb09SBarry Smith const char *name; 607f3ef73ceSBarry Smith PetscViewerFormat format; 60817ab2063SBarry Smith 6093a40ed3dSBarry Smith PetscFunctionBegin; 6107dc0baabSHong Zhang if (A->structure_only) { 6117dc0baabSHong Zhang ierr = MatView_SeqAIJ_ASCII_structonly(A,viewer);CHKERRQ(ierr); 6127dc0baabSHong Zhang PetscFunctionReturn(0); 6137dc0baabSHong Zhang } 61443e49210SHong Zhang 615b0a32e0cSBarry Smith ierr = 
PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 61671c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 61797f1f81fSBarry Smith PetscInt nofinalvalue = 0; 61860e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 619c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 620d00d2cf4SBarry Smith nofinalvalue = 1; 621d00d2cf4SBarry Smith } 622d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 623d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 62477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 625fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 626fbfe6fa7SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,4);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 627fbfe6fa7SJed Brown #else 62877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 629fbfe6fa7SJed Brown #endif 630b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 63117ab2063SBarry Smith 63217ab2063SBarry Smith for (i=0; i<m; i++) { 63360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 634aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 635a9bf72d8SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 63617ab2063SBarry Smith #else 63760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+1,(double)a->a[j]);CHKERRQ(ierr); 63817ab2063SBarry Smith #endif 63917ab2063SBarry Smith } 64017ab2063SBarry Smith } 641d00d2cf4SBarry Smith if (nofinalvalue) { 642c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 643c337ccceSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",m,A->cmap->n,0.,0.);CHKERRQ(ierr); 
644c337ccceSJed Brown #else 645d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 646c337ccceSJed Brown #endif 647d00d2cf4SBarry Smith } 648317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 649fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 650d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 65168369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 652cd155464SBarry Smith PetscFunctionReturn(0); 653fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 654d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 65544cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 65677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 65760e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 658aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 65936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 66060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 66136db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 66260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 66336db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 66460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 6656831982aSBarry Smith } 66644cd7ae7SLois Curfman McInnes #else 66760e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) 
",a->j[j],(double)a->a[j]);CHKERRQ(ierr);} 66844cd7ae7SLois Curfman McInnes #endif 66944cd7ae7SLois Curfman McInnes } 670b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 67144cd7ae7SLois Curfman McInnes } 672d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 673fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 67497f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 675d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 676854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&sptr);CHKERRQ(ierr); 677496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 678496be53dSLois Curfman McInnes sptr[i] = nzd+1; 67960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 680496be53dSLois Curfman McInnes if (a->j[j] >= i) { 681aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 68236db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 683496be53dSLois Curfman McInnes #else 684496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 685496be53dSLois Curfman McInnes #endif 686496be53dSLois Curfman McInnes } 687496be53dSLois Curfman McInnes } 688496be53dSLois Curfman McInnes } 6892e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 69077431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 6912e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 6922205254eSKarl Rupp if (i+4<m) { 6932205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr); 6942205254eSKarl Rupp } else if (i+3<m) { 6952205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr); 6962205254eSKarl Rupp } else if (i+2<m) { 6972205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr); 
6982205254eSKarl Rupp } else if (i+1<m) { 6992205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr); 7002205254eSKarl Rupp } else if (i<m) { 7012205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr); 7022205254eSKarl Rupp } else { 7032205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr); 7042205254eSKarl Rupp } 705496be53dSLois Curfman McInnes } 706b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 707606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 708496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 70960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 71077431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 711496be53dSLois Curfman McInnes } 712b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 713496be53dSLois Curfman McInnes } 714b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 715496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 71660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 717496be53dSLois Curfman McInnes if (a->j[j] >= i) { 718aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 71936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 72060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 7216831982aSBarry Smith } 722496be53dSLois Curfman McInnes #else 72360e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j]);CHKERRQ(ierr);} 724496be53dSLois Curfman McInnes #endif 725496be53dSLois Curfman McInnes } 726496be53dSLois Curfman McInnes } 727b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 728496be53dSLois Curfman McInnes 
} 729d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 730fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 73197f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 73287828ca2SBarry Smith PetscScalar value; 73368f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 73468f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 73568f1ed48SBarry Smith 73668f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 73768f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 73868f1ed48SBarry Smith realonly = PETSC_FALSE; 73968f1ed48SBarry Smith break; 74068f1ed48SBarry Smith } 74168f1ed48SBarry Smith } 74268f1ed48SBarry Smith #endif 74302594712SBarry Smith 744d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 74502594712SBarry Smith for (i=0; i<m; i++) { 74602594712SBarry Smith jcnt = 0; 747d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 748e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 74902594712SBarry Smith value = a->a[cnt++]; 750e24b481bSBarry Smith jcnt++; 75102594712SBarry Smith } else { 75202594712SBarry Smith value = 0.0; 75302594712SBarry Smith } 754aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75568f1ed48SBarry Smith if (realonly) { 75660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value));CHKERRQ(ierr); 75768f1ed48SBarry Smith } else { 75860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value));CHKERRQ(ierr); 75968f1ed48SBarry Smith } 76002594712SBarry Smith #else 76160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value);CHKERRQ(ierr); 76202594712SBarry Smith #endif 76302594712SBarry Smith } 764b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 76502594712SBarry Smith } 766d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 7673c215bfdSMatthew 
Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 768150b93efSMatthew G. Knepley PetscInt fshift=1; 769d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 7703c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 77119303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n");CHKERRQ(ierr); 7723c215bfdSMatthew Knepley #else 77319303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n");CHKERRQ(ierr); 7743c215bfdSMatthew Knepley #endif 775d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 7763c215bfdSMatthew Knepley for (i=0; i<m; i++) { 77760e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 7783c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 779a9a0e077SKarl Rupp ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 7803c215bfdSMatthew Knepley #else 781150b93efSMatthew G. 
Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j]);CHKERRQ(ierr); 7823c215bfdSMatthew Knepley #endif 7833c215bfdSMatthew Knepley } 7843c215bfdSMatthew Knepley } 785d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 7863a40ed3dSBarry Smith } else { 787d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 788d5f3da31SBarry Smith if (A->factortype) { 78916cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 79016cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 79116cd7e1dSShri Abhyankar /* L part */ 79260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 79316cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 79416cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 79560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 79616cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 7976712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 79816cd7e1dSShri Abhyankar } else { 79960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 80016cd7e1dSShri Abhyankar } 80116cd7e1dSShri Abhyankar #else 80260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 80316cd7e1dSShri Abhyankar #endif 80416cd7e1dSShri Abhyankar } 80516cd7e1dSShri Abhyankar /* diagonal */ 80616cd7e1dSShri Abhyankar j = a->diag[i]; 80716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 80816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 80960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g 
i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 81016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8116712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])));CHKERRQ(ierr); 81216cd7e1dSShri Abhyankar } else { 81360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 81416cd7e1dSShri Abhyankar } 81516cd7e1dSShri Abhyankar #else 81660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)(1.0/a->a[j]));CHKERRQ(ierr); 81716cd7e1dSShri Abhyankar #endif 81816cd7e1dSShri Abhyankar 81916cd7e1dSShri Abhyankar /* U part */ 82060e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 82116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 82216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 82360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 82416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 82522ab088eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 82616cd7e1dSShri Abhyankar } else { 82760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 82816cd7e1dSShri Abhyankar } 82916cd7e1dSShri Abhyankar #else 83060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 83116cd7e1dSShri Abhyankar #endif 83216cd7e1dSShri Abhyankar } 83316cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 83416cd7e1dSShri Abhyankar } 83516cd7e1dSShri Abhyankar } else { 83617ab2063SBarry 
Smith for (i=0; i<m; i++) { 83777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 83860e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 839aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 84160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 84236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 84360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8443a40ed3dSBarry Smith } else { 84560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 84617ab2063SBarry Smith } 84717ab2063SBarry Smith #else 84860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 84917ab2063SBarry Smith #endif 85017ab2063SBarry Smith } 851b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 85217ab2063SBarry Smith } 85316cd7e1dSShri Abhyankar } 854d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 85517ab2063SBarry Smith } 856b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 8573a40ed3dSBarry Smith PetscFunctionReturn(0); 858416022c9SBarry Smith } 859416022c9SBarry Smith 8609804daf3SBarry Smith #include <petscdraw.h> 861dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 862416022c9SBarry Smith { 863480ef9eaSBarry Smith Mat A = (Mat) Aa; 864416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 865dfbe8321SBarry Smith PetscErrorCode ierr; 866383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 867383922c3SLisandro Dalcin int color; 868b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 
869b0a32e0cSBarry Smith PetscViewer viewer; 870f3ef73ceSBarry Smith PetscViewerFormat format; 871cddf8d76SBarry Smith 8723a40ed3dSBarry Smith PetscFunctionBegin; 873480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 874b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 875b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 876383922c3SLisandro Dalcin 877416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 8780513a670SBarry Smith 879fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 880383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 8810513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 882b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 883416022c9SBarry Smith for (i=0; i<m; i++) { 884cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 885bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 886bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 88736db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 888b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 889cddf8d76SBarry Smith } 890cddf8d76SBarry Smith } 891b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 892cddf8d76SBarry Smith for (i=0; i<m; i++) { 893cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 894bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 895bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 896cddf8d76SBarry Smith if (a->a[j] != 0.) 
continue; 897b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 898cddf8d76SBarry Smith } 899cddf8d76SBarry Smith } 900b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 901cddf8d76SBarry Smith for (i=0; i<m; i++) { 902cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 903bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 904bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 90536db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 906b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 907416022c9SBarry Smith } 908416022c9SBarry Smith } 909383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9100513a670SBarry Smith } else { 9110513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 9120513a670SBarry Smith /* first determine max of all nonzero values */ 913b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 914383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 915b0a32e0cSBarry Smith PetscDraw popup; 9160513a670SBarry Smith 9170513a670SBarry Smith for (i=0; i<nz; i++) { 9180513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 9190513a670SBarry Smith } 920383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 921b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 92245f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 923383922c3SLisandro Dalcin 924383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9250513a670SBarry Smith for (i=0; i<m; i++) { 926383922c3SLisandro Dalcin y_l = m - i - 1.0; 927383922c3SLisandro Dalcin y_r = y_l + 1.0; 928bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 929383922c3SLisandro Dalcin x_l = a->j[j]; 930383922c3SLisandro Dalcin x_r = x_l + 1.0; 931b05fc000SLisandro Dalcin color = 
PetscDrawRealToColor(PetscAbsScalar(a->a[count]),minv,maxv); 932b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 9330513a670SBarry Smith count++; 9340513a670SBarry Smith } 9350513a670SBarry Smith } 936383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9370513a670SBarry Smith } 938480ef9eaSBarry Smith PetscFunctionReturn(0); 939480ef9eaSBarry Smith } 940cddf8d76SBarry Smith 9419804daf3SBarry Smith #include <petscdraw.h> 942dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 943480ef9eaSBarry Smith { 944dfbe8321SBarry Smith PetscErrorCode ierr; 945b0a32e0cSBarry Smith PetscDraw draw; 94636db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 947ace3abfcSBarry Smith PetscBool isnull; 948480ef9eaSBarry Smith 949480ef9eaSBarry Smith PetscFunctionBegin; 950b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 951b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 952480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 953480ef9eaSBarry Smith 954d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 955480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 956b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 957832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 958b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 9590298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 960832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 9613a40ed3dSBarry Smith PetscFunctionReturn(0); 962416022c9SBarry Smith } 963416022c9SBarry Smith 964dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 965416022c9SBarry Smith { 966dfbe8321SBarry Smith PetscErrorCode ierr; 967ace3abfcSBarry Smith 
PetscBool iascii,isbinary,isdraw; 968416022c9SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 970251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 971251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 972251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 973c45a1595SBarry Smith if (iascii) { 9743a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 9750f5bd95cSBarry Smith } else if (isbinary) { 9763a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 9770f5bd95cSBarry Smith } else if (isdraw) { 9783a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 97911aeaf0aSBarry Smith } 9804108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 9813a40ed3dSBarry Smith PetscFunctionReturn(0); 98217ab2063SBarry Smith } 98319bcc07fSBarry Smith 984dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 98517ab2063SBarry Smith { 986416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 9876849ba73SBarry Smith PetscErrorCode ierr; 98897f1f81fSBarry Smith PetscInt fshift = 0,i,j,*ai = a->i,*aj = a->j,*imax = a->imax; 989d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 99054f21887SBarry Smith MatScalar *aa = a->a,*ap; 9913447b6efSHong Zhang PetscReal ratio = 0.6; 99217ab2063SBarry Smith 9933a40ed3dSBarry Smith PetscFunctionBegin; 9943a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 99517ab2063SBarry Smith 99643ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 99717ab2063SBarry Smith for (i=1; i<m; i++) { 998416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 99917ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 100094a9d846SBarry Smith rmax = 
PetscMax(rmax,ailen[i]); 100117ab2063SBarry Smith if (fshift) { 1002bfeeae90SHong Zhang ip = aj + ai[i]; 1003bfeeae90SHong Zhang ap = aa + ai[i]; 100417ab2063SBarry Smith N = ailen[i]; 100517ab2063SBarry Smith for (j=0; j<N; j++) { 100617ab2063SBarry Smith ip[j-fshift] = ip[j]; 1007876c6284SHong Zhang if (!A->structure_only) ap[j-fshift] = ap[j]; 100817ab2063SBarry Smith } 100917ab2063SBarry Smith } 101017ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 101117ab2063SBarry Smith } 101217ab2063SBarry Smith if (m) { 101317ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 101417ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 101517ab2063SBarry Smith } 10167b083b7cSBarry Smith 101717ab2063SBarry Smith /* reset ilen and imax for each row */ 10187b083b7cSBarry Smith a->nonzerorowcnt = 0; 1019396832f4SHong Zhang if (A->structure_only) { 1020396832f4SHong Zhang ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr); 1021396832f4SHong Zhang } else { /* !A->structure_only */ 102217ab2063SBarry Smith for (i=0; i<m; i++) { 102317ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 10247b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 102517ab2063SBarry Smith } 1026396832f4SHong Zhang } 1027bfeeae90SHong Zhang a->nz = ai[m]; 102865e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 102917ab2063SBarry Smith 103009f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1031d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 1032ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 1033ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 10342205254eSKarl Rupp 10358e58a170SBarry Smith A->info.mallocs += a->reallocs; 
1036dd5f02e7SSatish Balay a->reallocs = 0; 10376712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 103836db0b34SBarry Smith a->rmax = rmax; 10394e220ebcSLois Curfman McInnes 1040396832f4SHong Zhang if (!A->structure_only) { 104111e456e1SBarry Smith ierr = MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 1042396832f4SHong Zhang } 10434108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 1044acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 10453a40ed3dSBarry Smith PetscFunctionReturn(0); 104617ab2063SBarry Smith } 104717ab2063SBarry Smith 104899cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 104999cafbc1SBarry Smith { 105099cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 105199cafbc1SBarry Smith PetscInt i,nz = a->nz; 105254f21887SBarry Smith MatScalar *aa = a->a; 1053acf2f550SJed Brown PetscErrorCode ierr; 105499cafbc1SBarry Smith 105599cafbc1SBarry Smith PetscFunctionBegin; 105699cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 1057acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 105899cafbc1SBarry Smith PetscFunctionReturn(0); 105999cafbc1SBarry Smith } 106099cafbc1SBarry Smith 106199cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 106299cafbc1SBarry Smith { 106399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 106499cafbc1SBarry Smith PetscInt i,nz = a->nz; 106554f21887SBarry Smith MatScalar *aa = a->a; 1066acf2f550SJed Brown PetscErrorCode ierr; 106799cafbc1SBarry Smith 106899cafbc1SBarry Smith PetscFunctionBegin; 106999cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 1070acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 107199cafbc1SBarry Smith PetscFunctionReturn(0); 107299cafbc1SBarry Smith } 107399cafbc1SBarry Smith 1074dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 107517ab2063SBarry Smith { 
1076416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1077dfbe8321SBarry Smith PetscErrorCode ierr; 10783a40ed3dSBarry Smith 10793a40ed3dSBarry Smith PetscFunctionBegin; 1080d0f46423SBarry Smith ierr = PetscMemzero(a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 1081acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 10823a40ed3dSBarry Smith PetscFunctionReturn(0); 108317ab2063SBarry Smith } 1084416022c9SBarry Smith 1085dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 108617ab2063SBarry Smith { 1087416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1088dfbe8321SBarry Smith PetscErrorCode ierr; 1089d5d45c9bSBarry Smith 10903a40ed3dSBarry Smith PetscFunctionBegin; 1091aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1092d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 109317ab2063SBarry Smith #endif 1094e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 10956bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 10966bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 109705b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 1098d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 109905b42c5fSBarry Smith ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr); 1100846b4da1SFande Kong ierr = PetscFree(a->ipre);CHKERRQ(ierr); 110171f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 110205b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 11036bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 110405b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 11056bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 1106cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 11070b7e3e3dSHong Zhang ierr = PetscFree(a->matmult_abdense);CHKERRQ(ierr); 
1108a30b2313SHong Zhang 11094108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 1110bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 1111901853e0SKris Buschelman 1112dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 1113bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL);CHKERRQ(ierr); 1114bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr); 1115bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr); 1116bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL);CHKERRQ(ierr); 1117bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL);CHKERRQ(ierr); 1118bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL);CHKERRQ(ierr); 1119af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 1120af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL);CHKERRQ(ierr); 1121af8000cdSHong Zhang #endif 112263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 112363c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL);CHKERRQ(ierr); 11243dad0653Sstefano_zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMatMult_transpose_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 112563c07aadSStefano Zampini #endif 1126b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1127c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL);CHKERRQ(ierr); 1128c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL);CHKERRQ(ierr); 
1129bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL);CHKERRQ(ierr); 1130bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL);CHKERRQ(ierr); 1131846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL);CHKERRQ(ierr); 1132bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr); 1133bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL);CHKERRQ(ierr); 113475d48cdbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatPtAP_is_seqaij_C",NULL);CHKERRQ(ierr); 11353a40ed3dSBarry Smith PetscFunctionReturn(0); 113617ab2063SBarry Smith } 113717ab2063SBarry Smith 1138ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 113917ab2063SBarry Smith { 1140416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 11414846f1f5SKris Buschelman PetscErrorCode ierr; 11423a40ed3dSBarry Smith 11433a40ed3dSBarry Smith PetscFunctionBegin; 1144a65d3064SKris Buschelman switch (op) { 1145a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 11464e0d8c25SBarry Smith a->roworiented = flg; 1147a65d3064SKris Buschelman break; 1148a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1149a9817697SBarry Smith a->keepnonzeropattern = flg; 1150a65d3064SKris Buschelman break; 1151512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1152512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1153a65d3064SKris Buschelman break; 1154a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 11554e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1156a65d3064SKris Buschelman break; 1157a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 11584e0d8c25SBarry Smith a->nonew = (flg ? 
-2 : 0); 1159a65d3064SKris Buschelman break; 116028b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 116128b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 116228b2fa4aSMatthew Knepley break; 1163a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 11644e0d8c25SBarry Smith a->ignorezeroentries = flg; 11650df259c2SBarry Smith break; 11663d472b54SHong Zhang case MAT_SPD: 1167b1646e73SJed Brown case MAT_SYMMETRIC: 1168b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1169b1646e73SJed Brown case MAT_HERMITIAN: 1170b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1171957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 11725021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 11735021d80fSJed Brown break; 11744e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1175a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1176a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 1177290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 1178a65d3064SKris Buschelman break; 1179b87ac2d8SJed Brown case MAT_USE_INODES: 1180b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 1181b87ac2d8SJed Brown break; 1182c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1183c10200c1SHong Zhang A->submat_singleis = flg; 1184c10200c1SHong Zhang break; 1185a65d3064SKris Buschelman default: 1186e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1187a65d3064SKris Buschelman } 11884108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 11893a40ed3dSBarry Smith PetscFunctionReturn(0); 119017ab2063SBarry Smith } 119117ab2063SBarry Smith 1192dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 119317ab2063SBarry Smith { 1194416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 11956849ba73SBarry Smith PetscErrorCode ierr; 1196d3e70bfaSHong Zhang PetscInt i,j,n,*ai=a->i,*aj=a->j,nz; 119735e7444dSHong Zhang PetscScalar 
*aa=a->a,*x,zero=0.0; 119817ab2063SBarry Smith 11993a40ed3dSBarry Smith PetscFunctionBegin; 1200d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1201e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 120235e7444dSHong Zhang 1203d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1204d3e70bfaSHong Zhang PetscInt *diag=a->diag; 120535e7444dSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 12062c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 120735e7444dSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 120835e7444dSHong Zhang PetscFunctionReturn(0); 120935e7444dSHong Zhang } 121035e7444dSHong Zhang 12112dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 12121ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 121335e7444dSHong Zhang for (i=0; i<n; i++) { 121435e7444dSHong Zhang nz = ai[i+1] - ai[i]; 12152f5a7c2eSBarry Smith if (!nz) x[i] = 0.0; 121635e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 121735e7444dSHong Zhang if (aj[j] == i) { 121835e7444dSHong Zhang x[i] = aa[j]; 121917ab2063SBarry Smith break; 122017ab2063SBarry Smith } 122117ab2063SBarry Smith } 122217ab2063SBarry Smith } 12231ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 12243a40ed3dSBarry Smith PetscFunctionReturn(0); 122517ab2063SBarry Smith } 122617ab2063SBarry Smith 1227c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1228dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 122917ab2063SBarry Smith { 1230416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1231d9ca1df4SBarry Smith PetscScalar *y; 1232d9ca1df4SBarry Smith const PetscScalar *x; 1233dfbe8321SBarry Smith PetscErrorCode ierr; 1234d0f46423SBarry Smith PetscInt m = A->rmap->n; 12355c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1236d9ca1df4SBarry Smith const 
MatScalar *v; 1237a77337e4SBarry Smith PetscScalar alpha; 1238d9ca1df4SBarry Smith PetscInt n,i,j; 1239d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 12403447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1241ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 12425c897100SBarry Smith #endif 124317ab2063SBarry Smith 12443a40ed3dSBarry Smith PetscFunctionBegin; 12452e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 1246d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 12471ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 12485c897100SBarry Smith 12495c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1250bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 12515c897100SBarry Smith #else 12523447b6efSHong Zhang if (usecprow) { 12533447b6efSHong Zhang m = cprow.nrows; 12543447b6efSHong Zhang ii = cprow.i; 12557b2bb3b9SHong Zhang ridx = cprow.rindex; 12563447b6efSHong Zhang } else { 12573447b6efSHong Zhang ii = a->i; 12583447b6efSHong Zhang } 125917ab2063SBarry Smith for (i=0; i<m; i++) { 12603447b6efSHong Zhang idx = a->j + ii[i]; 12613447b6efSHong Zhang v = a->a + ii[i]; 12623447b6efSHong Zhang n = ii[i+1] - ii[i]; 12633447b6efSHong Zhang if (usecprow) { 12647b2bb3b9SHong Zhang alpha = x[ridx[i]]; 12653447b6efSHong Zhang } else { 126617ab2063SBarry Smith alpha = x[i]; 12673447b6efSHong Zhang } 126804fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 126917ab2063SBarry Smith } 12705c897100SBarry Smith #endif 1271dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1272d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 12731ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 12743a40ed3dSBarry Smith PetscFunctionReturn(0); 127517ab2063SBarry Smith } 127617ab2063SBarry Smith 1277dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 12785c897100SBarry Smith { 
1279dfbe8321SBarry Smith PetscErrorCode ierr; 12805c897100SBarry Smith 12815c897100SBarry Smith PetscFunctionBegin; 1282170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 12835c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 12845c897100SBarry Smith PetscFunctionReturn(0); 12855c897100SBarry Smith } 12865c897100SBarry Smith 1287c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 128878b84d54SShri Abhyankar 1289dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 129017ab2063SBarry Smith { 1291416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1292d9fead3dSBarry Smith PetscScalar *y; 129354f21887SBarry Smith const PetscScalar *x; 129454f21887SBarry Smith const MatScalar *aa; 1295dfbe8321SBarry Smith PetscErrorCode ierr; 1296003131ecSBarry Smith PetscInt m=A->rmap->n; 12970298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 12987b083b7cSBarry Smith PetscInt n,i; 1299362ced78SSatish Balay PetscScalar sum; 1300ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 130117ab2063SBarry Smith 1302b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 130397952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1304fee21e36SBarry Smith #endif 1305fee21e36SBarry Smith 13063a40ed3dSBarry Smith PetscFunctionBegin; 13073649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13081ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1309416022c9SBarry Smith ii = a->i; 13104eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 13114f390cb1SBarry Smith ierr = PetscMemzero(y,m*sizeof(PetscScalar));CHKERRQ(ierr); 131297952fefSHong Zhang m = a->compressedrow.nrows; 131397952fefSHong Zhang ii = a->compressedrow.i; 131497952fefSHong Zhang ridx = a->compressedrow.rindex; 131597952fefSHong Zhang for (i=0; i<m; i++) { 131697952fefSHong Zhang n = ii[i+1] - ii[i]; 131797952fefSHong Zhang aj = a->j + ii[i]; 131897952fefSHong Zhang aa = a->a + ii[i]; 131997952fefSHong 
Zhang sum = 0.0; 1320003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1321003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 132297952fefSHong Zhang y[*ridx++] = sum; 132397952fefSHong Zhang } 132497952fefSHong Zhang } else { /* do not use compressed row format */ 1325b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 13263d3eaba7SBarry Smith aj = a->j; 13273d3eaba7SBarry Smith aa = a->a; 1328b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1329b05257ddSBarry Smith #else 133017ab2063SBarry Smith for (i=0; i<m; i++) { 1331003131ecSBarry Smith n = ii[i+1] - ii[i]; 1332003131ecSBarry Smith aj = a->j + ii[i]; 1333003131ecSBarry Smith aa = a->a + ii[i]; 133417ab2063SBarry Smith sum = 0.0; 1335003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 133617ab2063SBarry Smith y[i] = sum; 133717ab2063SBarry Smith } 13388d195f9aSBarry Smith #endif 1339b05257ddSBarry Smith } 13407b083b7cSBarry Smith ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); 13413649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13421ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13433a40ed3dSBarry Smith PetscFunctionReturn(0); 134417ab2063SBarry Smith } 134517ab2063SBarry Smith 1346b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1347b434eb95SMatthew G. Knepley { 1348b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1349b434eb95SMatthew G. Knepley PetscScalar *y; 1350b434eb95SMatthew G. Knepley const PetscScalar *x; 1351b434eb95SMatthew G. Knepley const MatScalar *aa; 1352b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1353b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1354b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1355b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1356b434eb95SMatthew G. Knepley PetscScalar sum; 1357b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1358b434eb95SMatthew G. 
Knepley 1359b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1360b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1361b434eb95SMatthew G. Knepley #endif 1362b434eb95SMatthew G. Knepley 1363b434eb95SMatthew G. Knepley PetscFunctionBegin; 1364b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1365b434eb95SMatthew G. Knepley ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1366b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1367b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1368b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1369b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1370b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1371b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1372b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1373b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1374b434eb95SMatthew G. Knepley sum = 0.0; 1375b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1376b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1377b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1378b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1379b434eb95SMatthew G. Knepley } 1380b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 13813d3eaba7SBarry Smith ii = a->i; 1382b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1383b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1384b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1385b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1386b434eb95SMatthew G. Knepley sum = 0.0; 1387b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1388b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1389b434eb95SMatthew G. Knepley y[i] = sum; 1390b434eb95SMatthew G. Knepley } 1391b434eb95SMatthew G. Knepley } 1392b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 1393b434eb95SMatthew G. 
Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1394b434eb95SMatthew G. Knepley ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 1395b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1396b434eb95SMatthew G. Knepley } 1397b434eb95SMatthew G. Knepley 1398b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1399b434eb95SMatthew G. Knepley { 1400b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1401b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1402b434eb95SMatthew G. Knepley const PetscScalar *x; 1403b434eb95SMatthew G. Knepley const MatScalar *aa; 1404b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1405b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1406b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1407b434eb95SMatthew G. Knepley PetscScalar sum; 1408b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1409b434eb95SMatthew G. Knepley 1410b434eb95SMatthew G. Knepley PetscFunctionBegin; 1411b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1412d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1413b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1414b434eb95SMatthew G. Knepley if (zz != yy) { 1415b434eb95SMatthew G. Knepley ierr = PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 1416b434eb95SMatthew G. Knepley } 1417b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1418b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1419b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1420b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1421b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1422b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1423b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1424b434eb95SMatthew G. Knepley sum = y[*ridx]; 1425b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1426b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1427b434eb95SMatthew G. 
Knepley } 1428b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 14293d3eaba7SBarry Smith ii = a->i; 1430b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1431b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1432b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1433b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1434b434eb95SMatthew G. Knepley sum = y[i]; 1435b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1436b434eb95SMatthew G. Knepley z[i] = sum; 1437b434eb95SMatthew G. Knepley } 1438b434eb95SMatthew G. Knepley } 1439b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1440b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1441d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1442b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1443b434eb95SMatthew G. Knepley } 1444b434eb95SMatthew G. Knepley 1445c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1446dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 144717ab2063SBarry Smith { 1448416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1449f15663dcSBarry Smith PetscScalar *y,*z; 1450f15663dcSBarry Smith const PetscScalar *x; 145154f21887SBarry Smith const MatScalar *aa; 1452dfbe8321SBarry Smith PetscErrorCode ierr; 1453d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1454d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1455362ced78SSatish Balay PetscScalar sum; 1456ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 14579ea0dfa2SSatish Balay 14583a40ed3dSBarry Smith PetscFunctionBegin; 1459f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1460d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 14614eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14624eb6d288SHong Zhang if (zz != yy) { 14634eb6d288SHong Zhang ierr = 
PetscMemcpy(z,y,m*sizeof(PetscScalar));CHKERRQ(ierr); 14644eb6d288SHong Zhang } 146597952fefSHong Zhang m = a->compressedrow.nrows; 146697952fefSHong Zhang ii = a->compressedrow.i; 146797952fefSHong Zhang ridx = a->compressedrow.rindex; 146897952fefSHong Zhang for (i=0; i<m; i++) { 146997952fefSHong Zhang n = ii[i+1] - ii[i]; 147097952fefSHong Zhang aj = a->j + ii[i]; 147197952fefSHong Zhang aa = a->a + ii[i]; 147297952fefSHong Zhang sum = y[*ridx]; 1473f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 147497952fefSHong Zhang z[*ridx++] = sum; 147597952fefSHong Zhang } 147697952fefSHong Zhang } else { /* do not use compressed row format */ 14773d3eaba7SBarry Smith ii = a->i; 1478f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 14793d3eaba7SBarry Smith aj = a->j; 14803d3eaba7SBarry Smith aa = a->a; 1481f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1482f15663dcSBarry Smith #else 148317ab2063SBarry Smith for (i=0; i<m; i++) { 1484f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1485f15663dcSBarry Smith aj = a->j + ii[i]; 1486f15663dcSBarry Smith aa = a->a + ii[i]; 148717ab2063SBarry Smith sum = y[i]; 1488f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 148917ab2063SBarry Smith z[i] = sum; 149017ab2063SBarry Smith } 149102ab625aSSatish Balay #endif 1492f15663dcSBarry Smith } 1493dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1494f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1495d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 14963a40ed3dSBarry Smith PetscFunctionReturn(0); 149717ab2063SBarry Smith } 149817ab2063SBarry Smith 149917ab2063SBarry Smith /* 150017ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
150117ab2063SBarry Smith */ 1502dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 150317ab2063SBarry Smith { 1504416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 15056849ba73SBarry Smith PetscErrorCode ierr; 1506d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 150717ab2063SBarry Smith 15083a40ed3dSBarry Smith PetscFunctionBegin; 150909f38230SBarry Smith if (!a->diag) { 1510785e854fSJed Brown ierr = PetscMalloc1(m,&a->diag);CHKERRQ(ierr); 15113bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt));CHKERRQ(ierr); 151209f38230SBarry Smith } 1513d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 151409f38230SBarry Smith a->diag[i] = a->i[i+1]; 1515bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1516bfeeae90SHong Zhang if (a->j[j] == i) { 151709f38230SBarry Smith a->diag[i] = j; 151817ab2063SBarry Smith break; 151917ab2063SBarry Smith } 152017ab2063SBarry Smith } 152117ab2063SBarry Smith } 15223a40ed3dSBarry Smith PetscFunctionReturn(0); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 152561ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 152661ecd0c6SBarry Smith { 152761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 152861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 152961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 153061ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 153161ecd0c6SBarry Smith PetscErrorCode ierr; 153261ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 153361ecd0c6SBarry Smith 153461ecd0c6SBarry Smith PetscFunctionBegin; 153561ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 153661ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation(A,1,NULL);CHKERRQ(ierr); 153761ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 153861ecd0c6SBarry Smith PetscFunctionReturn(0); 153961ecd0c6SBarry Smith } 154061ecd0c6SBarry Smith 154161ecd0c6SBarry Smith if (a->diagonaldense) { 154261ecd0c6SBarry 
Smith cnt = 0; 154361ecd0c6SBarry Smith } else { 154461ecd0c6SBarry Smith ierr = PetscCalloc1(A->rmap->n,&mdiag);CHKERRQ(ierr); 154561ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 154661ecd0c6SBarry Smith if (diag[i] >= ii[i+1]) { 154761ecd0c6SBarry Smith cnt++; 154861ecd0c6SBarry Smith mdiag[i] = 1; 154961ecd0c6SBarry Smith } 155061ecd0c6SBarry Smith } 155161ecd0c6SBarry Smith } 155261ecd0c6SBarry Smith if (!cnt) { 155361ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 155461ecd0c6SBarry Smith } else { 1555b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1556b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 155761ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 155861ecd0c6SBarry Smith 155961ecd0c6SBarry Smith a->a = NULL; 156061ecd0c6SBarry Smith a->j = NULL; 156161ecd0c6SBarry Smith a->i = NULL; 156261ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 156361ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 156461ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 1565447d62f5SStefano Zampini a->imax[i] = PetscMin(a->imax[i],A->cmap->n); 156661ecd0c6SBarry Smith } 156761ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax);CHKERRQ(ierr); 156861ecd0c6SBarry Smith 156961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 157061ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 157161ecd0c6SBarry Smith ierr = MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES);CHKERRQ(ierr); 1572447d62f5SStefano Zampini if (i < A->cmap->n) { 157361ecd0c6SBarry Smith ierr = MatSetValue(A,i,i,v,ADD_VALUES);CHKERRQ(ierr); 157461ecd0c6SBarry Smith } 1575447d62f5SStefano Zampini } 157661ecd0c6SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 157761ecd0c6SBarry Smith ierr 
= MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 157861ecd0c6SBarry Smith if (singlemalloc) { 157961ecd0c6SBarry Smith ierr = PetscFree3(olda,oldj,oldi);CHKERRQ(ierr); 158061ecd0c6SBarry Smith } else { 158161ecd0c6SBarry Smith if (free_a) {ierr = PetscFree(olda);CHKERRQ(ierr);} 158261ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldj);CHKERRQ(ierr);} 158361ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldi);CHKERRQ(ierr);} 158461ecd0c6SBarry Smith } 158561ecd0c6SBarry Smith } 158661ecd0c6SBarry Smith ierr = PetscFree(mdiag);CHKERRQ(ierr); 158761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 158861ecd0c6SBarry Smith PetscFunctionReturn(0); 158961ecd0c6SBarry Smith } 159061ecd0c6SBarry Smith 1591be5855fcSBarry Smith /* 1592be5855fcSBarry Smith Checks for missing diagonals 1593be5855fcSBarry Smith */ 1594ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1595be5855fcSBarry Smith { 1596be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 15977734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1598994fe344SLisandro Dalcin PetscErrorCode ierr; 1599be5855fcSBarry Smith 1600be5855fcSBarry Smith PetscFunctionBegin; 160109f38230SBarry Smith *missing = PETSC_FALSE; 16027734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 160309f38230SBarry Smith *missing = PETSC_TRUE; 160409f38230SBarry Smith if (d) *d = 0; 1605994fe344SLisandro Dalcin ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr); 160609f38230SBarry Smith } else { 1607f1e2ffcdSBarry Smith diag = a->diag; 1608d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 16097734d3b5SMatthew G. 
Knepley if (diag[i] >= ii[i+1]) { 161009f38230SBarry Smith *missing = PETSC_TRUE; 161109f38230SBarry Smith if (d) *d = i; 1612994fe344SLisandro Dalcin ierr = PetscInfo1(A,"Matrix is missing diagonal number %D\n",i);CHKERRQ(ierr); 1613358d2f5dSShri Abhyankar break; 161409f38230SBarry Smith } 1615be5855fcSBarry Smith } 1616be5855fcSBarry Smith } 1617be5855fcSBarry Smith PetscFunctionReturn(0); 1618be5855fcSBarry Smith } 1619be5855fcSBarry Smith 16200da83c2eSBarry Smith #include <petscblaslapack.h> 16210da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 16220da83c2eSBarry Smith 16230da83c2eSBarry Smith /* 16240da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 16250da83c2eSBarry Smith */ 16260da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 16270da83c2eSBarry Smith { 16280da83c2eSBarry Smith PetscErrorCode ierr; 16290da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 16300da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 16310da83c2eSBarry Smith const PetscReal shift = 0.0; 16320da83c2eSBarry Smith PetscInt ipvt[5]; 16330da83c2eSBarry Smith PetscScalar work[25],*v_work; 16340da83c2eSBarry Smith 16350da83c2eSBarry Smith PetscFunctionBegin; 16360da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 16370da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 16380da83c2eSBarry Smith if (ncnt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %D doesn't match number matrix rows %D",ncnt,n); 16390da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 16400da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 16410da83c2eSBarry Smith } 16420da83c2eSBarry Smith ierr = PetscMalloc1(bsizemax,&indx);CHKERRQ(ierr); 16430da83c2eSBarry Smith if (bsizemax > 7) { 16440da83c2eSBarry Smith ierr = 
PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots);CHKERRQ(ierr); 16450da83c2eSBarry Smith } 16460da83c2eSBarry Smith ncnt = 0; 16470da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 16480da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 16490da83c2eSBarry Smith ierr = MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag);CHKERRQ(ierr); 16500da83c2eSBarry Smith switch (bsizes[i]) { 16510da83c2eSBarry Smith case 1: 16520da83c2eSBarry Smith *diag = 1.0/(*diag); 16530da83c2eSBarry Smith break; 16540da83c2eSBarry Smith case 2: 16550da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16570da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 16580da83c2eSBarry Smith break; 16590da83c2eSBarry Smith case 3: 16600da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16620da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 16630da83c2eSBarry Smith break; 16640da83c2eSBarry Smith case 4: 16650da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16670da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 16680da83c2eSBarry Smith break; 16690da83c2eSBarry Smith case 5: 16700da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16720da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 16730da83c2eSBarry 
Smith break; 16740da83c2eSBarry Smith case 6: 16750da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16760da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16770da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 16780da83c2eSBarry Smith break; 16790da83c2eSBarry Smith case 7: 16800da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16810da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16820da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 16830da83c2eSBarry Smith break; 16840da83c2eSBarry Smith default: 16850da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 16860da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 16870da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bsizes[i]);CHKERRQ(ierr); 16880da83c2eSBarry Smith } 16890da83c2eSBarry Smith ncnt += bsizes[i]; 16900da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 16910da83c2eSBarry Smith } 16920da83c2eSBarry Smith if (bsizemax > 7) { 16930da83c2eSBarry Smith ierr = PetscFree2(v_work,v_pivots);CHKERRQ(ierr); 16940da83c2eSBarry Smith } 16950da83c2eSBarry Smith ierr = PetscFree(indx);CHKERRQ(ierr); 16960da83c2eSBarry Smith PetscFunctionReturn(0); 16970da83c2eSBarry Smith } 16980da83c2eSBarry Smith 1699422a814eSBarry Smith /* 1700422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1701422a814eSBarry Smith */ 17027087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 170371f1c65dSBarry Smith { 170471f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 170571f1c65dSBarry 
Smith PetscErrorCode ierr; 1706d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 170754f21887SBarry Smith MatScalar *v = a->a; 170854f21887SBarry Smith PetscScalar *idiag,*mdiag; 170971f1c65dSBarry Smith 171071f1c65dSBarry Smith PetscFunctionBegin; 171171f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 171271f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 171371f1c65dSBarry Smith diag = a->diag; 171471f1c65dSBarry Smith if (!a->idiag) { 1715dcca6d9dSJed Brown ierr = PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work);CHKERRQ(ierr); 17163bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 171771f1c65dSBarry Smith v = a->a; 171871f1c65dSBarry Smith } 171971f1c65dSBarry Smith mdiag = a->mdiag; 172071f1c65dSBarry Smith idiag = a->idiag; 172171f1c65dSBarry Smith 1722422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 172371f1c65dSBarry Smith for (i=0; i<m; i++) { 172471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1725899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1726899639b0SHong Zhang if (PetscRealPart(fshift)) { 1727899639b0SHong Zhang ierr = PetscInfo1(A,"Zero diagonal on row %D\n",i);CHKERRQ(ierr); 17287b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17297b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 17307b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 1731a6fa060aSHong Zhang } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 1732899639b0SHong Zhang } 173371f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 173471f1c65dSBarry Smith } 173571f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 173671f1c65dSBarry Smith } else { 173771f1c65dSBarry Smith for (i=0; i<m; i++) { 173871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 173971f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 174071f1c65dSBarry Smith } 1741dc0b31edSSatish Balay ierr = 
PetscLogFlops(2.0*m);CHKERRQ(ierr); 174271f1c65dSBarry Smith } 174371f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 174471f1c65dSBarry Smith PetscFunctionReturn(0); 174571f1c65dSBarry Smith } 174671f1c65dSBarry Smith 1747c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 174841f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 174917ab2063SBarry Smith { 1750416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1751e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 17523d3eaba7SBarry Smith const MatScalar *v,*idiag=0,*mdiag; 175354f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1754dfbe8321SBarry Smith PetscErrorCode ierr; 17553d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 175697f1f81fSBarry Smith const PetscInt *idx,*diag; 175717ab2063SBarry Smith 17583a40ed3dSBarry Smith PetscFunctionBegin; 1759b965ef7fSBarry Smith its = its*lits; 176091723122SBarry Smith 176171f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 176271f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 176371f1c65dSBarry Smith a->fshift = fshift; 176471f1c65dSBarry Smith a->omega = omega; 1765ed480e8bSBarry Smith 176671f1c65dSBarry Smith diag = a->diag; 176771f1c65dSBarry Smith t = a->ssor_work; 1768ed480e8bSBarry Smith idiag = a->idiag; 176971f1c65dSBarry Smith mdiag = a->mdiag; 1770ed480e8bSBarry Smith 17711ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 17723649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 1773ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 177417ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 177517ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1776ed480e8bSBarry Smith bs = b; 177717ab2063SBarry 
Smith for (i=0; i<m; i++) { 177871f1c65dSBarry Smith d = fshift + mdiag[i]; 1779416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1780ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1781ed480e8bSBarry Smith v = a->a + diag[i] + 1; 178217ab2063SBarry Smith sum = b[i]*d/omega; 1783003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 178417ab2063SBarry Smith x[i] = sum; 178517ab2063SBarry Smith } 17861ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 17873649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1788efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 17893a40ed3dSBarry Smith PetscFunctionReturn(0); 179017ab2063SBarry Smith } 1791c783ea89SBarry Smith 17922205254eSKarl Rupp if (flag == SOR_APPLY_LOWER) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 17932205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 179417ab2063SBarry Smith /* Let A = L + U + D; where L is lower trianglar, 1795887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 179617ab2063SBarry Smith 179717ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 179817ab2063SBarry Smith 1799887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 
180017ab2063SBarry Smith */ 180117ab2063SBarry Smith scale = (2.0/omega) - 1.0; 180217ab2063SBarry Smith 180317ab2063SBarry Smith /* x = (E + U)^{-1} b */ 180417ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1805416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1806ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1807ed480e8bSBarry Smith v = a->a + diag[i] + 1; 180817ab2063SBarry Smith sum = b[i]; 1809e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1810ed480e8bSBarry Smith x[i] = sum*idiag[i]; 181117ab2063SBarry Smith } 181217ab2063SBarry Smith 181317ab2063SBarry Smith /* t = b - (2*E - D)x */ 1814416022c9SBarry Smith v = a->a; 18152205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 181617ab2063SBarry Smith 181717ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1818ed480e8bSBarry Smith ts = t; 1819416022c9SBarry Smith diag = a->diag; 182017ab2063SBarry Smith for (i=0; i<m; i++) { 1821416022c9SBarry Smith n = diag[i] - a->i[i]; 1822ed480e8bSBarry Smith idx = a->j + a->i[i]; 1823ed480e8bSBarry Smith v = a->a + a->i[i]; 182417ab2063SBarry Smith sum = t[i]; 1825003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1826ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1827733d66baSBarry Smith /* x = x + t */ 1828733d66baSBarry Smith x[i] += t[i]; 182917ab2063SBarry Smith } 183017ab2063SBarry Smith 1831dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 18321ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 18333649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 18343a40ed3dSBarry Smith PetscFunctionReturn(0); 183517ab2063SBarry Smith } 183617ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 183717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 183817ab2063SBarry Smith for (i=0; i<m; i++) { 1839416022c9SBarry Smith n = diag[i] - a->i[i]; 1840ed480e8bSBarry Smith idx = a->j + a->i[i]; 1841ed480e8bSBarry Smith v = a->a + a->i[i]; 
184217ab2063SBarry Smith sum = b[i]; 1843e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 18445c99c7daSBarry Smith t[i] = sum; 1845ed480e8bSBarry Smith x[i] = sum*idiag[i]; 184617ab2063SBarry Smith } 18475c99c7daSBarry Smith xb = t; 1848efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 18493a40ed3dSBarry Smith } else xb = b; 185017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 185117ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1852416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1853ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1854ed480e8bSBarry Smith v = a->a + diag[i] + 1; 185517ab2063SBarry Smith sum = xb[i]; 1856e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 18575c99c7daSBarry Smith if (xb == b) { 1858ed480e8bSBarry Smith x[i] = sum*idiag[i]; 18595c99c7daSBarry Smith } else { 1860b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 186117ab2063SBarry Smith } 18625c99c7daSBarry Smith } 1863b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 186417ab2063SBarry Smith } 186517ab2063SBarry Smith its--; 186617ab2063SBarry Smith } 186717ab2063SBarry Smith while (its--) { 186817ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 186917ab2063SBarry Smith for (i=0; i<m; i++) { 1870b19a5dc2SMark Adams /* lower */ 1871b19a5dc2SMark Adams n = diag[i] - a->i[i]; 1872ed480e8bSBarry Smith idx = a->j + a->i[i]; 1873ed480e8bSBarry Smith v = a->a + a->i[i]; 187417ab2063SBarry Smith sum = b[i]; 1875e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1876b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 1877b19a5dc2SMark Adams /* upper */ 1878b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1879b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1880b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1881b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 
1882b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 188317ab2063SBarry Smith } 1884b19a5dc2SMark Adams xb = t; 18859f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1886b19a5dc2SMark Adams } else xb = b; 188717ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 188817ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1889b19a5dc2SMark Adams sum = xb[i]; 1890b19a5dc2SMark Adams if (xb == b) { 1891b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 1892416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1893ed480e8bSBarry Smith idx = a->j + a->i[i]; 1894ed480e8bSBarry Smith v = a->a + a->i[i]; 1895e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1896ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 1897b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 1898b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1899b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1900b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1901b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 1902b19a5dc2SMark Adams x[i] = (1. 
- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 190317ab2063SBarry Smith } 1904b19a5dc2SMark Adams } 1905b19a5dc2SMark Adams if (xb == b) { 19069f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1907b19a5dc2SMark Adams } else { 1908b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 1909b19a5dc2SMark Adams } 191017ab2063SBarry Smith } 191117ab2063SBarry Smith } 19121ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19133649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1914365a8a9eSBarry Smith PetscFunctionReturn(0); 191517ab2063SBarry Smith } 191617ab2063SBarry Smith 19172af78befSBarry Smith 1918dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 191917ab2063SBarry Smith { 1920416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 19214e220ebcSLois Curfman McInnes 19223a40ed3dSBarry Smith PetscFunctionBegin; 19234e220ebcSLois Curfman McInnes info->block_size = 1.0; 19244e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 19254e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 19264e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 19274e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 19288e58a170SBarry Smith info->mallocs = (double)A->info.mallocs; 19297adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 1930d5f3da31SBarry Smith if (A->factortype) { 19314e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 19324e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 19334e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 19344e220ebcSLois Curfman McInnes } else { 19354e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 19364e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 19374e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 19384e220ebcSLois Curfman 
McInnes } 19393a40ed3dSBarry Smith PetscFunctionReturn(0); 194017ab2063SBarry Smith } 194117ab2063SBarry Smith 19422b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 194317ab2063SBarry Smith { 1944416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1945c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 19466849ba73SBarry Smith PetscErrorCode ierr; 194797b48c8fSBarry Smith const PetscScalar *xx; 194897b48c8fSBarry Smith PetscScalar *bb; 1949c7da8527SEric Chamberland PetscInt d = 0; 195017ab2063SBarry Smith 19513a40ed3dSBarry Smith PetscFunctionBegin; 195297b48c8fSBarry Smith if (x && b) { 195397b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 195497b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 195597b48c8fSBarry Smith for (i=0; i<N; i++) { 195697b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1957447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 195897b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 195997b48c8fSBarry Smith } 196097b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 196197b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 196297b48c8fSBarry Smith } 196397b48c8fSBarry Smith 1964a9817697SBarry Smith if (a->keepnonzeropattern) { 1965f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1966e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1967bfeeae90SHong Zhang ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 1968f1e2ffcdSBarry Smith } 1969f4df32b1SMatthew Knepley if (diag != 0.0) { 1970c7da8527SEric Chamberland for (i=0; i<N; i++) { 1971c7da8527SEric Chamberland d = rows[i]; 1972447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 1973c7da8527SEric Chamberland if (a->diag[d] >= 
a->i[d+1]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %D",d); 1974c7da8527SEric Chamberland } 1975f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 1976447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 1977f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 1978f1e2ffcdSBarry Smith } 1979f1e2ffcdSBarry Smith } 1980f1e2ffcdSBarry Smith } else { 1981f4df32b1SMatthew Knepley if (diag != 0.0) { 198217ab2063SBarry Smith for (i=0; i<N; i++) { 1983e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 19847ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 1985447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 1986447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 1987447d62f5SStefano Zampini } else { 1988416022c9SBarry Smith a->ilen[rows[i]] = 1; 1989f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 1990bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 1991447d62f5SStefano Zampini } 1992447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 1993f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 199417ab2063SBarry Smith } 199517ab2063SBarry Smith } 19963a40ed3dSBarry Smith } else { 199717ab2063SBarry Smith for (i=0; i<N; i++) { 1998e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 1999416022c9SBarry Smith a->ilen[rows[i]] = 0; 200017ab2063SBarry Smith } 200117ab2063SBarry Smith } 2002e56f5c9eSBarry Smith A->nonzerostate++; 2003f1e2ffcdSBarry Smith } 20044099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20053a40ed3dSBarry Smith PetscFunctionReturn(0); 200617ab2063SBarry Smith } 200717ab2063SBarry Smith 20086e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt 
rows[],PetscScalar diag,Vec x,Vec b) 20096e169961SBarry Smith { 20106e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 20116e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 20126e169961SBarry Smith PetscErrorCode ierr; 20132b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 20146e169961SBarry Smith const PetscScalar *xx; 20156e169961SBarry Smith PetscScalar *bb; 20166e169961SBarry Smith 20176e169961SBarry Smith PetscFunctionBegin; 20186e169961SBarry Smith if (x && b) { 20196e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 20206e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 20212b40b63fSBarry Smith vecs = PETSC_TRUE; 20226e169961SBarry Smith } 20231795a4d1SJed Brown ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr); 20246e169961SBarry Smith for (i=0; i<N; i++) { 20256e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 20266e169961SBarry Smith ierr = PetscMemzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]*sizeof(PetscScalar));CHKERRQ(ierr); 20272205254eSKarl Rupp 20286e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 20296e169961SBarry Smith } 20306e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 20316e169961SBarry Smith if (!zeroed[i]) { 20326e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 20334cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 20342b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 20356e169961SBarry Smith a->a[j] = 0.0; 20366e169961SBarry Smith } 20376e169961SBarry Smith } 20384cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 20396e169961SBarry Smith } 20406e169961SBarry Smith if (x && b) { 20416e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 20426e169961SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 20436e169961SBarry Smith } 20446e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 
20456e169961SBarry Smith if (diag != 0.0) { 20466e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 20471d5a398dSstefano_zampini if (missing) { 20481d5a398dSstefano_zampini for (i=0; i<N; i++) { 20494cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 20504cf107fdSStefano Zampini if (a->nonew && rows[i] >= d) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D (%D)",d,rows[i]); 20511d5a398dSstefano_zampini ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 20521d5a398dSstefano_zampini } 20531d5a398dSstefano_zampini } else { 20546e169961SBarry Smith for (i=0; i<N; i++) { 20556e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 20566e169961SBarry Smith } 20576e169961SBarry Smith } 20581d5a398dSstefano_zampini } 20594099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20606e169961SBarry Smith PetscFunctionReturn(0); 20616e169961SBarry Smith } 20626e169961SBarry Smith 2063a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 206417ab2063SBarry Smith { 2065416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 206697f1f81fSBarry Smith PetscInt *itmp; 206717ab2063SBarry Smith 20683a40ed3dSBarry Smith PetscFunctionBegin; 2069e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 207017ab2063SBarry Smith 2071416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 2072bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 207317ab2063SBarry Smith if (idx) { 2074bfeeae90SHong Zhang itmp = a->j + a->i[row]; 207526fbe8dcSKarl Rupp if (*nz) *idx = itmp; 207617ab2063SBarry Smith else *idx = 0; 207717ab2063SBarry Smith } 20783a40ed3dSBarry Smith PetscFunctionReturn(0); 207917ab2063SBarry Smith } 208017ab2063SBarry Smith 2081bfeeae90SHong Zhang /* remove this function? 
*/ 2082a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 208317ab2063SBarry Smith { 20843a40ed3dSBarry Smith PetscFunctionBegin; 20853a40ed3dSBarry Smith PetscFunctionReturn(0); 208617ab2063SBarry Smith } 208717ab2063SBarry Smith 2088dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 208917ab2063SBarry Smith { 2090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 209154f21887SBarry Smith MatScalar *v = a->a; 209236db0b34SBarry Smith PetscReal sum = 0.0; 20936849ba73SBarry Smith PetscErrorCode ierr; 209497f1f81fSBarry Smith PetscInt i,j; 209517ab2063SBarry Smith 20963a40ed3dSBarry Smith PetscFunctionBegin; 209717ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2098570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2099570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 2100570b7f6dSBarry Smith *nrm = BLASnrm2_(&nz,v,&one); 2101570b7f6dSBarry Smith #else 2102416022c9SBarry Smith for (i=0; i<a->nz; i++) { 210336db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 210417ab2063SBarry Smith } 21058f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2106570b7f6dSBarry Smith #endif 210751f70360SJed Brown ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 21083a40ed3dSBarry Smith } else if (type == NORM_1) { 210936db0b34SBarry Smith PetscReal *tmp; 211097f1f81fSBarry Smith PetscInt *jj = a->j; 21111795a4d1SJed Brown ierr = PetscCalloc1(A->cmap->n+1,&tmp);CHKERRQ(ierr); 2112064f8208SBarry Smith *nrm = 0.0; 2113416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2114bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 211517ab2063SBarry Smith } 2116d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2117064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 211817ab2063SBarry Smith } 2119606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 212051f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 21213a40ed3dSBarry Smith } 
else if (type == NORM_INFINITY) { 2122064f8208SBarry Smith *nrm = 0.0; 2123d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 2124bfeeae90SHong Zhang v = a->a + a->i[j]; 212517ab2063SBarry Smith sum = 0.0; 2126416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 2127cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 212817ab2063SBarry Smith } 2129064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 213017ab2063SBarry Smith } 213151f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 2132f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 21333a40ed3dSBarry Smith PetscFunctionReturn(0); 213417ab2063SBarry Smith } 213517ab2063SBarry Smith 21364e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? */ 21374e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 21384e938277SHong Zhang { 21394e938277SHong Zhang PetscErrorCode ierr; 21404e938277SHong Zhang PetscInt i,j,anzj; 21414e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 21424e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 21434e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 21444e938277SHong Zhang 21454e938277SHong Zhang PetscFunctionBegin; 21464e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 2147854ce69bSBarry Smith ierr = PetscCalloc1(an+1,&ati);CHKERRQ(ierr); 2148785e854fSJed Brown ierr = PetscMalloc1(ai[am],&atj);CHKERRQ(ierr); 2149785e854fSJed Brown ierr = PetscMalloc1(an,&atfill);CHKERRQ(ierr); 21504e938277SHong Zhang 21514e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 21524e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 215326fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 21544e938277SHong Zhang /* Form ati for csr format of A^T. 
*/ 215526fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 21564e938277SHong Zhang 21574e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 21584e938277SHong Zhang ierr = PetscMemcpy(atfill,ati,an*sizeof(PetscInt));CHKERRQ(ierr); 21594e938277SHong Zhang 21604e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 21614e938277SHong Zhang for (i=0;i<am;i++) { 21624e938277SHong Zhang anzj = ai[i+1] - ai[i]; 21634e938277SHong Zhang for (j=0;j<anzj;j++) { 21644e938277SHong Zhang atj[atfill[*aj]] = i; 21654e938277SHong Zhang atfill[*aj++] += 1; 21664e938277SHong Zhang } 21674e938277SHong Zhang } 21684e938277SHong Zhang 21694e938277SHong Zhang /* Clean up temporary space and complete requests. */ 21704e938277SHong Zhang ierr = PetscFree(atfill);CHKERRQ(ierr); 2171ce94432eSBarry Smith ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B);CHKERRQ(ierr); 217233d57670SJed Brown ierr = MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs));CHKERRQ(ierr); 2173a2f3521dSMark F. 
Adams 21744e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 21754e938277SHong Zhang b->free_a = PETSC_FALSE; 21764e938277SHong Zhang b->free_ij = PETSC_TRUE; 21774e938277SHong Zhang b->nonew = 0; 21784e938277SHong Zhang PetscFunctionReturn(0); 21794e938277SHong Zhang } 21804e938277SHong Zhang 21817087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2182cd0d46ebSvictorle { 21833d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 218454f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 218554f21887SBarry Smith MatScalar *va,*vb; 21866849ba73SBarry Smith PetscErrorCode ierr; 218797f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2188cd0d46ebSvictorle 2189cd0d46ebSvictorle PetscFunctionBegin; 2190cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 2191cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 21925485867bSBarry Smith if (ma!=nb || na!=mb) { 21935485867bSBarry Smith *f = PETSC_FALSE; 21945485867bSBarry Smith PetscFunctionReturn(0); 21955485867bSBarry Smith } 2196cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2197cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 2198cd0d46ebSvictorle va = aij->a; vb = bij->a; 2199785e854fSJed Brown ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2200785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 2201cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2202cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2203cd0d46ebSvictorle 2204cd0d46ebSvictorle *f = PETSC_TRUE; 2205cd0d46ebSvictorle for (i=0; i<ma; i++) { 2206cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 220797f1f81fSBarry Smith PetscInt idc,idr; 22085485867bSBarry Smith PetscScalar vc,vr; 2209cd0d46ebSvictorle /* column/row index/value */ 22105485867bSBarry Smith idc = adx[aptr[i]]; 22115485867bSBarry Smith idr = bdx[bptr[idc]]; 22125485867bSBarry Smith vc = va[aptr[i]]; 22135485867bSBarry Smith vr = vb[bptr[idc]]; 22145485867bSBarry Smith if 
(i!=idr || PetscAbsScalar(vc-vr) > tol) { 22155485867bSBarry Smith *f = PETSC_FALSE; 22165485867bSBarry Smith goto done; 2217cd0d46ebSvictorle } else { 22185485867bSBarry Smith aptr[i]++; 22195485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2220cd0d46ebSvictorle } 2221cd0d46ebSvictorle } 2222cd0d46ebSvictorle } 2223cd0d46ebSvictorle done: 2224cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 22253aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 2226cd0d46ebSvictorle PetscFunctionReturn(0); 2227cd0d46ebSvictorle } 2228cd0d46ebSvictorle 22297087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 22301cbb95d3SBarry Smith { 22313d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 223254f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 223354f21887SBarry Smith MatScalar *va,*vb; 22341cbb95d3SBarry Smith PetscErrorCode ierr; 22351cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 22361cbb95d3SBarry Smith 22371cbb95d3SBarry Smith PetscFunctionBegin; 22381cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 22391cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 22401cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 22411cbb95d3SBarry Smith *f = PETSC_FALSE; 22421cbb95d3SBarry Smith PetscFunctionReturn(0); 22431cbb95d3SBarry Smith } 22441cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 22451cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 22461cbb95d3SBarry Smith va = aij->a; vb = bij->a; 2247785e854fSJed Brown ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2248785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 22491cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 22501cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 22511cbb95d3SBarry Smith 22521cbb95d3SBarry Smith *f = PETSC_TRUE; 22531cbb95d3SBarry Smith for (i=0; i<ma; i++) { 22541cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 22551cbb95d3SBarry Smith PetscInt 
idc,idr; 22561cbb95d3SBarry Smith PetscScalar vc,vr; 22571cbb95d3SBarry Smith /* column/row index/value */ 22581cbb95d3SBarry Smith idc = adx[aptr[i]]; 22591cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 22601cbb95d3SBarry Smith vc = va[aptr[i]]; 22611cbb95d3SBarry Smith vr = vb[bptr[idc]]; 22621cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 22631cbb95d3SBarry Smith *f = PETSC_FALSE; 22641cbb95d3SBarry Smith goto done; 22651cbb95d3SBarry Smith } else { 22661cbb95d3SBarry Smith aptr[i]++; 22671cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 22681cbb95d3SBarry Smith } 22691cbb95d3SBarry Smith } 22701cbb95d3SBarry Smith } 22711cbb95d3SBarry Smith done: 22721cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 22731cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 22741cbb95d3SBarry Smith PetscFunctionReturn(0); 22751cbb95d3SBarry Smith } 22761cbb95d3SBarry Smith 2277ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 22789e29f15eSvictorle { 2279dfbe8321SBarry Smith PetscErrorCode ierr; 22806e111a19SKarl Rupp 22819e29f15eSvictorle PetscFunctionBegin; 22825485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 22839e29f15eSvictorle PetscFunctionReturn(0); 22849e29f15eSvictorle } 22859e29f15eSvictorle 2286ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 22871cbb95d3SBarry Smith { 22881cbb95d3SBarry Smith PetscErrorCode ierr; 22896e111a19SKarl Rupp 22901cbb95d3SBarry Smith PetscFunctionBegin; 22911cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 22921cbb95d3SBarry Smith PetscFunctionReturn(0); 22931cbb95d3SBarry Smith } 22941cbb95d3SBarry Smith 2295dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 229617ab2063SBarry Smith { 2297416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2298fff8e43fSBarry Smith const PetscScalar *l,*r; 2299fff8e43fSBarry Smith 
PetscScalar x; 230054f21887SBarry Smith MatScalar *v; 2301dfbe8321SBarry Smith PetscErrorCode ierr; 2302fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2303fff8e43fSBarry Smith const PetscInt *jj; 230417ab2063SBarry Smith 23053a40ed3dSBarry Smith PetscFunctionBegin; 230617ab2063SBarry Smith if (ll) { 23073ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 23083ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2309e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2310e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 2311fff8e43fSBarry Smith ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 2312416022c9SBarry Smith v = a->a; 231317ab2063SBarry Smith for (i=0; i<m; i++) { 231417ab2063SBarry Smith x = l[i]; 2315416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 23162205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 231717ab2063SBarry Smith } 2318fff8e43fSBarry Smith ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 2319efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 232017ab2063SBarry Smith } 232117ab2063SBarry Smith if (rr) { 2322e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2323e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 2324fff8e43fSBarry Smith ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 2325416022c9SBarry Smith v = a->a; jj = a->j; 23262205254eSKarl Rupp for (i=0; i<nz; i++) (*v++) *= r[*jj++]; 2327fff8e43fSBarry Smith ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 2328efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 232917ab2063SBarry Smith } 2330acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 23313a40ed3dSBarry Smith PetscFunctionReturn(0); 233217ab2063SBarry Smith } 233317ab2063SBarry Smith 23347dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS 
isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 233517ab2063SBarry Smith { 2336db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 23376849ba73SBarry Smith PetscErrorCode ierr; 2338d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 233997f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 23405d0c19d7SBarry Smith const PetscInt *irow,*icol; 23415d0c19d7SBarry Smith PetscInt nrows,ncols; 234297f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 234354f21887SBarry Smith MatScalar *a_new,*mat_a; 2344416022c9SBarry Smith Mat C; 2345cdc6f3adSToby Isaac PetscBool stride; 234617ab2063SBarry Smith 23473a40ed3dSBarry Smith PetscFunctionBegin; 234899141d43SSatish Balay 234917ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2350b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2351b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 235217ab2063SBarry Smith 2353251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2354ff718158SBarry Smith if (stride) { 2355ff718158SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 2356ff718158SBarry Smith } else { 2357ff718158SBarry Smith first = 0; 2358ff718158SBarry Smith step = 0; 2359ff718158SBarry Smith } 2360fee21e36SBarry Smith if (stride && step == 1) { 236102834360SBarry Smith /* special case of contiguous rows */ 2362dcca6d9dSJed Brown ierr = PetscMalloc2(nrows,&lens,nrows,&starts);CHKERRQ(ierr); 236302834360SBarry Smith /* loop over new rows determining lens and starting points */ 236402834360SBarry Smith for (i=0; i<nrows; i++) { 2365bfeeae90SHong Zhang kstart = ai[irow[i]]; 2366a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2367a91a9bebSLisandro Dalcin starts[i] = kstart; 236802834360SBarry Smith for (k=kstart; k<kend; k++) { 2369bfeeae90SHong Zhang if (aj[k] >= first) { 
237002834360SBarry Smith starts[i] = k; 237102834360SBarry Smith break; 237202834360SBarry Smith } 237302834360SBarry Smith } 2374a2744918SBarry Smith sum = 0; 237502834360SBarry Smith while (k < kend) { 2376bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2377a2744918SBarry Smith sum++; 237802834360SBarry Smith } 2379a2744918SBarry Smith lens[i] = sum; 238002834360SBarry Smith } 238102834360SBarry Smith /* create submatrix */ 2382cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 238397f1f81fSBarry Smith PetscInt n_cols,n_rows; 238408480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2385e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2386d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 238708480c60SBarry Smith C = *B; 23883a40ed3dSBarry Smith } else { 23893bef6203SJed Brown PetscInt rbs,cbs; 2390ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2391f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 23923bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 23933bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 23943bef6203SJed Brown ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 23957adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2396ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 239708480c60SBarry Smith } 2398db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2399db02288aSLois Curfman McInnes 240002834360SBarry Smith /* loop over rows inserting into submatrix */ 2401db02288aSLois Curfman McInnes a_new = c->a; 2402db02288aSLois Curfman McInnes j_new = c->j; 2403db02288aSLois Curfman McInnes i_new = c->i; 2404bfeeae90SHong Zhang 240502834360SBarry Smith for (i=0; i<nrows; i++) { 2406a2744918SBarry Smith ii = starts[i]; 
2407a2744918SBarry Smith lensi = lens[i]; 2408a2744918SBarry Smith for (k=0; k<lensi; k++) { 2409a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 241002834360SBarry Smith } 241187828ca2SBarry Smith ierr = PetscMemcpy(a_new,a->a + starts[i],lensi*sizeof(PetscScalar));CHKERRQ(ierr); 2412a2744918SBarry Smith a_new += lensi; 2413a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2414a2744918SBarry Smith c->ilen[i] = lensi; 241502834360SBarry Smith } 24160e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 24173a40ed3dSBarry Smith } else { 241802834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 24191795a4d1SJed Brown ierr = PetscCalloc1(oldcols,&smap);CHKERRQ(ierr); 2420854ce69bSBarry Smith ierr = PetscMalloc1(1+nrows,&lens);CHKERRQ(ierr); 24214dcab191SBarry Smith for (i=0; i<ncols; i++) { 24224dcab191SBarry Smith #if defined(PETSC_USE_DEBUG) 24234dcab191SBarry Smith if (icol[i] >= oldcols) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D <= A->cmap->n %D",i,icol[i],oldcols); 24244dcab191SBarry Smith #endif 24254dcab191SBarry Smith smap[icol[i]] = i+1; 24264dcab191SBarry Smith } 24274dcab191SBarry Smith 242802834360SBarry Smith /* determine lens of each row */ 242902834360SBarry Smith for (i=0; i<nrows; i++) { 2430bfeeae90SHong Zhang kstart = ai[irow[i]]; 243102834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 243202834360SBarry Smith lens[i] = 0; 243302834360SBarry Smith for (k=kstart; k<kend; k++) { 2434bfeeae90SHong Zhang if (smap[aj[k]]) { 243502834360SBarry Smith lens[i]++; 243602834360SBarry Smith } 243702834360SBarry Smith } 243802834360SBarry Smith } 243917ab2063SBarry Smith /* Create and fill new matrix */ 2440a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2441ace3abfcSBarry Smith PetscBool equal; 24420f5bd95cSBarry Smith 244399141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2444e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2445d0f46423SBarry Smith ierr = PetscMemcmp(c->ilen,lens,(*B)->rmap->n*sizeof(PetscInt),&equal);CHKERRQ(ierr); 2446f23aa3ddSBarry Smith if (!equal) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 2447d0f46423SBarry Smith ierr = PetscMemzero(c->ilen,(*B)->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 244808480c60SBarry Smith C = *B; 24493a40ed3dSBarry Smith } else { 24503bef6203SJed Brown PetscInt rbs,cbs; 2451ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2452f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 24533bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 24543bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 24553bef6203SJed Brown ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 24567adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2457ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 245808480c60SBarry Smith } 245999141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 246017ab2063SBarry Smith for (i=0; i<nrows; i++) { 246199141d43SSatish Balay row = irow[i]; 2462bfeeae90SHong Zhang kstart = ai[row]; 246399141d43SSatish Balay kend = kstart + a->ilen[row]; 2464bfeeae90SHong Zhang mat_i = c->i[i]; 246599141d43SSatish Balay mat_j = c->j + mat_i; 246699141d43SSatish Balay mat_a = c->a + mat_i; 246799141d43SSatish Balay mat_ilen = c->ilen + i; 246817ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2469bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2470ed480e8bSBarry Smith *mat_j++ = tcol - 1; 247199141d43SSatish Balay *mat_a++ = a->a[k]; 247299141d43SSatish Balay (*mat_ilen)++; 247399141d43SSatish Balay 247417ab2063SBarry Smith } 247517ab2063SBarry Smith } 247617ab2063SBarry Smith } 247702834360SBarry Smith /* Free work space */ 247802834360SBarry 
Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2479606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2480606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 2481cdc6f3adSToby Isaac /* sort */ 2482cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2483cdc6f3adSToby Isaac PetscInt ilen; 2484cdc6f3adSToby Isaac 2485cdc6f3adSToby Isaac mat_i = c->i[i]; 2486cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2487cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2488cdc6f3adSToby Isaac ilen = c->ilen[i]; 2489390e1bf2SBarry Smith ierr = PetscSortIntWithScalarArray(ilen,mat_j,mat_a);CHKERRQ(ierr); 2490cdc6f3adSToby Isaac } 249102834360SBarry Smith } 24926d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 24936d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 249417ab2063SBarry Smith 249517ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2496416022c9SBarry Smith *B = C; 24973a40ed3dSBarry Smith PetscFunctionReturn(0); 249817ab2063SBarry Smith } 249917ab2063SBarry Smith 2500fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 250182d44351SHong Zhang { 250282d44351SHong Zhang PetscErrorCode ierr; 250382d44351SHong Zhang Mat B; 250482d44351SHong Zhang 250582d44351SHong Zhang PetscFunctionBegin; 2506c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 250782d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 250882d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 250933d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,mat,mat);CHKERRQ(ierr); 251082d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 251182d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 251282d44351SHong Zhang *subMat = B; 2513c2d650bdSHong Zhang } else { 2514c2d650bdSHong Zhang ierr = 
MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2515c2d650bdSHong Zhang } 251682d44351SHong Zhang PetscFunctionReturn(0); 251782d44351SHong Zhang } 251882d44351SHong Zhang 25199a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2520a871dcd8SBarry Smith { 252163b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2522dfbe8321SBarry Smith PetscErrorCode ierr; 252363b91edcSBarry Smith Mat outA; 2524ace3abfcSBarry Smith PetscBool row_identity,col_identity; 252563b91edcSBarry Smith 25263a40ed3dSBarry Smith PetscFunctionBegin; 2527e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 25281df811f5SHong Zhang 2529b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2530b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2531a871dcd8SBarry Smith 253263b91edcSBarry Smith outA = inA; 2533d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2534f6224b95SHong Zhang ierr = PetscFree(inA->solvertype);CHKERRQ(ierr); 2535f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr); 25362205254eSKarl Rupp 2537c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 25386bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 25392205254eSKarl Rupp 2540c3122656SLisandro Dalcin a->row = row; 25412205254eSKarl Rupp 2542c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 25436bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 25442205254eSKarl Rupp 2545c3122656SLisandro Dalcin a->col = col; 254663b91edcSBarry Smith 254736db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 25486bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 25494c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 25503bb1ff40SBarry 
Smith ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr); 2551f0ec6fceSSatish Balay 255294a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2553854ce69bSBarry Smith ierr = PetscMalloc1(inA->rmap->n+1,&a->solve_work);CHKERRQ(ierr); 25543bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 255594a9d846SBarry Smith } 255663b91edcSBarry Smith 2557f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2558137fb511SHong Zhang if (row_identity && col_identity) { 2559ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2560137fb511SHong Zhang } else { 2561719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2562137fb511SHong Zhang } 25633a40ed3dSBarry Smith PetscFunctionReturn(0); 2564a871dcd8SBarry Smith } 2565a871dcd8SBarry Smith 2566f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2567f0b747eeSBarry Smith { 2568f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2569f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2570efee365bSSatish Balay PetscErrorCode ierr; 2571c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 25723a40ed3dSBarry Smith 25733a40ed3dSBarry Smith PetscFunctionBegin; 2574c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->nz,&bnz);CHKERRQ(ierr); 25758b83055fSJed Brown PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&oalpha,a->a,&one)); 2576efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 2577acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(inA);CHKERRQ(ierr); 25783a40ed3dSBarry Smith PetscFunctionReturn(0); 2579f0b747eeSBarry Smith } 2580f0b747eeSBarry Smith 2581f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 258216b64355SHong Zhang { 258316b64355SHong Zhang PetscErrorCode ierr; 258416b64355SHong Zhang PetscInt i; 
258516b64355SHong Zhang 258616b64355SHong Zhang PetscFunctionBegin; 258716b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 258816b64355SHong Zhang ierr = PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr);CHKERRQ(ierr); 258916b64355SHong Zhang 259016b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 259116b64355SHong Zhang ierr = PetscFree(submatj->sbuf2[i]);CHKERRQ(ierr); 259216b64355SHong Zhang } 259316b64355SHong Zhang ierr = PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1);CHKERRQ(ierr); 259416b64355SHong Zhang 259516b64355SHong Zhang if (submatj->rbuf1) { 259616b64355SHong Zhang ierr = PetscFree(submatj->rbuf1[0]);CHKERRQ(ierr); 259716b64355SHong Zhang ierr = PetscFree(submatj->rbuf1);CHKERRQ(ierr); 259816b64355SHong Zhang } 259916b64355SHong Zhang 260016b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 260116b64355SHong Zhang ierr = PetscFree(submatj->rbuf3[i]);CHKERRQ(ierr); 260216b64355SHong Zhang } 260316b64355SHong Zhang ierr = PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3);CHKERRQ(ierr); 260416b64355SHong Zhang ierr = PetscFree(submatj->pa);CHKERRQ(ierr); 260516b64355SHong Zhang } 260616b64355SHong Zhang 260716b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 260816b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->rmap);CHKERRQ(ierr); 260916b64355SHong Zhang if (submatj->cmap_loc) {ierr = PetscFree(submatj->cmap_loc);CHKERRQ(ierr);} 261016b64355SHong Zhang ierr = PetscFree(submatj->rmap_loc);CHKERRQ(ierr); 261116b64355SHong Zhang #else 261216b64355SHong Zhang ierr = PetscFree(submatj->rmap);CHKERRQ(ierr); 261316b64355SHong Zhang #endif 261416b64355SHong Zhang 261516b64355SHong Zhang if (!submatj->allcolumns) { 261616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 261716b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->cmap);CHKERRQ(ierr); 261816b64355SHong Zhang #else 261916b64355SHong Zhang ierr = 
PetscFree(submatj->cmap);CHKERRQ(ierr); 262016b64355SHong Zhang #endif 262116b64355SHong Zhang } 262216b64355SHong Zhang ierr = PetscFree(submatj->row2proc);CHKERRQ(ierr); 262316b64355SHong Zhang 262416b64355SHong Zhang ierr = PetscFree(submatj);CHKERRQ(ierr); 262516b64355SHong Zhang PetscFunctionReturn(0); 262616b64355SHong Zhang } 262716b64355SHong Zhang 26280fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 262916b64355SHong Zhang { 263016b64355SHong Zhang PetscErrorCode ierr; 263116b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 26325c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 263316b64355SHong Zhang 263416b64355SHong Zhang PetscFunctionBegin; 263534136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2636f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 263716b64355SHong Zhang PetscFunctionReturn(0); 263816b64355SHong Zhang } 263916b64355SHong Zhang 26402d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 26412d033e1fSHong Zhang { 26422d033e1fSHong Zhang PetscErrorCode ierr; 26432d033e1fSHong Zhang PetscInt i; 26440fb991dcSHong Zhang Mat C; 26450fb991dcSHong Zhang Mat_SeqAIJ *c; 26460fb991dcSHong Zhang Mat_SubSppt *submatj; 26472d033e1fSHong Zhang 26482d033e1fSHong Zhang PetscFunctionBegin; 26492d033e1fSHong Zhang for (i=0; i<n; i++) { 26500fb991dcSHong Zhang C = (*mat)[i]; 26510fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 26520fb991dcSHong Zhang submatj = c->submatis1; 26532d033e1fSHong Zhang if (submatj) { 2654682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 265534136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2656f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 265734136279SStefano Zampini ierr = PetscFree(C->defaultvectype);CHKERRQ(ierr); 26582d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->rmap);CHKERRQ(ierr); 26592d033e1fSHong Zhang ierr = 
PetscLayoutDestroy(&C->cmap);CHKERRQ(ierr); 26602d033e1fSHong Zhang ierr = PetscHeaderDestroy(&C);CHKERRQ(ierr); 2661682e4c99SStefano Zampini } 26622d033e1fSHong Zhang } else { 26632d033e1fSHong Zhang ierr = MatDestroy(&C);CHKERRQ(ierr); 26642d033e1fSHong Zhang } 26652d033e1fSHong Zhang } 266686e85357SHong Zhang 266763a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 266863a75b2aSHong Zhang ierr = MatDestroySubMatrices_Dummy(n,mat);CHKERRQ(ierr); 266963a75b2aSHong Zhang 26702d033e1fSHong Zhang ierr = PetscFree(*mat);CHKERRQ(ierr); 26712d033e1fSHong Zhang PetscFunctionReturn(0); 26722d033e1fSHong Zhang } 26732d033e1fSHong Zhang 26747dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2675cddf8d76SBarry Smith { 2676dfbe8321SBarry Smith PetscErrorCode ierr; 267797f1f81fSBarry Smith PetscInt i; 2678cddf8d76SBarry Smith 26793a40ed3dSBarry Smith PetscFunctionBegin; 2680cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2681df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2682cddf8d76SBarry Smith } 2683cddf8d76SBarry Smith 2684cddf8d76SBarry Smith for (i=0; i<n; i++) { 26857dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2686cddf8d76SBarry Smith } 26873a40ed3dSBarry Smith PetscFunctionReturn(0); 2688cddf8d76SBarry Smith } 2689cddf8d76SBarry Smith 269097f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 26914dcbc457SBarry Smith { 2692e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 26936849ba73SBarry Smith PetscErrorCode ierr; 26945d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 26955d0c19d7SBarry Smith const PetscInt *idx; 269697f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2697f1af5d2fSBarry Smith PetscBT table; 2698bbd702dbSSatish Balay 26993a40ed3dSBarry Smith PetscFunctionBegin; 2700d0f46423SBarry Smith m = 
A->rmap->n; 2701e4d965acSSatish Balay ai = a->i; 2702bfeeae90SHong Zhang aj = a->j; 27038a047759SSatish Balay 2704e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 270506763907SSatish Balay 2706854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&nidx);CHKERRQ(ierr); 270753b8de81SBarry Smith ierr = PetscBTCreate(m,&table);CHKERRQ(ierr); 270806763907SSatish Balay 2709e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2710b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2711e4d965acSSatish Balay isz = 0; 27126831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2713e4d965acSSatish Balay 2714e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 27154dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2716b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2717e4d965acSSatish Balay 2718dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2719e4d965acSSatish Balay for (j=0; j<n; ++j) { 27202205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 27214dcbc457SBarry Smith } 272206763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 27236bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2724e4d965acSSatish Balay 272504a348a9SBarry Smith k = 0; 272604a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 272704a348a9SBarry Smith n = isz; 272806763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2729e4d965acSSatish Balay row = nidx[k]; 2730e4d965acSSatish Balay start = ai[row]; 2731e4d965acSSatish Balay end = ai[row+1]; 273204a348a9SBarry Smith for (l = start; l<end; l++) { 2733efb16452SHong Zhang val = aj[l]; 27342205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2735e4d965acSSatish Balay } 2736e4d965acSSatish Balay } 2737e4d965acSSatish Balay } 273870b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2739e4d965acSSatish Balay } 274094bacf5dSBarry Smith ierr = PetscBTDestroy(&table);CHKERRQ(ierr); 2741606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 27423a40ed3dSBarry Smith PetscFunctionReturn(0); 27434dcbc457SBarry Smith } 274417ab2063SBarry Smith 27450513a670SBarry Smith /* -------------------------------------------------------------- */ 2746dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 27470513a670SBarry Smith { 27480513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 27496849ba73SBarry Smith PetscErrorCode ierr; 27503b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 27515d0c19d7SBarry Smith const PetscInt *row,*col; 27525d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 275356cd22aeSBarry Smith IS icolp,irowp; 27540298fd71SBarry Smith PetscInt *cwork = NULL; 27550298fd71SBarry Smith PetscScalar *vwork 
= NULL; 27560513a670SBarry Smith 27573a40ed3dSBarry Smith PetscFunctionBegin; 27584c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 275956cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 27604c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 276156cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 27620513a670SBarry Smith 27630513a670SBarry Smith /* determine lengths of permuted rows */ 2764854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&lens);CHKERRQ(ierr); 27652205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 2766ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 2767f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 276833d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 27697adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2770ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2771606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 27720513a670SBarry Smith 2773785e854fSJed Brown ierr = PetscMalloc1(n,&cnew);CHKERRQ(ierr); 27740513a670SBarry Smith for (i=0; i<m; i++) { 277532ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 27762205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 2777cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 277832ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 27790513a670SBarry Smith } 2780606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 27812205254eSKarl Rupp 27823c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 27832205254eSKarl Rupp 27840513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 27850513a670SBarry Smith ierr = 
MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 278656cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 278756cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 27886bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 27896bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 27903a40ed3dSBarry Smith PetscFunctionReturn(0); 27910513a670SBarry Smith } 27920513a670SBarry Smith 2793dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2794cb5b572fSBarry Smith { 2795dfbe8321SBarry Smith PetscErrorCode ierr; 2796cb5b572fSBarry Smith 2797cb5b572fSBarry Smith PetscFunctionBegin; 279833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 279933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2800be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2801be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2802be6bf707SBarry Smith 2803700c5bfcSBarry Smith if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 2804d0f46423SBarry Smith ierr = PetscMemcpy(b->a,a->a,(a->i[A->rmap->n])*sizeof(PetscScalar));CHKERRQ(ierr); 2805cdc753b6SBarry Smith ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr); 2806cb5b572fSBarry Smith } else { 2807cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2808cb5b572fSBarry Smith } 2809cb5b572fSBarry Smith PetscFunctionReturn(0); 2810cb5b572fSBarry Smith } 2811cb5b572fSBarry Smith 28124994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2813273d9f13SBarry Smith { 2814dfbe8321SBarry Smith PetscErrorCode ierr; 2815273d9f13SBarry Smith 2816273d9f13SBarry Smith PetscFunctionBegin; 2817ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2818273d9f13SBarry Smith PetscFunctionReturn(0); 2819273d9f13SBarry Smith } 
2820273d9f13SBarry Smith 28218c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 28226c0721eeSBarry Smith { 28236c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28246e111a19SKarl Rupp 28256c0721eeSBarry Smith PetscFunctionBegin; 28266c0721eeSBarry Smith *array = a->a; 28276c0721eeSBarry Smith PetscFunctionReturn(0); 28286c0721eeSBarry Smith } 28296c0721eeSBarry Smith 28308c778c55SBarry Smith PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 28316c0721eeSBarry Smith { 28326c0721eeSBarry Smith PetscFunctionBegin; 28336c0721eeSBarry Smith PetscFunctionReturn(0); 28346c0721eeSBarry Smith } 2835273d9f13SBarry Smith 28368229c054SShri Abhyankar /* 28378229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 28388229c054SShri Abhyankar have different nonzero structure. 28398229c054SShri Abhyankar */ 2840b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 2841ec7775f6SShri Abhyankar { 2842b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 2843ec7775f6SShri Abhyankar 2844ec7775f6SShri Abhyankar PetscFunctionBegin; 2845ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2846ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 2847b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 2848b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 2849b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 28508af7cee1SJed Brown nnz[i] = 0; 28518af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 2852b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2853b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 28548af7cee1SJed Brown nnz[i]++; 28558af7cee1SJed Brown } 28568af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2857ec7775f6SShri Abhyankar } 2858ec7775f6SShri Abhyankar 
PetscFunctionReturn(0); 2859ec7775f6SShri Abhyankar } 2860ec7775f6SShri Abhyankar 2861b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 2862b264fe52SHong Zhang { 2863b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2864b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2865b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2866b264fe52SHong Zhang PetscErrorCode ierr; 2867b264fe52SHong Zhang 2868b264fe52SHong Zhang PetscFunctionBegin; 2869b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 2870b264fe52SHong Zhang ierr = MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr); 2871b264fe52SHong Zhang PetscFunctionReturn(0); 2872b264fe52SHong Zhang } 2873b264fe52SHong Zhang 2874f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2875ac90fabeSBarry Smith { 2876dfbe8321SBarry Smith PetscErrorCode ierr; 2877ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 2878c5df96a5SBarry Smith PetscBLASInt one=1,bnz; 2879ac90fabeSBarry Smith 2880ac90fabeSBarry Smith PetscFunctionBegin; 2881c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->nz,&bnz);CHKERRQ(ierr); 2882ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 2883f4df32b1SMatthew Knepley PetscScalar alpha = a; 28848b83055fSJed Brown PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one)); 2885acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 2886a3fa217bSJose E. 
Roman ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 2887ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2888ab784542SHong Zhang ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 2889ac90fabeSBarry Smith } else { 28908229c054SShri Abhyankar Mat B; 28918229c054SShri Abhyankar PetscInt *nnz; 2892785e854fSJed Brown ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr); 2893ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr); 2894bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 28954aa94f47SShri Abhyankar ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 289633d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr); 2897176df525SBarry Smith ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr); 28988229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 2899ecd8bba6SJed Brown ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr); 2900ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 290128be2f97SBarry Smith ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 29028229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 2903ac90fabeSBarry Smith } 2904ac90fabeSBarry Smith PetscFunctionReturn(0); 2905ac90fabeSBarry Smith } 2906ac90fabeSBarry Smith 29077087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 2908354c94deSBarry Smith { 2909354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2910354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 2911354c94deSBarry Smith PetscInt i,nz; 2912354c94deSBarry Smith PetscScalar *a; 2913354c94deSBarry Smith 2914354c94deSBarry Smith PetscFunctionBegin; 2915354c94deSBarry Smith nz = aij->nz; 2916354c94deSBarry Smith a = aij->a; 29172205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 2918354c94deSBarry Smith #else 
2919354c94deSBarry Smith PetscFunctionBegin; 2920354c94deSBarry Smith #endif 2921354c94deSBarry Smith PetscFunctionReturn(0); 2922354c94deSBarry Smith } 2923354c94deSBarry Smith 2924985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2925e34fafa9SBarry Smith { 2926e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2927e34fafa9SBarry Smith PetscErrorCode ierr; 2928d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2929e34fafa9SBarry Smith PetscReal atmp; 2930985db425SBarry Smith PetscScalar *x; 2931e34fafa9SBarry Smith MatScalar *aa; 2932e34fafa9SBarry Smith 2933e34fafa9SBarry Smith PetscFunctionBegin; 2934e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2935e34fafa9SBarry Smith aa = a->a; 2936e34fafa9SBarry Smith ai = a->i; 2937e34fafa9SBarry Smith aj = a->j; 2938e34fafa9SBarry Smith 2939985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2940e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2941e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2942e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2943e34fafa9SBarry Smith for (i=0; i<m; i++) { 2944e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 29459189402eSHong Zhang x[i] = 0.0; 2946e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 2947985db425SBarry Smith atmp = PetscAbsScalar(*aa); 2948985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 2949985db425SBarry Smith aa++; aj++; 2950985db425SBarry Smith } 2951985db425SBarry Smith } 2952985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2953985db425SBarry Smith PetscFunctionReturn(0); 2954985db425SBarry Smith } 2955985db425SBarry Smith 2956985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 2957985db425SBarry Smith { 2958985db425SBarry Smith Mat_SeqAIJ *a = 
(Mat_SeqAIJ*)A->data; 2959985db425SBarry Smith PetscErrorCode ierr; 2960d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 2961985db425SBarry Smith PetscScalar *x; 2962985db425SBarry Smith MatScalar *aa; 2963985db425SBarry Smith 2964985db425SBarry Smith PetscFunctionBegin; 2965e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2966985db425SBarry Smith aa = a->a; 2967985db425SBarry Smith ai = a->i; 2968985db425SBarry Smith aj = a->j; 2969985db425SBarry Smith 2970985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 2971985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2972985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 2973e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2974985db425SBarry Smith for (i=0; i<m; i++) { 2975985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 2976d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 2977985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 2978985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 2979985db425SBarry Smith x[i] = 0.0; 2980985db425SBarry Smith if (idx) { 2981985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 2982985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 2983985db425SBarry Smith if (aj[j] > j) { 2984985db425SBarry Smith idx[i] = j; 2985985db425SBarry Smith break; 2986985db425SBarry Smith } 2987985db425SBarry Smith } 2988985db425SBarry Smith } 2989985db425SBarry Smith } 2990985db425SBarry Smith for (j=0; j<ncols; j++) { 2991985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 2992985db425SBarry Smith aa++; aj++; 2993985db425SBarry Smith } 2994985db425SBarry Smith } 2995985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2996985db425SBarry Smith 
PetscFunctionReturn(0); 2997985db425SBarry Smith } 2998985db425SBarry Smith 2999c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3000c87e5d42SMatthew Knepley { 3001c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3002c87e5d42SMatthew Knepley PetscErrorCode ierr; 3003c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3004c87e5d42SMatthew Knepley PetscReal atmp; 3005c87e5d42SMatthew Knepley PetscScalar *x; 3006c87e5d42SMatthew Knepley MatScalar *aa; 3007c87e5d42SMatthew Knepley 3008c87e5d42SMatthew Knepley PetscFunctionBegin; 3009e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3010c87e5d42SMatthew Knepley aa = a->a; 3011c87e5d42SMatthew Knepley ai = a->i; 3012c87e5d42SMatthew Knepley aj = a->j; 3013c87e5d42SMatthew Knepley 3014c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 3015c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3016c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 301760e0710aSBarry Smith if (n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %D vs. 
%D rows", A->rmap->n, n); 3018c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3019c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3020289a08f5SMatthew Knepley if (ncols) { 3021289a08f5SMatthew Knepley /* Get first nonzero */ 3022289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3023289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 30242205254eSKarl Rupp if (atmp > 1.0e-12) { 30252205254eSKarl Rupp x[i] = atmp; 30262205254eSKarl Rupp if (idx) idx[i] = aj[j]; 30272205254eSKarl Rupp break; 30282205254eSKarl Rupp } 3029289a08f5SMatthew Knepley } 303012431cb0SMatthew G Knepley if (j == ncols) {x[i] = PetscAbsScalar(*aa); if (idx) idx[i] = *aj;} 3031289a08f5SMatthew Knepley } else { 3032289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 3033289a08f5SMatthew Knepley } 3034c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 3035c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 3036289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3037c87e5d42SMatthew Knepley aa++; aj++; 3038c87e5d42SMatthew Knepley } 3039c87e5d42SMatthew Knepley } 3040c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3041c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3042c87e5d42SMatthew Knepley } 3043c87e5d42SMatthew Knepley 3044985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3045985db425SBarry Smith { 3046985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3047985db425SBarry Smith PetscErrorCode ierr; 3048d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3049d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3050985db425SBarry Smith PetscScalar *x; 3051d9ca1df4SBarry Smith const MatScalar *aa; 3052985db425SBarry Smith 3053985db425SBarry Smith PetscFunctionBegin; 3054e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3055985db425SBarry Smith aa = a->a; 3056985db425SBarry Smith ai = 
a->i; 3057985db425SBarry Smith aj = a->j; 3058985db425SBarry Smith 3059985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3060985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3061985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3062e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3063985db425SBarry Smith for (i=0; i<m; i++) { 3064985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3065d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3066985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3067985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3068985db425SBarry Smith x[i] = 0.0; 3069985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3070985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3071985db425SBarry Smith for (j=0; j<ncols; j++) { 3072985db425SBarry Smith if (aj[j] > j) { 3073985db425SBarry Smith idx[i] = j; 3074985db425SBarry Smith break; 3075985db425SBarry Smith } 3076985db425SBarry Smith } 3077985db425SBarry Smith } 3078985db425SBarry Smith } 3079985db425SBarry Smith for (j=0; j<ncols; j++) { 3080985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3081985db425SBarry Smith aa++; aj++; 3082e34fafa9SBarry Smith } 3083e34fafa9SBarry Smith } 3084e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3085e34fafa9SBarry Smith PetscFunctionReturn(0); 3086e34fafa9SBarry Smith } 3087bbead8a2SBarry Smith 3088713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3089bbead8a2SBarry Smith { 3090bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 3091bbead8a2SBarry Smith PetscErrorCode ierr; 309233d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3093bbead8a2SBarry Smith MatScalar 
*diag,work[25],*v_work; 30940da83c2eSBarry Smith const PetscReal shift = 0.0; 30951a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3096bbead8a2SBarry Smith 3097bbead8a2SBarry Smith PetscFunctionBegin; 3098a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 30994a0d0026SBarry Smith if (a->ibdiagvalid) { 31004a0d0026SBarry Smith if (values) *values = a->ibdiag; 31014a0d0026SBarry Smith PetscFunctionReturn(0); 31024a0d0026SBarry Smith } 3103bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 3104bbead8a2SBarry Smith if (!a->ibdiag) { 3105785e854fSJed Brown ierr = PetscMalloc1(bs2*mbs,&a->ibdiag);CHKERRQ(ierr); 31063bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 3107bbead8a2SBarry Smith } 3108bbead8a2SBarry Smith diag = a->ibdiag; 3109bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3110bbead8a2SBarry Smith /* factor and invert each block */ 3111bbead8a2SBarry Smith switch (bs) { 3112bbead8a2SBarry Smith case 1: 3113bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3114bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 3115ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3116ec1892c8SHong Zhang if (allowzeropivot) { 31177b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 31187b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 31197b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 31207b6c816cSBarry Smith ierr = PetscInfo3(A,"Zero pivot, row %D pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);CHKERRQ(ierr); 31217b6c816cSBarry Smith } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3122ec1892c8SHong Zhang } 3123bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 
3124bbead8a2SBarry Smith } 3125bbead8a2SBarry Smith break; 3126bbead8a2SBarry Smith case 2: 3127bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3128bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 3129bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 3130a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31317b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 313296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 3133bbead8a2SBarry Smith diag += 4; 3134bbead8a2SBarry Smith } 3135bbead8a2SBarry Smith break; 3136bbead8a2SBarry Smith case 3: 3137bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3138bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 3139bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 3140a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31417b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 314296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 3143bbead8a2SBarry Smith diag += 9; 3144bbead8a2SBarry Smith } 3145bbead8a2SBarry Smith break; 3146bbead8a2SBarry Smith case 4: 3147bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3148bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 3149bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 3150a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31517b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 315296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 3153bbead8a2SBarry Smith diag += 16; 3154bbead8a2SBarry Smith } 3155bbead8a2SBarry Smith break; 3156bbead8a2SBarry Smith case 5: 
3157bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3158bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 3159bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 3160a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 316296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 3163bbead8a2SBarry Smith diag += 25; 3164bbead8a2SBarry Smith } 3165bbead8a2SBarry Smith break; 3166bbead8a2SBarry Smith case 6: 3167bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3168bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 3169bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 3170a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31717b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 317296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 3173bbead8a2SBarry Smith diag += 36; 3174bbead8a2SBarry Smith } 3175bbead8a2SBarry Smith break; 3176bbead8a2SBarry Smith case 7: 3177bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3178bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3179bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3180a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31817b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 318296b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 3183bbead8a2SBarry Smith diag += 49; 3184bbead8a2SBarry 
Smith } 3185bbead8a2SBarry Smith break; 3186bbead8a2SBarry Smith default: 3187dcca6d9dSJed Brown ierr = PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ);CHKERRQ(ierr); 3188bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3189bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3190bbead8a2SBarry Smith IJ[j] = bs*i + j; 3191bbead8a2SBarry Smith } 3192bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 31935f8bbccaSHong Zhang ierr = PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 31947b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 319596b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr); 3196bbead8a2SBarry Smith diag += bs2; 3197bbead8a2SBarry Smith } 3198bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3199bbead8a2SBarry Smith } 3200bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3201bbead8a2SBarry Smith PetscFunctionReturn(0); 3202bbead8a2SBarry Smith } 3203bbead8a2SBarry Smith 320473a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 320573a71a0fSBarry Smith { 320673a71a0fSBarry Smith PetscErrorCode ierr; 320773a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 320873a71a0fSBarry Smith PetscScalar a; 320973a71a0fSBarry Smith PetscInt m,n,i,j,col; 321073a71a0fSBarry Smith 321173a71a0fSBarry Smith PetscFunctionBegin; 321273a71a0fSBarry Smith if (!x->assembled) { 321373a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 321473a71a0fSBarry Smith for (i=0; i<m; i++) { 321573a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 321673a71a0fSBarry Smith ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 321773a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 321873a71a0fSBarry Smith ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 321973a71a0fSBarry Smith } 322073a71a0fSBarry Smith } 3221e2ce353bSJunchao Zhang } else { 
3222e2ce353bSJunchao Zhang for (i=0; i<aij->nz; i++) {ierr = PetscRandomGetValue(rctx,aij->a+i);CHKERRQ(ierr);} 3223e2ce353bSJunchao Zhang } 322473a71a0fSBarry Smith ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 322573a71a0fSBarry Smith ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 322673a71a0fSBarry Smith PetscFunctionReturn(0); 322773a71a0fSBarry Smith } 322873a71a0fSBarry Smith 3229679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3230679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3231679944adSJunchao Zhang { 3232679944adSJunchao Zhang PetscErrorCode ierr; 3233679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3234679944adSJunchao Zhang PetscScalar a; 3235679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3236679944adSJunchao Zhang 3237679944adSJunchao Zhang PetscFunctionBegin; 3238679944adSJunchao Zhang nskip = high - low; 3239679944adSJunchao Zhang ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 3240679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3241679944adSJunchao Zhang for (i=0; i<m; i++) { 3242679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 3243679944adSJunchao Zhang ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 3244679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3245679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 3246679944adSJunchao Zhang ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 3247679944adSJunchao Zhang } 3248e2ce353bSJunchao Zhang } 3249679944adSJunchao Zhang ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3250679944adSJunchao Zhang ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3251679944adSJunchao Zhang PetscFunctionReturn(0); 3252679944adSJunchao Zhang } 3253679944adSJunchao Zhang 3254679944adSJunchao Zhang 
/* -------------------------------------------------------------------*/
/*
   Operation table for SeqAIJ matrices. The initializer is positional: the slot number of
   every fifth entry is given in the comment in front of it, and a 0 leaves that slot empty.
   Entries must never be inserted or removed without keeping all later slots aligned.
*/
static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ,
                                        MatGetRow_SeqAIJ,
                                        MatRestoreRow_SeqAIJ,
                                        MatMult_SeqAIJ,
                                /*  4*/ MatMultAdd_SeqAIJ,
                                        MatMultTranspose_SeqAIJ,
                                        MatMultTransposeAdd_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                /* 10*/ 0,
                                        MatLUFactor_SeqAIJ,
                                        0,
                                        MatSOR_SeqAIJ,
                                        MatTranspose_SeqAIJ,
                                /* 15*/ MatGetInfo_SeqAIJ,
                                        MatEqual_SeqAIJ,
                                        MatGetDiagonal_SeqAIJ,
                                        MatDiagonalScale_SeqAIJ,
                                        MatNorm_SeqAIJ,
                                /* 20*/ 0,
                                        MatAssemblyEnd_SeqAIJ,
                                        MatSetOption_SeqAIJ,
                                        MatZeroEntries_SeqAIJ,
                                /* 24*/ MatZeroRows_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                        0,
                                /* 29*/ MatSetUp_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                        0,
                                /* 34*/ MatDuplicate_SeqAIJ,
                                        0,
                                        0,
                                        MatILUFactor_SeqAIJ,
                                        0,
                                /* 39*/ MatAXPY_SeqAIJ,
                                        MatCreateSubMatrices_SeqAIJ,
                                        MatIncreaseOverlap_SeqAIJ,
                                        MatGetValues_SeqAIJ,
                                        MatCopy_SeqAIJ,
                                /* 44*/ MatGetRowMax_SeqAIJ,
                                        MatScale_SeqAIJ,
                                        MatShift_SeqAIJ,
                                        MatDiagonalSet_SeqAIJ,
                                        MatZeroRowsColumns_SeqAIJ,
                                /* 49*/ MatSetRandom_SeqAIJ,
                                        MatGetRowIJ_SeqAIJ,
                                        MatRestoreRowIJ_SeqAIJ,
                                        MatGetColumnIJ_SeqAIJ,
                                        MatRestoreColumnIJ_SeqAIJ,
                                /* 54*/ MatFDColoringCreate_SeqXAIJ,
                                        0,
                                        0,
                                        MatPermute_SeqAIJ,
                                        0,
                                /* 59*/ 0,
                                        MatDestroy_SeqAIJ,
                                        MatView_SeqAIJ,
                                        0,
                                        MatMatMatMult_SeqAIJ_SeqAIJ_SeqAIJ,
                                /* 64*/ MatMatMatMultSymbolic_SeqAIJ_SeqAIJ_SeqAIJ,
                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                /* 69*/ MatGetRowMaxAbs_SeqAIJ,
                                        MatGetRowMinAbs_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                /* 74*/ 0,
                                        MatFDColoringApply_AIJ,
                                        0,
                                        0,
                                        0,
                                /* 79*/ MatFindZeroDiagonals_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                        MatLoad_SeqAIJ,
                                /* 84*/ MatIsSymmetric_SeqAIJ,
                                        MatIsHermitian_SeqAIJ,
                                        0,
                                        0,
                                        0,
                                /* 89*/ MatMatMult_SeqAIJ_SeqAIJ,
                                        MatMatMultSymbolic_SeqAIJ_SeqAIJ,
                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
                                        MatPtAP_SeqAIJ_SeqAIJ,
                                        MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy,
                                /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
                                        MatMatTransposeMult_SeqAIJ_SeqAIJ,
                                        MatMatTransposeMultSymbolic_SeqAIJ_SeqAIJ,
                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
                                        0,
                                /* 99*/ 0,
                                        0,
                                        0,
                                        MatConjugate_SeqAIJ,
                                        0,
                                /*104*/ MatSetValuesRow_SeqAIJ,
                                        MatRealPart_SeqAIJ,
                                        MatImaginaryPart_SeqAIJ,
                                        0,
                                        0,
                                /*109*/ MatMatSolve_SeqAIJ,
                                        0,
                                        MatGetRowMin_SeqAIJ,
                                        0,
                                        MatMissingDiagonal_SeqAIJ,
                                /*114*/ 0,
                                        0,
                                        0,
                                        0,
                                        0,
                                /*119*/ 0,
                                        0,
                                        0,
                                        0,
                                        MatGetMultiProcBlock_SeqAIJ,
                                /*124*/ MatFindNonzeroRows_SeqAIJ,
                                        MatGetColumnNorms_SeqAIJ,
                                        MatInvertBlockDiagonal_SeqAIJ,
                                        MatInvertVariableBlockDiagonal_SeqAIJ,
                                        0,
                                /*129*/ 0,
                                        MatTransposeMatMult_SeqAIJ_SeqAIJ,
                                        MatTransposeMatMultSymbolic_SeqAIJ_SeqAIJ,
                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
                                        MatTransposeColoringCreate_SeqAIJ,
                                /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
                                        MatTransColoringApplyDenToSp_SeqAIJ,
                                        MatRARt_SeqAIJ_SeqAIJ,
                                        MatRARtSymbolic_SeqAIJ_SeqAIJ,
                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
                                /*139*/0,
                                        0,
                                        0,
                                        MatFDColoringSetUp_SeqXAIJ,
                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
                                /*144*/MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
                                        MatDestroySubMatrices_SeqAIJ
};

/*
   SeqAIJ implementation behind MatSeqAIJSetColumnIndices().

   Copies aij->maxnz column indices from indices into aij->j, sets aij->nz to maxnz and
   marks every row as completely filled (ilen[i] = imax[i]). indices must therefore hold
   at least aij->maxnz entries; nothing here checks that.
*/
PetscErrorCode  MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data;
  PetscInt   i,nz,n;

  PetscFunctionBegin;
  nz = aij->maxnz;
  n  = mat->rmap->n;
  for (i=0; i<nz; i++) {
    aij->j[i] = indices[i];
  }
  aij->nz = nz;
  for (i=0; i<n; i++) {
    aij->ilen[i] = aij->imax[i];
  }
  PetscFunctionReturn(0);
}

/*
 * When a sparse matrix has many zero columns, we should compact them out to save the space
 * This happens in MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
 * */
/*
   On return the column indices stored in aij->j are renumbered to 0..ec-1, where ec is the
   number of distinct columns that occur; the new numbering follows the increasing order of
   the original indices. mat->cmap is shrunk to ec columns with block size 1, and *mapping
   is created over the array that translates new column numbers back to the original ones.
   That array is handed over with PETSC_OWN_POINTER, so it must not be freed here.
*/
PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
{
  Mat_SeqAIJ         *aij = (Mat_SeqAIJ*)mat->data;
  PetscTable         gid1_lid1;
  PetscTablePosition tpos;
  PetscInt           gid,lid,i,j,ncols,ec;
  PetscInt           *garray;
  PetscErrorCode     ierr;

  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
  PetscValidPointer(mapping,2);
  /* use a table */
  ierr = PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr);
  ec = 0;
  /* first pass: number every distinct column in order of first appearance */
  for (i=0; i<mat->rmap->n; i++) {
    ncols = aij->i[i+1] - aij->i[i];
    for (j=0; j<ncols; j++) {
      PetscInt data,gid1 = aij->j[aij->i[i] + j] + 1;
      ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr);
      if (!data) {
        /* one based table */
        ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr);
      }
    }
  }
  /* form array of columns we need */
  ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr);
  ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
  while (tpos) {
    ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
    /* keys and values were stored one based, convert back */
    gid--;
    lid--;
    garray[lid] = gid;
  }
  ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */
  ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
  for (i=0; i<ec; i++) {
    ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr);
  }
  /* compact out the extra columns in B */
  for (i=0; i<mat->rmap->n; i++) {
    ncols = aij->i[i+1] - aij->i[i];
    for (j=0; j<ncols; j++) {
      PetscInt gid1 = aij->j[aij->i[i] + j] + 1;
      ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
      lid--;
      aij->j[aij->i[i] + j] = lid;
    }
  }
  mat->cmap->n = mat->cmap->N = ec;
  mat->cmap->bs = 1;

  ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr);
  ierr = PetscLayoutSetUp((mat->cmap));CHKERRQ(ierr);
  ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping);CHKERRQ(ierr);
  ierr = ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*@
    MatSeqAIJSetColumnIndices - Set the column indices for all the rows
       in the matrix.

  Input Parameters:
+  mat - the SeqAIJ matrix
-  indices - the column indices

  Level: advanced

  Notes:
    This can be called if you have precomputed the nonzero structure of the
  matrix and want to provide it to the matrix object to improve the performance
  of the MatSetValues() operation.

    You MUST have set the correct numbers of nonzeros per row in the call to
  MatCreateSeqAIJ(), and the columns indices MUST be sorted.

    MUST be called before any calls to MatSetValues();

    The indices should start with zero, not one.

@*/
PetscErrorCode  MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
  PetscValidPointer(indices,2);
  /* dispatch to the method composed on mat under the name "MatSeqAIJSetColumnIndices_C" */
  ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* ----------------------------------------------------------------------------------------*/

/*
   SeqAIJ implementation behind MatStoreValues().

   Copies the aij->i[mat->rmap->n] stored values of the matrix into aij->saved_values,
   allocating that buffer on the first call only. Requires aij->nonew to be set, i.e.
   MAT_NEW_NONZERO_LOCATIONS switched off, as the error message states.
*/
PetscErrorCode  MatStoreValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)mat->data;
  PetscErrorCode ierr;
  size_t         nz = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");

  /* allocate space for values if not already there */
  if (!aij->saved_values) {
    ierr = PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr);
    ierr = PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr);
  }

  /* copy values over */
  ierr = PetscMemcpy(aij->saved_values,aij->a,nz*sizeof(PetscScalar));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*@
    MatStoreValues - Stashes a copy of the matrix values; this allows, for
       example, reuse of the linear part of a Jacobian, while recomputing the
       nonlinear portion.

   Collective on Mat

  Input Parameters:
.  mat - the matrix (currently only AIJ matrices support this option)

  Level: advanced

  Common Usage, with SNESSolve():
$    Create Jacobian matrix
$    Set linear terms into matrix
$    Apply boundary conditions to matrix, at this time matrix must have
$      final nonzero structure (i.e. setting the nonlinear terms and applying
$      boundary conditions again will not change the nonzero structure)
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    Call SNESSetJacobian() with matrix
$    In your Jacobian routine
$      ierr = MatRetrieveValues(mat);
$      Set nonlinear terms in matrix

  Common Usage without SNESSolve(), i.e.
  when you handle nonlinear solve yourself:
$    // build linear portion of Jacobian
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    loop over nonlinear iterations
$       ierr = MatRetrieveValues(mat);
$       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
$       // call MatAssemblyBegin/End() on matrix
$       Solve linear system with Jacobian
$    endloop

  Notes:
    Matrix must already be assembled before calling this routine
    Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before
    calling this routine.

    When this is called multiple times it overwrites the previous set of stored values
    and does not allocate additional space.

.seealso: MatRetrieveValues()

@*/
PetscErrorCode  MatStoreValues(Mat mat)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
  if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix");
  if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
  /* dispatch to the method composed on mat under the name "MatStoreValues_C" */
  ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   SeqAIJ implementation behind MatRetrieveValues().

   Copies aij->i[mat->rmap->n] values from aij->saved_values back into aij->a. Fails with
   PETSC_ERR_ORDER if aij->nonew is not set or if no values have been stored yet.
*/
PetscErrorCode  MatRetrieveValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)mat->data;
  PetscErrorCode ierr;
  PetscInt       nz = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
  if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first");
  /* copy values over */
  ierr = PetscMemcpy(aij->a,aij->saved_values,nz*sizeof(PetscScalar));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*@
    MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for
       example, reuse of the linear part of a Jacobian, while recomputing the
       nonlinear portion.

   Collective on Mat

  Input Parameters:
.  mat - the matrix (currently only AIJ matrices support this option)

  Level: advanced

.seealso: MatStoreValues()

@*/
PetscErrorCode  MatRetrieveValues(Mat mat)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
  if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix");
  if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
  /* dispatch to the method composed on mat under the name "MatRetrieveValues_C" */
  ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}


/* --------------------------------------------------------------------------------*/
/*@C
   MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format
   (the default parallel PETSc format).  For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.
365017ab2063SBarry Smith 3651db81eaa0SLois Curfman McInnes Collective on MPI_Comm 3652db81eaa0SLois Curfman McInnes 365317ab2063SBarry Smith Input Parameters: 3654db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 365517ab2063SBarry Smith . m - number of rows 365617ab2063SBarry Smith . n - number of columns 365717ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 365851c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 36590298fd71SBarry Smith (possibly different for each row) or NULL 366017ab2063SBarry Smith 366117ab2063SBarry Smith Output Parameter: 3662416022c9SBarry Smith . A - the matrix 366317ab2063SBarry Smith 3664175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3665ae1d86c5SBarry Smith MatXXXXSetPreallocation() paradigm instead of this routine directly. 3666175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3667175b88e8SBarry Smith 3668b259b22eSLois Curfman McInnes Notes: 366949a6f317SBarry Smith If nnz is given then nz is ignored 367049a6f317SBarry Smith 367117ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 367217ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 36730002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 367444cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 367517ab2063SBarry Smith 367617ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 36770298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 36783d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 36796da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 
368017ab2063SBarry Smith 3681682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 36824fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3683682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 36846c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 36856c7ebb05SLois Curfman McInnes 36866c7ebb05SLois Curfman McInnes Options Database Keys: 3687698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 36889db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 368917ab2063SBarry Smith 3690027ccd11SLois Curfman McInnes Level: intermediate 3691027ccd11SLois Curfman McInnes 369269b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 369336db0b34SBarry Smith 369417ab2063SBarry Smith @*/ 36957087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 369617ab2063SBarry Smith { 3697dfbe8321SBarry Smith PetscErrorCode ierr; 36986945ee14SBarry Smith 36993a40ed3dSBarry Smith PetscFunctionBegin; 3700f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3701117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3702c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3703d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3704273d9f13SBarry Smith PetscFunctionReturn(0); 3705273d9f13SBarry Smith } 3706273d9f13SBarry Smith 3707273d9f13SBarry Smith /*@C 3708273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3709273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3710273d9f13SBarry Smith (or the array nnz). 
By setting these parameters accurately, performance 3711273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3712273d9f13SBarry Smith 3713273d9f13SBarry Smith Collective on MPI_Comm 3714273d9f13SBarry Smith 3715273d9f13SBarry Smith Input Parameters: 37161c4f3114SJed Brown + B - The matrix 3717273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3718273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 37190298fd71SBarry Smith (possibly different for each row) or NULL 3720273d9f13SBarry Smith 3721273d9f13SBarry Smith Notes: 372249a6f317SBarry Smith If nnz is given then nz is ignored 372349a6f317SBarry Smith 3724273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3725273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3726273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3727273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3728273d9f13SBarry Smith 3729273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 37300298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3731273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3732273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3733273d9f13SBarry Smith 3734aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3735aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3736aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3737aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3738aa95bbe8SBarry Smith 3739a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3740a96a251dSBarry Smith entries or columns indices 3741a96a251dSBarry Smith 3742273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3743273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3744273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3745273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3746273d9f13SBarry Smith 3747273d9f13SBarry Smith Options Database Keys: 3748698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 374947b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3750273d9f13SBarry Smith 3751273d9f13SBarry Smith Level: intermediate 3752273d9f13SBarry Smith 375369b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3754273d9f13SBarry Smith 3755273d9f13SBarry Smith @*/ 37567087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3757273d9f13SBarry Smith { 37584ac538c5SBarry Smith PetscErrorCode ierr; 3759a23d5eceSKris Buschelman 3760a23d5eceSKris Buschelman PetscFunctionBegin; 37616ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 37626ba663aaSJed Brown PetscValidType(B,1); 37634ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3764a23d5eceSKris Buschelman PetscFunctionReturn(0); 3765a23d5eceSKris Buschelman } 3766a23d5eceSKris Buschelman 37677087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3768a23d5eceSKris Buschelman { 3769273d9f13SBarry Smith Mat_SeqAIJ *b; 37702576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 
37716849ba73SBarry Smith PetscErrorCode ierr; 377297f1f81fSBarry Smith PetscInt i; 3773273d9f13SBarry Smith 3774273d9f13SBarry Smith PetscFunctionBegin; 37752576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3776a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3777c461c341SBarry Smith skipallocation = PETSC_TRUE; 3778c461c341SBarry Smith nz = 0; 3779c461c341SBarry Smith } 378026283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 378126283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3782899cda47SBarry Smith 3783435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 378460e0710aSBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz); 3785b73539f3SBarry Smith if (nnz) { 3786d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 378760e0710aSBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]); 378860e0710aSBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %D value %d rowlength %D",i,nnz[i],B->cmap->n); 3789b73539f3SBarry Smith } 3790b73539f3SBarry Smith } 3791b73539f3SBarry Smith 3792273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 37932205254eSKarl Rupp 3794273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3795273d9f13SBarry Smith 3796ab93d7beSBarry Smith if (!skipallocation) { 37972ee49352SLisandro Dalcin if (!b->imax) { 3798dcca6d9dSJed Brown ierr = PetscMalloc2(B->rmap->n,&b->imax,B->rmap->n,&b->ilen);CHKERRQ(ierr); 37993bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,2*B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 38002ee49352SLisandro Dalcin } 3801846b4da1SFande Kong if (!b->ipre) { 3802846b4da1SFande Kong ierr = PetscMalloc1(B->rmap->n,&b->ipre);CHKERRQ(ierr); 3803846b4da1SFande Kong ierr = 
PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3804846b4da1SFande Kong } 3805273d9f13SBarry Smith if (!nnz) { 3806435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3807c62bd62aSJed Brown else if (nz < 0) nz = 1; 38085d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 3809d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3810d0f46423SBarry Smith nz = nz*B->rmap->n; 3811273d9f13SBarry Smith } else { 3812273d9f13SBarry Smith nz = 0; 3813d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz += nnz[i];} 3814273d9f13SBarry Smith } 3815ab93d7beSBarry Smith /* b->ilen will count nonzeros in each row so far. */ 38162205254eSKarl Rupp for (i=0; i<B->rmap->n; i++) b->ilen[i] = 0; 3817ab93d7beSBarry Smith 3818273d9f13SBarry Smith /* allocate the matrix space */ 381953dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? */ 38202ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3821396832f4SHong Zhang if (B->structure_only) { 38225848002fSHong Zhang ierr = PetscMalloc1(nz,&b->j);CHKERRQ(ierr); 38235848002fSHong Zhang ierr = PetscMalloc1(B->rmap->n+1,&b->i);CHKERRQ(ierr); 3824396832f4SHong Zhang ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt));CHKERRQ(ierr); 3825396832f4SHong Zhang } else { 3826dcca6d9dSJed Brown ierr = PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i);CHKERRQ(ierr); 38273bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3828396832f4SHong Zhang } 3829bfeeae90SHong Zhang b->i[0] = 0; 3830d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 38315da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 38325da197adSKris Buschelman } 3833396832f4SHong Zhang if (B->structure_only) { 3834396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3835396832f4SHong Zhang 
b->free_a = PETSC_FALSE; 3836396832f4SHong Zhang } else { 3837273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3838e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3839396832f4SHong Zhang } 3840e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3841c461c341SBarry Smith } else { 3842e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3843e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3844c461c341SBarry Smith } 3845273d9f13SBarry Smith 3846846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3847846b4da1SFande Kong /* reserve user-requested sparsity */ 3848846b4da1SFande Kong ierr = PetscMemcpy(b->ipre,b->imax,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3849846b4da1SFande Kong } 3850846b4da1SFande Kong 3851846b4da1SFande Kong 3852273d9f13SBarry Smith b->nz = 0; 3853273d9f13SBarry Smith b->maxnz = nz; 3854273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 38552205254eSKarl Rupp if (realalloc) { 38562205254eSKarl Rupp ierr = MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 38572205254eSKarl Rupp } 3858cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 3859cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 3860273d9f13SBarry Smith PetscFunctionReturn(0); 3861273d9f13SBarry Smith } 3862273d9f13SBarry Smith 3863846b4da1SFande Kong 3864846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 3865846b4da1SFande Kong { 3866846b4da1SFande Kong Mat_SeqAIJ *a; 3867a5bbaf83SFande Kong PetscInt i; 3868846b4da1SFande Kong PetscErrorCode ierr; 3869846b4da1SFande Kong 3870846b4da1SFande Kong PetscFunctionBegin; 3871846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3872846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 38732c814fdeSFande Kong /* if no saved info, we error out */ 38742c814fdeSFande Kong if (!a->ipre) SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_ARG_NULL,"No saved preallocation info \n"); 38752c814fdeSFande Kong 38762c814fdeSFande Kong if (!a->i || !a->j || !a->a || !a->imax || !a->ilen) 
SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation \n"); 38772c814fdeSFande Kong 3878846b4da1SFande Kong ierr = PetscMemcpy(a->imax,a->ipre,A->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3879846b4da1SFande Kong ierr = PetscMemzero(a->ilen,A->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3880846b4da1SFande Kong a->i[0] = 0; 3881846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 3882846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 3883846b4da1SFande Kong } 3884846b4da1SFande Kong A->preallocated = PETSC_TRUE; 3885846b4da1SFande Kong a->nz = 0; 3886846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 3887846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 3888846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 3889846b4da1SFande Kong A->assembled = PETSC_FALSE; 3890846b4da1SFande Kong PetscFunctionReturn(0); 3891846b4da1SFande Kong } 3892846b4da1SFande Kong 389358d36128SBarry Smith /*@ 3894a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 3895a1661176SMatthew Knepley 3896a1661176SMatthew Knepley Input Parameters: 3897a1661176SMatthew Knepley + B - the matrix 3898a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 3899a1661176SMatthew Knepley . 
j - the column indices for each row (starts with zero) these must be sorted for each row 3900a1661176SMatthew Knepley - v - optional values in the matrix 3901a1661176SMatthew Knepley 3902a1661176SMatthew Knepley Level: developer 3903a1661176SMatthew Knepley 390458d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 390558d36128SBarry Smith 3906a1661176SMatthew Knepley .keywords: matrix, aij, compressed row, sparse, sequential 3907a1661176SMatthew Knepley 3908c1c1d628SHong Zhang .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ 3909a1661176SMatthew Knepley @*/ 3910a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 3911a1661176SMatthew Knepley { 3912a1661176SMatthew Knepley PetscErrorCode ierr; 3913a1661176SMatthew Knepley 3914a1661176SMatthew Knepley PetscFunctionBegin; 39150700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 39166ba663aaSJed Brown PetscValidType(B,1); 39174ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 3918a1661176SMatthew Knepley PetscFunctionReturn(0); 3919a1661176SMatthew Knepley } 3920a1661176SMatthew Knepley 39217087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 3922a1661176SMatthew Knepley { 3923a1661176SMatthew Knepley PetscInt i; 3924a1661176SMatthew Knepley PetscInt m,n; 3925a1661176SMatthew Knepley PetscInt nz; 3926a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 3927a1661176SMatthew Knepley PetscScalar *values; 3928a1661176SMatthew Knepley PetscErrorCode ierr; 3929a1661176SMatthew Knepley 3930a1661176SMatthew Knepley PetscFunctionBegin; 393165e19b50SBarry Smith if (Ii[0]) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 3932779a8d59SSatish Balay 3933779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 3934779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3935779a8d59SSatish Balay 3936779a8d59SSatish Balay ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 3937854ce69bSBarry Smith ierr = PetscMalloc1(m+1, &nnz);CHKERRQ(ierr); 3938a1661176SMatthew Knepley for (i = 0; i < m; i++) { 3939b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 3940a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 394165e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 3942a1661176SMatthew Knepley nnz[i] = nz; 3943a1661176SMatthew Knepley } 3944a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 3945a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 3946a1661176SMatthew Knepley 3947a1661176SMatthew Knepley if (v) { 3948a1661176SMatthew Knepley values = (PetscScalar*) v; 3949a1661176SMatthew Knepley } else { 39501795a4d1SJed Brown ierr = PetscCalloc1(nz_max, &values);CHKERRQ(ierr); 3951a1661176SMatthew Knepley } 3952a1661176SMatthew Knepley 3953a1661176SMatthew Knepley for (i = 0; i < m; i++) { 3954b7940d39SSatish Balay nz = Ii[i+1] - Ii[i]; 3955b7940d39SSatish Balay ierr = MatSetValues_SeqAIJ(B, 1, &i, nz, J+Ii[i], values + (v ? 
Ii[i] : 0), INSERT_VALUES);CHKERRQ(ierr); 3956a1661176SMatthew Knepley } 3957a1661176SMatthew Knepley 3958a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3959a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3960a1661176SMatthew Knepley 3961a1661176SMatthew Knepley if (!v) { 3962a1661176SMatthew Knepley ierr = PetscFree(values);CHKERRQ(ierr); 3963a1661176SMatthew Knepley } 39647827cd58SJed Brown ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 3965a1661176SMatthew Knepley PetscFunctionReturn(0); 3966a1661176SMatthew Knepley } 3967a1661176SMatthew Knepley 3968c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 3969af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 3970170fe5c8SBarry Smith 3971170fe5c8SBarry Smith /* 3972170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 3973170fe5c8SBarry Smith 3974170fe5c8SBarry Smith n p p 3975170fe5c8SBarry Smith ( ) ( ) ( ) 3976170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 3977170fe5c8SBarry Smith ( ) ( ) ( ) 3978170fe5c8SBarry Smith 3979170fe5c8SBarry Smith */ 3980170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 3981170fe5c8SBarry Smith { 3982170fe5c8SBarry Smith PetscErrorCode ierr; 3983170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 3984170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 3985170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 39861de00fd4SBarry Smith PetscInt i,n,m,q,p; 3987170fe5c8SBarry Smith const PetscInt *ii,*idx; 3988170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 3989170fe5c8SBarry Smith PetscScalar *c,*c_q; 3990170fe5c8SBarry Smith 3991170fe5c8SBarry Smith PetscFunctionBegin; 3992d0f46423SBarry Smith m = A->rmap->n; 3993d0f46423SBarry Smith n = A->cmap->n; 3994d0f46423SBarry Smith p = B->cmap->n; 3995170fe5c8SBarry Smith a = sub_a->v; 3996170fe5c8SBarry 
Smith b = sub_b->a; 3997170fe5c8SBarry Smith c = sub_c->v; 3998170fe5c8SBarry Smith ierr = PetscMemzero(c,m*p*sizeof(PetscScalar));CHKERRQ(ierr); 3999170fe5c8SBarry Smith 4000170fe5c8SBarry Smith ii = sub_b->i; 4001170fe5c8SBarry Smith idx = sub_b->j; 4002170fe5c8SBarry Smith for (i=0; i<n; i++) { 4003170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4004170fe5c8SBarry Smith while (q-->0) { 4005170fe5c8SBarry Smith c_q = c + m*(*idx); 4006170fe5c8SBarry Smith a_q = a + m*i; 4007854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4008170fe5c8SBarry Smith idx++; 4009170fe5c8SBarry Smith b++; 4010170fe5c8SBarry Smith } 4011170fe5c8SBarry Smith } 4012170fe5c8SBarry Smith PetscFunctionReturn(0); 4013170fe5c8SBarry Smith } 4014170fe5c8SBarry Smith 4015170fe5c8SBarry Smith PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat *C) 4016170fe5c8SBarry Smith { 4017170fe5c8SBarry Smith PetscErrorCode ierr; 4018d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 4019170fe5c8SBarry Smith Mat Cmat; 4020170fe5c8SBarry Smith 4021170fe5c8SBarry Smith PetscFunctionBegin; 402260e0710aSBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %D != B->rmap->n %D\n",A->cmap->n,B->rmap->n); 4023ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Cmat);CHKERRQ(ierr); 4024170fe5c8SBarry Smith ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 402533d57670SJed Brown ierr = MatSetBlockSizesFromMats(Cmat,A,B);CHKERRQ(ierr); 4026170fe5c8SBarry Smith ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 40270298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,NULL);CHKERRQ(ierr); 4028d73949e8SHong Zhang 4029d73949e8SHong Zhang Cmat->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 40302205254eSKarl Rupp 4031170fe5c8SBarry Smith *C = Cmat; 4032170fe5c8SBarry Smith PetscFunctionReturn(0); 4033170fe5c8SBarry Smith } 4034170fe5c8SBarry Smith 4035170fe5c8SBarry Smith /* 
----------------------------------------------------------------*/ 4036150d2497SBarry Smith PETSC_INTERN PetscErrorCode MatMatMult_SeqDense_SeqAIJ(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 4037170fe5c8SBarry Smith { 4038170fe5c8SBarry Smith PetscErrorCode ierr; 4039170fe5c8SBarry Smith 4040170fe5c8SBarry Smith PetscFunctionBegin; 4041170fe5c8SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 40423ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 4043170fe5c8SBarry Smith ierr = MatMatMultSymbolic_SeqDense_SeqAIJ(A,B,fill,C);CHKERRQ(ierr); 40443ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 4045170fe5c8SBarry Smith } 40463ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 4047170fe5c8SBarry Smith ierr = MatMatMultNumeric_SeqDense_SeqAIJ(A,B,*C);CHKERRQ(ierr); 40483ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 4049170fe5c8SBarry Smith PetscFunctionReturn(0); 4050170fe5c8SBarry Smith } 4051170fe5c8SBarry Smith 4052170fe5c8SBarry Smith 40530bad9183SKris Buschelman /*MC 4054fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 40550bad9183SKris Buschelman based on compressed sparse row format. 40560bad9183SKris Buschelman 40570bad9183SKris Buschelman Options Database Keys: 40580bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 40590bad9183SKris Buschelman 40600bad9183SKris Buschelman Level: beginner 40610bad9183SKris Buschelman 4062f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType 40630bad9183SKris Buschelman M*/ 40640bad9183SKris Buschelman 4065ccd284c7SBarry Smith /*MC 4066ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 
4067ccd284c7SBarry Smith 4068ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJ when constructed with a single process communicator, 4069ccd284c7SBarry Smith and MATMPIAIJ otherwise. As a result, for single process communicators, 4070ccd284c7SBarry Smith MatSeqAIJSetPreallocation is supported, and similarly MatMPIAIJSetPreallocation is supported 4071ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4072ccd284c7SBarry Smith the above preallocation routines for simplicity. 4073ccd284c7SBarry Smith 4074ccd284c7SBarry Smith Options Database Keys: 4075ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions() 4076ccd284c7SBarry Smith 407795452b02SPatrick Sanan Developer Notes: 4078ca9cdca7SRichard Tran Mills Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when 4079ccd284c7SBarry Smith enough exist. 4080ccd284c7SBarry Smith 4081ccd284c7SBarry Smith Level: beginner 4082ccd284c7SBarry Smith 4083ccd284c7SBarry Smith .seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ,MATMPIAIJ 4084ccd284c7SBarry Smith M*/ 4085ccd284c7SBarry Smith 4086ccd284c7SBarry Smith /*MC 4087ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4088ccd284c7SBarry Smith 4089ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4090ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4091ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4092ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4093ccd284c7SBarry Smith the above preallocation routines for simplicity. 
4094ccd284c7SBarry Smith 4095ccd284c7SBarry Smith Options Database Keys: 4096ccd284c7SBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4097ccd284c7SBarry Smith 4098ccd284c7SBarry Smith Level: beginner 4099ccd284c7SBarry Smith 4100ccd284c7SBarry Smith .seealso: MatCreateMPIAIJCRL,MATSEQAIJCRL,MATMPIAIJCRL, MATSEQAIJCRL, MATMPIAIJCRL 4101ccd284c7SBarry Smith M*/ 4102ccd284c7SBarry Smith 41037906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 41047906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 41057906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 41067906f579SHong Zhang #endif 41077906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 41087906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 41097906f579SHong Zhang PETSC_INTERN PetscErrorCode MatMatMatMult_Transpose_AIJ_AIJ(Mat,Mat,Mat,MatReuse,PetscReal,Mat*); 41107906f579SHong Zhang #endif 41117906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat,MatType,MatReuse,Mat*); 41127906f579SHong Zhang 4113d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4114c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 411575d48cdbSStefano Zampini PETSC_INTERN PetscErrorCode MatPtAP_IS_XAIJ(Mat,Mat,MatReuse,PetscReal,Mat*); 41167906f579SHong Zhang 41178c778c55SBarry Smith /*@C 41188397e458SBarry Smith MatSeqAIJGetArray - gives access to the array where the data for a MATSEQAIJ matrix is stored 41198c778c55SBarry Smith 41208c778c55SBarry Smith Not Collective 41218c778c55SBarry Smith 41228c778c55SBarry Smith Input Parameter: 4123579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 41248c778c55SBarry Smith 41258c778c55SBarry Smith Output Parameter: 41268c778c55SBarry Smith . 
array - pointer to the data 41278c778c55SBarry Smith 41288c778c55SBarry Smith Level: intermediate 41298c778c55SBarry Smith 4130774cf152SJed Brown .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90() 41318c778c55SBarry Smith @*/ 41328c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 41338c778c55SBarry Smith { 41348c778c55SBarry Smith PetscErrorCode ierr; 41358c778c55SBarry Smith 41368c778c55SBarry Smith PetscFunctionBegin; 41378c778c55SBarry Smith ierr = PetscUseMethod(A,"MatSeqAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 41388c778c55SBarry Smith PetscFunctionReturn(0); 41398c778c55SBarry Smith } 41408c778c55SBarry Smith 414121e72a00SBarry Smith /*@C 414221e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 414321e72a00SBarry Smith 414421e72a00SBarry Smith Not Collective 414521e72a00SBarry Smith 414621e72a00SBarry Smith Input Parameter: 4147579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 414821e72a00SBarry Smith 414921e72a00SBarry Smith Output Parameter: 415021e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 415121e72a00SBarry Smith 415221e72a00SBarry Smith Level: intermediate 415321e72a00SBarry Smith 415421e72a00SBarry Smith .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90() 415521e72a00SBarry Smith @*/ 415621e72a00SBarry Smith PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz) 415721e72a00SBarry Smith { 415821e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 415921e72a00SBarry Smith 416021e72a00SBarry Smith PetscFunctionBegin; 416121e72a00SBarry Smith *nz = aij->rmax; 416221e72a00SBarry Smith PetscFunctionReturn(0); 416321e72a00SBarry Smith } 416421e72a00SBarry Smith 41658c778c55SBarry Smith /*@C 4166579dbff0SBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray() 41678c778c55SBarry Smith 41688c778c55SBarry Smith Not Collective 41698c778c55SBarry Smith 41708c778c55SBarry Smith Input Parameters: 4171579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 41728c778c55SBarry Smith . 
array - pointer to the data 41738c778c55SBarry Smith 41748c778c55SBarry Smith Level: intermediate 41758c778c55SBarry Smith 4176774cf152SJed Brown .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90() 41778c778c55SBarry Smith @*/ 41788c778c55SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 41798c778c55SBarry Smith { 41808c778c55SBarry Smith PetscErrorCode ierr; 41818c778c55SBarry Smith 41828c778c55SBarry Smith PetscFunctionBegin; 41838c778c55SBarry Smith ierr = PetscUseMethod(A,"MatSeqAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 41848c778c55SBarry Smith PetscFunctionReturn(0); 41858c778c55SBarry Smith } 41868c778c55SBarry Smith 418734b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 418802fe1965SBarry Smith PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat); 418902fe1965SBarry Smith #endif 419002fe1965SBarry Smith 41918cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4192273d9f13SBarry Smith { 4193273d9f13SBarry Smith Mat_SeqAIJ *b; 4194dfbe8321SBarry Smith PetscErrorCode ierr; 419538baddfdSBarry Smith PetscMPIInt size; 4196273d9f13SBarry Smith 4197273d9f13SBarry Smith PetscFunctionBegin; 4198ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 4199e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4200273d9f13SBarry Smith 4201b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 42022205254eSKarl Rupp 4203b0a32e0cSBarry Smith B->data = (void*)b; 42042205254eSKarl Rupp 4205549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 42062205254eSKarl Rupp 4207416022c9SBarry Smith b->row = 0; 4208416022c9SBarry Smith b->col = 0; 420982bf6240SBarry Smith b->icol = 0; 4210b810aeb4SBarry Smith b->reallocs = 0; 421136db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4212f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 
4213416022c9SBarry Smith b->nonew = 0; 4214416022c9SBarry Smith b->diag = 0; 4215416022c9SBarry Smith b->solve_work = 0; 42162a1b7f2aSHong Zhang B->spptr = 0; 4217be6bf707SBarry Smith b->saved_values = 0; 4218d7f994e1SBarry Smith b->idiag = 0; 421971f1c65dSBarry Smith b->mdiag = 0; 422071f1c65dSBarry Smith b->ssor_work = 0; 422171f1c65dSBarry Smith b->omega = 1.0; 422271f1c65dSBarry Smith b->fshift = 0.0; 422371f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4224bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4225a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 422617ab2063SBarry Smith 422735d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 4228bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJGetArray_C",MatSeqAIJGetArray_SeqAIJ);CHKERRQ(ierr); 4229bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJRestoreArray_C",MatSeqAIJRestoreArray_SeqAIJ);CHKERRQ(ierr); 42308c778c55SBarry Smith 4231b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 4232bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 4233bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 4234b3866ffcSBarry Smith #endif 423517f1a0eaSHong Zhang 4236bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 4237bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 4238bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 4239bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 4240bdf89e91SBarry Smith 
ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 4241bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 42424dfdc2d9SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 42439779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 42444a2a386eSRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4245191b95cbSRichard Tran Mills #endif 424634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 424702fe1965SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE);CHKERRQ(ierr); 424802fe1965SBarry Smith #endif 4249bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 4250af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 4251af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental);CHKERRQ(ierr); 4252af8000cdSHong Zhang #endif 425363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 425463c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE);CHKERRQ(ierr); 42553dad0653Sstefano_zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMatMult_transpose_seqaij_seqaij_C",MatMatMatMult_Transpose_AIJ_AIJ);CHKERRQ(ierr); 425663c07aadSStefano Zampini #endif 4257b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense);CHKERRQ(ierr); 4258d4002b98SHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL);CHKERRQ(ierr); 4259c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS);CHKERRQ(ierr); 4260bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4261bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4262bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 4263846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ);CHKERRQ(ierr); 4264bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 4265bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 4266bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqdense_seqaij_C",MatMatMult_SeqDense_SeqAIJ);CHKERRQ(ierr); 4267bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr); 4268bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr); 426975d48cdbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_is_seqaij_C",MatPtAP_IS_XAIJ);CHKERRQ(ierr); 42704108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 427117667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 42724099cc6bSBarry Smith ierr = MatSeqAIJSetTypeFromOptions(B);CHKERRQ(ierr); /* 
this allows changing the matrix subtype to say MATSEQAIJPERM */ 42733a40ed3dSBarry Smith PetscFunctionReturn(0); 427417ab2063SBarry Smith } 427517ab2063SBarry Smith 4276b24902e0SBarry Smith /* 4277b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4278b24902e0SBarry Smith */ 4279ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 428017ab2063SBarry Smith { 4281416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 42826849ba73SBarry Smith PetscErrorCode ierr; 4283d0f46423SBarry Smith PetscInt i,m = A->rmap->n; 428417ab2063SBarry Smith 42853a40ed3dSBarry Smith PetscFunctionBegin; 4286273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 4287273d9f13SBarry Smith 4288d5f3da31SBarry Smith C->factortype = A->factortype; 4289416022c9SBarry Smith c->row = 0; 4290416022c9SBarry Smith c->col = 0; 429182bf6240SBarry Smith c->icol = 0; 42926ad4291fSHong Zhang c->reallocs = 0; 429317ab2063SBarry Smith 42946ad4291fSHong Zhang C->assembled = PETSC_TRUE; 429517ab2063SBarry Smith 4296aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 4297aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 4298eec197d1SBarry Smith 4299dcca6d9dSJed Brown ierr = PetscMalloc2(m,&c->imax,m,&c->ilen);CHKERRQ(ierr); 43003bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 430117ab2063SBarry Smith for (i=0; i<m; i++) { 4302416022c9SBarry Smith c->imax[i] = a->imax[i]; 4303416022c9SBarry Smith c->ilen[i] = a->ilen[i]; 430417ab2063SBarry Smith } 430517ab2063SBarry Smith 430617ab2063SBarry Smith /* allocate the matrix space */ 4307f77e22a1SHong Zhang if (mallocmatspace) { 4308dcca6d9dSJed Brown ierr = PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i);CHKERRQ(ierr); 43093bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, 
a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 43102205254eSKarl Rupp 4311f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 43122205254eSKarl Rupp 431397f1f81fSBarry Smith ierr = PetscMemcpy(c->i,a->i,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 431417ab2063SBarry Smith if (m > 0) { 431597f1f81fSBarry Smith ierr = PetscMemcpy(c->j,a->j,(a->i[m])*sizeof(PetscInt));CHKERRQ(ierr); 4316be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 4317bfeeae90SHong Zhang ierr = PetscMemcpy(c->a,a->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 4318be6bf707SBarry Smith } else { 4319bfeeae90SHong Zhang ierr = PetscMemzero(c->a,(a->i[m])*sizeof(PetscScalar));CHKERRQ(ierr); 432017ab2063SBarry Smith } 432108480c60SBarry Smith } 4322f77e22a1SHong Zhang } 432317ab2063SBarry Smith 43246ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4325416022c9SBarry Smith c->roworiented = a->roworiented; 4326416022c9SBarry Smith c->nonew = a->nonew; 4327416022c9SBarry Smith if (a->diag) { 4328854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&c->diag);CHKERRQ(ierr); 43293bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 433017ab2063SBarry Smith for (i=0; i<m; i++) { 4331416022c9SBarry Smith c->diag[i] = a->diag[i]; 433217ab2063SBarry Smith } 43333a40ed3dSBarry Smith } else c->diag = 0; 43342205254eSKarl Rupp 43356ad4291fSHong Zhang c->solve_work = 0; 43366ad4291fSHong Zhang c->saved_values = 0; 43376ad4291fSHong Zhang c->idiag = 0; 433871f1c65dSBarry Smith c->ssor_work = 0; 4339a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4340e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4341e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 43426ad4291fSHong Zhang 4343893ad86cSHong Zhang c->rmax = a->rmax; 4344416022c9SBarry Smith c->nz = a->nz; 43458ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4346273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 
4347754ec7b1SSatish Balay 43486ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 43496ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4350cd6b891eSBarry Smith if (a->compressedrow.use) { 43516ad4291fSHong Zhang i = a->compressedrow.nrows; 4352dcca6d9dSJed Brown ierr = PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex);CHKERRQ(ierr); 43536ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.i,a->compressedrow.i,(i+1)*sizeof(PetscInt));CHKERRQ(ierr); 43546ad4291fSHong Zhang ierr = PetscMemcpy(c->compressedrow.rindex,a->compressedrow.rindex,i*sizeof(PetscInt));CHKERRQ(ierr); 435527ea64f8SHong Zhang } else { 435627ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 43570298fd71SBarry Smith c->compressedrow.i = NULL; 43580298fd71SBarry Smith c->compressedrow.rindex = NULL; 43596ad4291fSHong Zhang } 4360ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4361e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 43624846f1f5SKris Buschelman 43632205254eSKarl Rupp ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 4364140e18c1SBarry Smith ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 43653a40ed3dSBarry Smith PetscFunctionReturn(0); 436617ab2063SBarry Smith } 436717ab2063SBarry Smith 4368b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4369b24902e0SBarry Smith { 4370b24902e0SBarry Smith PetscErrorCode ierr; 4371b24902e0SBarry Smith 4372b24902e0SBarry Smith PetscFunctionBegin; 4373ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 43744b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4375cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 437633d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 4377cfd3f464SBarry Smith } 4378a54f2f98SBarry Smith ierr = 
MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 4379f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 4380b24902e0SBarry Smith PetscFunctionReturn(0); 4381b24902e0SBarry Smith } 4382b24902e0SBarry Smith 4383112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4384fbdbba38SShri Abhyankar { 438552f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 438652f91c60SVaclav Hapla PetscErrorCode ierr; 438752f91c60SVaclav Hapla 438852f91c60SVaclav Hapla PetscFunctionBegin; 438952f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 439052f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4391c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 4392c27b3999SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 439352f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 439452f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 439552f91c60SVaclav Hapla if (isbinary) { 439652f91c60SVaclav Hapla ierr = MatLoad_SeqAIJ_Binary(newMat,viewer);CHKERRQ(ierr); 439752f91c60SVaclav Hapla } else if (ishdf5) { 439852f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 439952f91c60SVaclav Hapla ierr = MatLoad_AIJ_HDF5(newMat,viewer);CHKERRQ(ierr); 440052f91c60SVaclav Hapla #else 440152f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 440252f91c60SVaclav Hapla #endif 440352f91c60SVaclav Hapla } else { 440452f91c60SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 440552f91c60SVaclav Hapla } 440652f91c60SVaclav Hapla PetscFunctionReturn(0); 
440752f91c60SVaclav Hapla } 440852f91c60SVaclav Hapla 440952f91c60SVaclav Hapla PetscErrorCode MatLoad_SeqAIJ_Binary(Mat newMat, PetscViewer viewer) 441052f91c60SVaclav Hapla { 4411fbdbba38SShri Abhyankar Mat_SeqAIJ *a; 4412fbdbba38SShri Abhyankar PetscErrorCode ierr; 4413fbdbba38SShri Abhyankar PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N,rows,cols; 4414fbdbba38SShri Abhyankar int fd; 4415fbdbba38SShri Abhyankar PetscMPIInt size; 4416fbdbba38SShri Abhyankar MPI_Comm comm; 44173059b6faSBarry Smith PetscInt bs = newMat->rmap->bs; 4418fbdbba38SShri Abhyankar 4419fbdbba38SShri Abhyankar PetscFunctionBegin; 4420fbdbba38SShri Abhyankar ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 4421fbdbba38SShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 4422fbdbba38SShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"view must have one processor"); 4423bbead8a2SBarry Smith 44240298fd71SBarry Smith ierr = PetscOptionsBegin(comm,NULL,"Options for loading SEQAIJ matrix","Mat");CHKERRQ(ierr); 44250298fd71SBarry Smith ierr = PetscOptionsInt("-matload_block_size","Set the blocksize used to store the matrix","MatLoad",bs,&bs,NULL);CHKERRQ(ierr); 4426bbead8a2SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 44273059b6faSBarry Smith if (bs < 0) bs = 1; 44283059b6faSBarry Smith ierr = MatSetBlockSize(newMat,bs);CHKERRQ(ierr); 4429bbead8a2SBarry Smith 4430fbdbba38SShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 4431fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 4432fbdbba38SShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 4433fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 4434fbdbba38SShri Abhyankar 4435bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 
4436fbdbba38SShri Abhyankar 4437fbdbba38SShri Abhyankar /* read in row lengths */ 4438785e854fSJed Brown ierr = PetscMalloc1(M,&rowlengths);CHKERRQ(ierr); 4439fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 4440fbdbba38SShri Abhyankar 4441fbdbba38SShri Abhyankar /* check if sum of rowlengths is same as nz */ 4442fbdbba38SShri Abhyankar for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 444360e0710aSBarry Smith if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. no-nonzeros = %dD, sum-row-lengths = %D\n",nz,sum); 4444fbdbba38SShri Abhyankar 4445fbdbba38SShri Abhyankar /* set global size if not set already*/ 4446f501eaabSShri Abhyankar if (newMat->rmap->n < 0 && newMat->rmap->N < 0 && newMat->cmap->n < 0 && newMat->cmap->N < 0) { 4447fbdbba38SShri Abhyankar ierr = MatSetSizes(newMat,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 4448aabbc4fbSShri Abhyankar } else { 44499d36ed5fSBarry Smith /* if sizes and type are already set, check if the matrix global sizes are correct */ 4450fbdbba38SShri Abhyankar ierr = MatGetSize(newMat,&rows,&cols);CHKERRQ(ierr); 44514c5b953cSHong Zhang if (rows < 0 && cols < 0) { /* user might provide local size instead of global size */ 44524c5b953cSHong Zhang ierr = MatGetLocalSize(newMat,&rows,&cols);CHKERRQ(ierr); 44534c5b953cSHong Zhang } 445460e0710aSBarry Smith if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 4455aabbc4fbSShri Abhyankar } 4456fbdbba38SShri Abhyankar ierr = MatSeqAIJSetPreallocation_SeqAIJ(newMat,0,rowlengths);CHKERRQ(ierr); 4457fbdbba38SShri Abhyankar a = (Mat_SeqAIJ*)newMat->data; 4458fbdbba38SShri Abhyankar 4459fbdbba38SShri Abhyankar ierr = PetscBinaryRead(fd,a->j,nz,PETSC_INT);CHKERRQ(ierr); 4460fbdbba38SShri Abhyankar 4461fbdbba38SShri Abhyankar /* read in nonzero values */ 4462fbdbba38SShri Abhyankar ierr = 
PetscBinaryRead(fd,a->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 4463fbdbba38SShri Abhyankar 4464fbdbba38SShri Abhyankar /* set matrix "i" values */ 4465fbdbba38SShri Abhyankar a->i[0] = 0; 4466fbdbba38SShri Abhyankar for (i=1; i<= M; i++) { 4467fbdbba38SShri Abhyankar a->i[i] = a->i[i-1] + rowlengths[i-1]; 4468fbdbba38SShri Abhyankar a->ilen[i-1] = rowlengths[i-1]; 4469fbdbba38SShri Abhyankar } 4470fbdbba38SShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 4471fbdbba38SShri Abhyankar 4472fbdbba38SShri Abhyankar ierr = MatAssemblyBegin(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4473fbdbba38SShri Abhyankar ierr = MatAssemblyEnd(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4474fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4475fbdbba38SShri Abhyankar } 4476fbdbba38SShri Abhyankar 4477ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 44787264ac53SSatish Balay { 44797264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 4480dfbe8321SBarry Smith PetscErrorCode ierr; 4481eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4482eeffb40dSHong Zhang PetscInt k; 4483eeffb40dSHong Zhang #endif 44847264ac53SSatish Balay 44853a40ed3dSBarry Smith PetscFunctionBegin; 4486bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4487d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4488ca44d042SBarry Smith *flg = PETSC_FALSE; 4489ca44d042SBarry Smith PetscFunctionReturn(0); 4490bcd2baecSBarry Smith } 44917264ac53SSatish Balay 44927264ac53SSatish Balay /* if the a->i are the same */ 4493d0f46423SBarry Smith ierr = PetscMemcmp(a->i,b->i,(A->rmap->n+1)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4494abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 44957264ac53SSatish Balay 44967264ac53SSatish Balay /* if a->j are the same */ 449797f1f81fSBarry Smith ierr = PetscMemcmp(a->j,b->j,(a->nz)*sizeof(PetscInt),flg);CHKERRQ(ierr); 4498abc0a331SBarry Smith if 
(!*flg) PetscFunctionReturn(0); 4499bcd2baecSBarry Smith 4500bcd2baecSBarry Smith /* if a->a are the same */ 4501eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4502eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 4503eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])) { 4504eeffb40dSHong Zhang *flg = PETSC_FALSE; 45053a40ed3dSBarry Smith PetscFunctionReturn(0); 4506eeffb40dSHong Zhang } 4507eeffb40dSHong Zhang } 4508eeffb40dSHong Zhang #else 4509eeffb40dSHong Zhang ierr = PetscMemcmp(a->a,b->a,(a->nz)*sizeof(PetscScalar),flg);CHKERRQ(ierr); 4510eeffb40dSHong Zhang #endif 4511eeffb40dSHong Zhang PetscFunctionReturn(0); 45127264ac53SSatish Balay } 451336db0b34SBarry Smith 451405869f15SSatish Balay /*@ 451536db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 451636db0b34SBarry Smith provided by the user. 451736db0b34SBarry Smith 4518c75a6043SHong Zhang Collective on MPI_Comm 451936db0b34SBarry Smith 452036db0b34SBarry Smith Input Parameters: 452136db0b34SBarry Smith + comm - must be an MPI communicator of size 1 452236db0b34SBarry Smith . m - number of rows 452336db0b34SBarry Smith . n - number of columns 4524483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 452536db0b34SBarry Smith . j - column indices 452636db0b34SBarry Smith - a - matrix values 452736db0b34SBarry Smith 452836db0b34SBarry Smith Output Parameter: 452936db0b34SBarry Smith . 
mat - the matrix 453036db0b34SBarry Smith 453136db0b34SBarry Smith Level: intermediate 453236db0b34SBarry Smith 453336db0b34SBarry Smith Notes: 45340551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4535292fb18eSBarry Smith once the matrix is destroyed and not before 453636db0b34SBarry Smith 453736db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 453836db0b34SBarry Smith 4539bfeeae90SHong Zhang The i and j indices are 0 based 454036db0b34SBarry Smith 4541a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4542a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 45438eef79e4SBarry Smith as shown 4544a4552177SSatish Balay 45458eef79e4SBarry Smith $ 1 0 0 45468eef79e4SBarry Smith $ 2 0 3 45478eef79e4SBarry Smith $ 4 5 6 45488eef79e4SBarry Smith $ 45498eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 45508eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 45518eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 4552a4552177SSatish Balay 45539985e31cSBarry Smith 455469b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 455536db0b34SBarry Smith 455636db0b34SBarry Smith @*/ 4557c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 455836db0b34SBarry Smith { 4559dfbe8321SBarry Smith PetscErrorCode ierr; 4560cbcfb4deSHong Zhang PetscInt ii; 456136db0b34SBarry Smith Mat_SeqAIJ *aij; 4562cbcfb4deSHong Zhang #if defined(PETSC_USE_DEBUG) 4563cbcfb4deSHong Zhang PetscInt jj; 4564cbcfb4deSHong Zhang #endif 456536db0b34SBarry Smith 456636db0b34SBarry Smith PetscFunctionBegin; 456741096f02SStefano Zampini if (m > 0 && i[0]) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 4568f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4569f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4570a2f3521dSMark F. Adams /* ierr = MatSetBlockSizes(*mat,,);CHKERRQ(ierr); */ 4571ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4572ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4573ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 4574dcca6d9dSJed Brown ierr = PetscMalloc2(m,&aij->imax,m,&aij->ilen);CHKERRQ(ierr); 4575ab93d7beSBarry Smith 457636db0b34SBarry Smith aij->i = i; 457736db0b34SBarry Smith aij->j = j; 457836db0b34SBarry Smith aij->a = a; 457936db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 458036db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4581e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4582e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 458336db0b34SBarry Smith 458436db0b34SBarry Smith for (ii=0; ii<m; ii++) { 458536db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 45862515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 458760e0710aSBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %D length = %D",ii,i[ii+1] - i[ii]); 45889985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4589a061629eSStefano Zampini if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4590a061629eSStefano Zampini if (j[jj] == j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 45919985e31cSBarry Smith } 459236db0b34SBarry Smith #endif 
459336db0b34SBarry Smith } 45942515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 459536db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 459660e0710aSBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %D index = %D",ii,j[ii]); 459760e0710aSBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %D index = %D",ii,j[ii]); 459836db0b34SBarry Smith } 459936db0b34SBarry Smith #endif 460036db0b34SBarry Smith 4601b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4602b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 460336db0b34SBarry Smith PetscFunctionReturn(0); 460436db0b34SBarry Smith } 460580ef6e79SMatthew G Knepley /*@C 4606d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 46078a0b0e6bSVictor Minden provided by the user. 46088a0b0e6bSVictor Minden 46098a0b0e6bSVictor Minden Collective on MPI_Comm 46108a0b0e6bSVictor Minden 46118a0b0e6bSVictor Minden Input Parameters: 46128a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 46138a0b0e6bSVictor Minden . m - number of rows 46148a0b0e6bSVictor Minden . n - number of columns 46158a0b0e6bSVictor Minden . i - row indices 46168a0b0e6bSVictor Minden . j - column indices 46171230e6d1SVictor Minden . a - matrix values 46181230e6d1SVictor Minden . nz - number of nonzeros 46191230e6d1SVictor Minden - idx - 0 or 1 based 46208a0b0e6bSVictor Minden 46218a0b0e6bSVictor Minden Output Parameter: 46228a0b0e6bSVictor Minden . 
mat - the matrix 46238a0b0e6bSVictor Minden 46248a0b0e6bSVictor Minden Level: intermediate 46258a0b0e6bSVictor Minden 46268a0b0e6bSVictor Minden Notes: 46278a0b0e6bSVictor Minden The i and j indices are 0 based 46288a0b0e6bSVictor Minden 46298a0b0e6bSVictor Minden The format which is used for the sparse matrix input, is equivalent to a 46308a0b0e6bSVictor Minden row-major ordering.. i.e for the following matrix, the input data expected is 46318a0b0e6bSVictor Minden as shown: 46328a0b0e6bSVictor Minden 46338a0b0e6bSVictor Minden 1 0 0 46348a0b0e6bSVictor Minden 2 0 3 46358a0b0e6bSVictor Minden 4 5 6 46368a0b0e6bSVictor Minden 46378a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 46388a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 46398a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 46408a0b0e6bSVictor Minden 46418a0b0e6bSVictor Minden 464269b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 46438a0b0e6bSVictor Minden 46448a0b0e6bSVictor Minden @*/ 4645c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 46468a0b0e6bSVictor Minden { 46478a0b0e6bSVictor Minden PetscErrorCode ierr; 4648d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 46498a0b0e6bSVictor Minden 46508a0b0e6bSVictor Minden 46518a0b0e6bSVictor Minden PetscFunctionBegin; 46521795a4d1SJed Brown ierr = PetscCalloc1(m,&nnz);CHKERRQ(ierr); 46531230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 4654c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 46551230e6d1SVictor Minden } 46568a0b0e6bSVictor Minden ierr = MatCreate(comm,mat);CHKERRQ(ierr); 46578a0b0e6bSVictor Minden ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 46588a0b0e6bSVictor Minden ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 46591230e6d1SVictor Minden ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr); 46601230e6d1SVictor Minden for (ii = 0; 
ii < nz; ii++) { 46611230e6d1SVictor Minden if (idx) { 46621230e6d1SVictor Minden row = i[ii] - 1; 46631230e6d1SVictor Minden col = j[ii] - 1; 46641230e6d1SVictor Minden } else { 46651230e6d1SVictor Minden row = i[ii]; 46661230e6d1SVictor Minden col = j[ii]; 46678a0b0e6bSVictor Minden } 46681230e6d1SVictor Minden ierr = MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr); 46698a0b0e6bSVictor Minden } 46708a0b0e6bSVictor Minden ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 46718a0b0e6bSVictor Minden ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4672d021a1c5SVictor Minden ierr = PetscFree(nnz);CHKERRQ(ierr); 46738a0b0e6bSVictor Minden PetscFunctionReturn(0); 46748a0b0e6bSVictor Minden } 467536db0b34SBarry Smith 4676acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 4677acf2f550SJed Brown { 4678acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 4679acf2f550SJed Brown PetscErrorCode ierr; 4680acf2f550SJed Brown 4681acf2f550SJed Brown PetscFunctionBegin; 4682acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 4683acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 46842205254eSKarl Rupp 4685acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal_Inode(A);CHKERRQ(ierr); 4686acf2f550SJed Brown PetscFunctionReturn(0); 4687acf2f550SJed Brown } 4688acf2f550SJed Brown 46899c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 46909c8f2541SHong Zhang { 46919c8f2541SHong Zhang PetscErrorCode ierr; 46928761c3d6SHong Zhang PetscMPIInt size; 46939c8f2541SHong Zhang 46949c8f2541SHong Zhang PetscFunctionBegin; 46958761c3d6SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 46967bbdc51dSHong Zhang if (size == 1) { 46977bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 46987bbdc51dSHong Zhang ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 46997bbdc51dSHong Zhang } else { 47008761c3d6SHong Zhang ierr = 
MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 47017bbdc51dSHong Zhang } 47028761c3d6SHong Zhang } else { 47039c8f2541SHong Zhang ierr = MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 47048761c3d6SHong Zhang } 47059c8f2541SHong Zhang PetscFunctionReturn(0); 47069c8f2541SHong Zhang } 47079c8f2541SHong Zhang 470881824310SBarry Smith /* 470953dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 471053dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 471153dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 471253dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 471353dd7562SDmitry Karpeev */ 471453dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 471553dd7562SDmitry Karpeev { 471653dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 471753dd7562SDmitry Karpeev PetscErrorCode ierr; 471853dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 471953dd7562SDmitry Karpeev PetscBool seqaij; 472053dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 472153dd7562SDmitry Karpeev PetscScalar v; 472253dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 472353dd7562SDmitry Karpeev 472453dd7562SDmitry Karpeev PetscFunctionBegin; 472553dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 472653dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 47274099cc6bSBarry Smith ierr = PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij);CHKERRQ(ierr); 472853dd7562SDmitry Karpeev if (!seqaij) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 472953dd7562SDmitry Karpeev if (rowemb) { 473053dd7562SDmitry Karpeev ierr = ISGetLocalSize(rowemb,&m);CHKERRQ(ierr); 473153dd7562SDmitry Karpeev if (m != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %D is incompatible with matrix row size %D",m,B->rmap->n); 473253dd7562SDmitry Karpeev } else { 47336c4ed002SBarry Smith if (C->rmap->n != B->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 473453dd7562SDmitry Karpeev } 473553dd7562SDmitry Karpeev if (colemb) { 473653dd7562SDmitry Karpeev ierr = ISGetLocalSize(colemb,&n);CHKERRQ(ierr); 473753dd7562SDmitry Karpeev if (n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %D is incompatible with input matrix col size %D",n,B->cmap->n); 473853dd7562SDmitry Karpeev } else { 473953dd7562SDmitry Karpeev if (C->cmap->n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 474053dd7562SDmitry Karpeev } 474153dd7562SDmitry Karpeev 474253dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 474353dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 474453dd7562SDmitry Karpeev ierr = PetscMalloc1(B->rmap->n,&nz);CHKERRQ(ierr); 474553dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 474653dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 474753dd7562SDmitry Karpeev } 474853dd7562SDmitry Karpeev ierr = MatSeqAIJSetPreallocation(C,0,nz);CHKERRQ(ierr); 474953dd7562SDmitry Karpeev ierr = PetscFree(nz);CHKERRQ(ierr); 475053dd7562SDmitry Karpeev } 475153dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 475253dd7562SDmitry Karpeev ierr = MatZeroEntries(C);CHKERRQ(ierr); 475353dd7562SDmitry Karpeev } 475453dd7562SDmitry 
Karpeev count = 0; 475553dd7562SDmitry Karpeev rowindices = NULL; 475653dd7562SDmitry Karpeev colindices = NULL; 475753dd7562SDmitry Karpeev if (rowemb) { 475853dd7562SDmitry Karpeev ierr = ISGetIndices(rowemb,&rowindices);CHKERRQ(ierr); 475953dd7562SDmitry Karpeev } 476053dd7562SDmitry Karpeev if (colemb) { 476153dd7562SDmitry Karpeev ierr = ISGetIndices(colemb,&colindices);CHKERRQ(ierr); 476253dd7562SDmitry Karpeev } 476353dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 476453dd7562SDmitry Karpeev PetscInt row; 476553dd7562SDmitry Karpeev row = i; 476653dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 476753dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 476853dd7562SDmitry Karpeev PetscInt col; 476953dd7562SDmitry Karpeev col = Baij->j[count]; 477053dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 477153dd7562SDmitry Karpeev v = Baij->a[count]; 477253dd7562SDmitry Karpeev ierr = MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES);CHKERRQ(ierr); 477353dd7562SDmitry Karpeev ++count; 477453dd7562SDmitry Karpeev } 477553dd7562SDmitry Karpeev } 477653dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 477753dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 477853dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 477953dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 478053dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 478153dd7562SDmitry Karpeev PetscFunctionReturn(0); 478253dd7562SDmitry Karpeev } 478353dd7562SDmitry Karpeev 47844099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 47854099cc6bSBarry Smith 47864099cc6bSBarry Smith /*@C 47874099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 47884099cc6bSBarry Smith 47894099cc6bSBarry Smith Collective on Mat 47904099cc6bSBarry Smith 47914099cc6bSBarry Smith Input Parameters: 47924099cc6bSBarry Smith + mat - the matrix object 47934099cc6bSBarry Smith - matype - matrix type 47944099cc6bSBarry Smith 47954099cc6bSBarry Smith Options Database Key: 47964099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 47974099cc6bSBarry Smith 47984099cc6bSBarry Smith 47994099cc6bSBarry Smith Level: intermediate 48004099cc6bSBarry Smith 48014099cc6bSBarry Smith .keywords: Mat, MatType, set, method 48024099cc6bSBarry Smith 48034099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat 48044099cc6bSBarry Smith @*/ 48054099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 48064099cc6bSBarry Smith { 4807fd9d3c67SJed Brown PetscErrorCode ierr,(*r)(Mat,MatType,MatReuse,Mat*); 48084099cc6bSBarry Smith PetscBool sametype; 48094099cc6bSBarry Smith 48104099cc6bSBarry Smith PetscFunctionBegin; 48114099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 48124099cc6bSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)mat,matype,&sametype);CHKERRQ(ierr); 48134099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 48144099cc6bSBarry Smith 48154099cc6bSBarry Smith ierr = PetscFunctionListFind(MatSeqAIJList,matype,&r);CHKERRQ(ierr); 48164099cc6bSBarry Smith if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 48174099cc6bSBarry 
Smith ierr = (*r)(mat,matype,MAT_INPLACE_MATRIX,&mat);CHKERRQ(ierr); 48184099cc6bSBarry Smith PetscFunctionReturn(0); 48194099cc6bSBarry Smith } 48204099cc6bSBarry Smith 48214099cc6bSBarry Smith 48224099cc6bSBarry Smith /*@C 48234099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 48244099cc6bSBarry Smith 48254099cc6bSBarry Smith Not Collective 48264099cc6bSBarry Smith 48274099cc6bSBarry Smith Input Parameters: 48284099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 48294099cc6bSBarry Smith - function - routine to convert to subtype 48304099cc6bSBarry Smith 48314099cc6bSBarry Smith Notes: 48324099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 48334099cc6bSBarry Smith 48344099cc6bSBarry Smith 48354099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 48364099cc6bSBarry Smith $ -mat_seqaij_type my_mat 48374099cc6bSBarry Smith 48384099cc6bSBarry Smith Level: advanced 48394099cc6bSBarry Smith 48404099cc6bSBarry Smith .keywords: Mat, register 48414099cc6bSBarry Smith 48424099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll() 48434099cc6bSBarry Smith 48444099cc6bSBarry Smith 48454099cc6bSBarry Smith Level: advanced 48464099cc6bSBarry Smith @*/ 4847388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 48484099cc6bSBarry Smith { 48494099cc6bSBarry Smith PetscErrorCode ierr; 48504099cc6bSBarry Smith 48514099cc6bSBarry Smith PetscFunctionBegin; 48529cc31a68SJed Brown ierr = MatInitializePackage();CHKERRQ(ierr); 48534099cc6bSBarry Smith ierr = PetscFunctionListAdd(&MatSeqAIJList,sname,function);CHKERRQ(ierr); 48544099cc6bSBarry Smith PetscFunctionReturn(0); 48554099cc6bSBarry Smith } 48564099cc6bSBarry Smith 48574099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 48584099cc6bSBarry Smith 
48594099cc6bSBarry Smith /*@C 48604099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 48614099cc6bSBarry Smith 48624099cc6bSBarry Smith Not Collective 48634099cc6bSBarry Smith 48644099cc6bSBarry Smith Level: advanced 48654099cc6bSBarry Smith 48664099cc6bSBarry Smith Developers Note: CUSP and CUSPARSE do not yet support the MatConvert_SeqAIJ..() paradigm and thus cannot be registered here 48674099cc6bSBarry Smith 48684099cc6bSBarry Smith .keywords: KSP, register, all 48694099cc6bSBarry Smith 48704099cc6bSBarry Smith .seealso: MatRegisterAll(), MatSeqAIJRegister() 48714099cc6bSBarry Smith @*/ 48724099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 48734099cc6bSBarry Smith { 48744099cc6bSBarry Smith PetscErrorCode ierr; 48754099cc6bSBarry Smith 48764099cc6bSBarry Smith PetscFunctionBegin; 48774099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 48784099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 48794099cc6bSBarry Smith 48804099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 48814099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 48824dfdc2d9SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 48839779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48846b62b571SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4885485f9817SRichard Tran Mills #endif 48864099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 48874099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL);CHKERRQ(ierr); 48884099cc6bSBarry Smith #endif 48894099cc6bSBarry Smith PetscFunctionReturn(0); 48904099cc6bSBarry Smith } 489153dd7562SDmitry Karpeev 489253dd7562SDmitry Karpeev /* 489381824310SBarry Smith Special version for 
direct calls from Fortran 489481824310SBarry Smith */ 4895af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 489681824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 489781824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 489881824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 489981824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 490081824310SBarry Smith #endif 490181824310SBarry Smith 490281824310SBarry Smith /* Change these macros so can be used in void function */ 490381824310SBarry Smith #undef CHKERRQ 4904ce94432eSBarry Smith #define CHKERRQ(ierr) CHKERRABORT(PetscObjectComm((PetscObject)A),ierr) 490581824310SBarry Smith #undef SETERRQ2 4906e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 49074994cf47SJed Brown #undef SETERRQ3 49084994cf47SJed Brown #define SETERRQ3(comm,ierr,b,c,d,e) CHKERRABORT(comm,ierr) 490981824310SBarry Smith 49108cc058d9SJed Brown PETSC_EXTERN void PETSC_STDCALL matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 491181824310SBarry Smith { 491281824310SBarry Smith Mat A = *AA; 491381824310SBarry Smith PetscInt m = *mm, n = *nn; 491481824310SBarry Smith InsertMode is = *isis; 491581824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 491681824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 491781824310SBarry Smith PetscInt *imax,*ai,*ailen; 491881824310SBarry Smith PetscErrorCode ierr; 491981824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 492054f21887SBarry Smith MatScalar *ap,value,*aa; 4921ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 4922ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 492381824310SBarry Smith 492481824310SBarry Smith PetscFunctionBegin; 49254994cf47SJed Brown MatCheckPreallocated(A,1); 492681824310SBarry Smith imax = a->imax; 492781824310SBarry 
Smith ai = a->i; 492881824310SBarry Smith ailen = a->ilen; 492981824310SBarry Smith aj = a->j; 493081824310SBarry Smith aa = a->a; 493181824310SBarry Smith 493281824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 493381824310SBarry Smith row = im[k]; 493481824310SBarry Smith if (row < 0) continue; 493581824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4936ce94432eSBarry Smith if (row >= A->rmap->n) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 493781824310SBarry Smith #endif 493881824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 493981824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 494081824310SBarry Smith low = 0; 494181824310SBarry Smith high = nrow; 494281824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 494381824310SBarry Smith if (in[l] < 0) continue; 494481824310SBarry Smith #if defined(PETSC_USE_DEBUG) 4945ce94432eSBarry Smith if (in[l] >= A->cmap->n) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 494681824310SBarry Smith #endif 494781824310SBarry Smith col = in[l]; 49482205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 49492205254eSKarl Rupp else value = v[k + l*m]; 49502205254eSKarl Rupp 495181824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 495281824310SBarry Smith 49532205254eSKarl Rupp if (col <= lastcol) low = 0; 49542205254eSKarl Rupp else high = nrow; 495581824310SBarry Smith lastcol = col; 495681824310SBarry Smith while (high-low > 5) { 495781824310SBarry Smith t = (low+high)/2; 495881824310SBarry Smith if (rp[t] > col) high = t; 495981824310SBarry Smith else low = t; 496081824310SBarry Smith } 496181824310SBarry Smith for (i=low; i<high; i++) { 496281824310SBarry Smith if (rp[i] > col) break; 496381824310SBarry Smith if (rp[i] == col) { 496481824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 496581824310SBarry Smith else ap[i] = value; 496681824310SBarry Smith 
goto noinsert; 496781824310SBarry Smith } 496881824310SBarry Smith } 496981824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 497081824310SBarry Smith if (nonew == 1) goto noinsert; 4971ce94432eSBarry Smith if (nonew == -1) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 4972fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 497381824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 497481824310SBarry Smith /* shift up all the later entries in this row */ 497581824310SBarry Smith for (ii=N; ii>=i; ii--) { 497681824310SBarry Smith rp[ii+1] = rp[ii]; 497781824310SBarry Smith ap[ii+1] = ap[ii]; 497881824310SBarry Smith } 497981824310SBarry Smith rp[i] = col; 498081824310SBarry Smith ap[i] = value; 4981e56f5c9eSBarry Smith A->nonzerostate++; 498281824310SBarry Smith noinsert:; 498381824310SBarry Smith low = i + 1; 498481824310SBarry Smith } 498581824310SBarry Smith ailen[row] = nrow; 498681824310SBarry Smith } 498781824310SBarry Smith PetscFunctionReturnVoid(); 498881824310SBarry Smith } 4989