1b377110cSBarry Smith 2d5d45c9bSBarry Smith /* 33369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 4d5d45c9bSBarry Smith matrix storage format. 5d5d45c9bSBarry Smith */ 63369ce9aSBarry Smith 77c4f633dSBarry Smith 8c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 9c6db04a5SJed Brown #include <petscblaslapack.h> 10c6db04a5SJed Brown #include <petscbt.h> 11af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 120716a85fSBarry Smith 134099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 144099cc6bSBarry Smith { 154099cc6bSBarry Smith PetscErrorCode ierr; 164099cc6bSBarry Smith PetscBool flg; 174099cc6bSBarry Smith char type[256]; 184099cc6bSBarry Smith 194099cc6bSBarry Smith PetscFunctionBegin; 204099cc6bSBarry Smith ierr = PetscObjectOptionsBegin((PetscObject)A); 214099cc6bSBarry Smith ierr = PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg);CHKERRQ(ierr); 224099cc6bSBarry Smith if (flg) { 234099cc6bSBarry Smith ierr = MatSeqAIJSetType(A,type);CHKERRQ(ierr); 244099cc6bSBarry Smith } 254099cc6bSBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 264099cc6bSBarry Smith PetscFunctionReturn(0); 274099cc6bSBarry Smith } 284099cc6bSBarry Smith 290716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 300716a85fSBarry Smith { 310716a85fSBarry Smith PetscErrorCode ierr; 320716a85fSBarry Smith PetscInt i,m,n; 330716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 340716a85fSBarry Smith 350716a85fSBarry Smith PetscFunctionBegin; 360716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 37580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 380716a85fSBarry Smith if (type == NORM_2) { 390716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 400716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 410716a85fSBarry Smith } 
420716a85fSBarry Smith } else if (type == NORM_1) { 430716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 440716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 450716a85fSBarry Smith } 460716a85fSBarry Smith } else if (type == NORM_INFINITY) { 470716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 480716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 490716a85fSBarry Smith } 500716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 538f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 540716a85fSBarry Smith } 550716a85fSBarry Smith PetscFunctionReturn(0); 560716a85fSBarry Smith } 570716a85fSBarry Smith 583a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 593a062f41SBarry Smith { 603a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 613a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 623a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 633a062f41SBarry Smith PetscInt *rows; 643a062f41SBarry Smith PetscErrorCode ierr; 653a062f41SBarry Smith 663a062f41SBarry Smith PetscFunctionBegin; 673a062f41SBarry Smith for (i=0; i<m; i++) { 683a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 693a062f41SBarry Smith cnt++; 703a062f41SBarry Smith } 713a062f41SBarry Smith } 723a062f41SBarry Smith ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 733a062f41SBarry Smith cnt = 0; 743a062f41SBarry Smith for (i=0; i<m; i++) { 753a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 763a062f41SBarry Smith rows[cnt] = i; 773a062f41SBarry Smith cnt++; 783a062f41SBarry Smith } 793a062f41SBarry Smith } 803a062f41SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is);CHKERRQ(ierr); 
813a062f41SBarry Smith PetscFunctionReturn(0); 823a062f41SBarry Smith } 833a062f41SBarry Smith 84f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 856ce1633cSBarry Smith { 866ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 876ce1633cSBarry Smith const MatScalar *aa = a->a; 886ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 89b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 906ce1633cSBarry Smith PetscInt *rows; 916ce1633cSBarry Smith PetscErrorCode ierr; 926ce1633cSBarry Smith 936ce1633cSBarry Smith PetscFunctionBegin; 946ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 956ce1633cSBarry Smith diag = a->diag; 966ce1633cSBarry Smith for (i=0; i<m; i++) { 97b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 986ce1633cSBarry Smith cnt++; 996ce1633cSBarry Smith } 1006ce1633cSBarry Smith } 101785e854fSJed Brown ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 1026ce1633cSBarry Smith cnt = 0; 1036ce1633cSBarry Smith for (i=0; i<m; i++) { 104b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1056ce1633cSBarry Smith rows[cnt++] = i; 1066ce1633cSBarry Smith } 1076ce1633cSBarry Smith } 108f1f41ecbSJed Brown *nrows = cnt; 109f1f41ecbSJed Brown *zrows = rows; 110f1f41ecbSJed Brown PetscFunctionReturn(0); 111f1f41ecbSJed Brown } 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 114f1f41ecbSJed Brown { 115f1f41ecbSJed Brown PetscInt nrows,*rows; 116f1f41ecbSJed Brown PetscErrorCode ierr; 117f1f41ecbSJed Brown 118f1f41ecbSJed Brown PetscFunctionBegin; 1190298fd71SBarry Smith *zrows = NULL; 120f1f41ecbSJed Brown ierr = MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows);CHKERRQ(ierr); 121ce94432eSBarry Smith ierr = ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 
1226ce1633cSBarry Smith PetscFunctionReturn(0); 1236ce1633cSBarry Smith } 1246ce1633cSBarry Smith 125b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 126b3a44c85SBarry Smith { 127b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 128b3a44c85SBarry Smith const MatScalar *aa; 129b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 130b3a44c85SBarry Smith const PetscInt *ii; 131b3a44c85SBarry Smith PetscInt n,i,j,*rows; 132b3a44c85SBarry Smith PetscErrorCode ierr; 133b3a44c85SBarry Smith 134b3a44c85SBarry Smith PetscFunctionBegin; 135b3a44c85SBarry Smith *keptrows = 0; 136b3a44c85SBarry Smith ii = a->i; 137b3a44c85SBarry Smith for (i=0; i<m; i++) { 138b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 139b3a44c85SBarry Smith if (!n) { 140b3a44c85SBarry Smith cnt++; 141b3a44c85SBarry Smith goto ok1; 142b3a44c85SBarry Smith } 143b3a44c85SBarry Smith aa = a->a + ii[i]; 144b3a44c85SBarry Smith for (j=0; j<n; j++) { 145b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 146b3a44c85SBarry Smith } 147b3a44c85SBarry Smith cnt++; 148b3a44c85SBarry Smith ok1:; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 151854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n-cnt,&rows);CHKERRQ(ierr); 152b3a44c85SBarry Smith cnt = 0; 153b3a44c85SBarry Smith for (i=0; i<m; i++) { 154b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 155b3a44c85SBarry Smith if (!n) continue; 156b3a44c85SBarry Smith aa = a->a + ii[i]; 157b3a44c85SBarry Smith for (j=0; j<n; j++) { 158b3a44c85SBarry Smith if (aa[j] != 0.0) { 159b3a44c85SBarry Smith rows[cnt++] = i; 160b3a44c85SBarry Smith break; 161b3a44c85SBarry Smith } 162b3a44c85SBarry Smith } 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 165b3a44c85SBarry Smith PetscFunctionReturn(0); 166b3a44c85SBarry Smith } 167b3a44c85SBarry Smith 1687087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec 
D,InsertMode is) 16979299369SBarry Smith { 17079299369SBarry Smith PetscErrorCode ierr; 17179299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17299e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17399e65526SBarry Smith const PetscInt *diag; 17454f21887SBarry Smith MatScalar *aa = aij->a; 17599e65526SBarry Smith const PetscScalar *v; 176ace3abfcSBarry Smith PetscBool missing; 17779299369SBarry Smith 17879299369SBarry Smith PetscFunctionBegin; 17909f38230SBarry Smith if (Y->assembled) { 1800298fd71SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,NULL);CHKERRQ(ierr); 18109f38230SBarry Smith if (!missing) { 18279299369SBarry Smith diag = aij->diag; 18399e65526SBarry Smith ierr = VecGetArrayRead(D,&v);CHKERRQ(ierr); 18479299369SBarry Smith if (is == INSERT_VALUES) { 18579299369SBarry Smith for (i=0; i<m; i++) { 18679299369SBarry Smith aa[diag[i]] = v[i]; 18779299369SBarry Smith } 18879299369SBarry Smith } else { 18979299369SBarry Smith for (i=0; i<m; i++) { 19079299369SBarry Smith aa[diag[i]] += v[i]; 19179299369SBarry Smith } 19279299369SBarry Smith } 19399e65526SBarry Smith ierr = VecRestoreArrayRead(D,&v);CHKERRQ(ierr); 19479299369SBarry Smith PetscFunctionReturn(0); 19579299369SBarry Smith } 196acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 19709f38230SBarry Smith } 19809f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 19909f38230SBarry Smith PetscFunctionReturn(0); 20009f38230SBarry Smith } 20179299369SBarry Smith 2021a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 20317ab2063SBarry Smith { 204416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 205dfbe8321SBarry Smith PetscErrorCode ierr; 20697f1f81fSBarry Smith PetscInt i,ishift; 20717ab2063SBarry Smith 2083a40ed3dSBarry Smith PetscFunctionBegin; 209d0f46423SBarry Smith *m = A->rmap->n; 
2103a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 211bfeeae90SHong Zhang ishift = 0; 21253e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2132462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 214bfeeae90SHong Zhang } else if (oshift == 1) { 2151a83f524SJed Brown PetscInt *tia; 216d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2173b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 218854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n+1,&tia);CHKERRQ(ierr); 2191a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2201a83f524SJed Brown *ia = tia; 221ecc77c7aSBarry Smith if (ja) { 2221a83f524SJed Brown PetscInt *tja; 223854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&tja);CHKERRQ(ierr); 2241a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2251a83f524SJed Brown *ja = tja; 226ecc77c7aSBarry Smith } 2276945ee14SBarry Smith } else { 228ecc77c7aSBarry Smith *ia = a->i; 229ecc77c7aSBarry Smith if (ja) *ja = a->j; 230a2ce50c7SBarry Smith } 2313a40ed3dSBarry Smith PetscFunctionReturn(0); 232a2744918SBarry Smith } 233a2744918SBarry Smith 2341a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2356945ee14SBarry Smith { 236dfbe8321SBarry Smith PetscErrorCode ierr; 2376945ee14SBarry Smith 2383a40ed3dSBarry Smith PetscFunctionBegin; 2393a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 240bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 241606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 242ecc77c7aSBarry Smith if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 243bcd2baecSBarry Smith } 2443a40ed3dSBarry Smith PetscFunctionReturn(0); 24517ab2063SBarry Smith } 24617ab2063SBarry Smith 2471a83f524SJed Brown PetscErrorCode 
MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2483b2fbd54SBarry Smith { 2493b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 250dfbe8321SBarry Smith PetscErrorCode ierr; 251d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25297f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2533b2fbd54SBarry Smith 2543a40ed3dSBarry Smith PetscFunctionBegin; 255899cda47SBarry Smith *nn = n; 2563a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2573b2fbd54SBarry Smith if (symmetric) { 2582462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 2593b2fbd54SBarry Smith } else { 260b9e7e5c1SBarry Smith ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr); 261854ce69bSBarry Smith ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr); 262b9e7e5c1SBarry Smith ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr); 2633b2fbd54SBarry Smith jj = a->j; 2643b2fbd54SBarry Smith for (i=0; i<nz; i++) { 265bfeeae90SHong Zhang collengths[jj[i]]++; 2663b2fbd54SBarry Smith } 2673b2fbd54SBarry Smith cia[0] = oshift; 2683b2fbd54SBarry Smith for (i=0; i<n; i++) { 2693b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2703b2fbd54SBarry Smith } 271580bdb30SBarry Smith ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr); 2723b2fbd54SBarry Smith jj = a->j; 273a93ec695SBarry Smith for (row=0; row<m; row++) { 274a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 275a93ec695SBarry Smith for (i=0; i<mr; i++) { 276bfeeae90SHong Zhang col = *jj++; 2772205254eSKarl Rupp 2783b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2793b2fbd54SBarry Smith } 2803b2fbd54SBarry Smith } 281606d414cSSatish Balay ierr = PetscFree(collengths);CHKERRQ(ierr); 2823b2fbd54SBarry Smith *ia = cia; *ja = cja; 2833b2fbd54SBarry Smith } 2843a40ed3dSBarry Smith 
PetscFunctionReturn(0); 2853b2fbd54SBarry Smith } 2863b2fbd54SBarry Smith 2871a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2883b2fbd54SBarry Smith { 289dfbe8321SBarry Smith PetscErrorCode ierr; 290606d414cSSatish Balay 2913a40ed3dSBarry Smith PetscFunctionBegin; 2923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2933b2fbd54SBarry Smith 294606d414cSSatish Balay ierr = PetscFree(*ia);CHKERRQ(ierr); 295606d414cSSatish Balay ierr = PetscFree(*ja);CHKERRQ(ierr); 2963a40ed3dSBarry Smith PetscFunctionReturn(0); 2973b2fbd54SBarry Smith } 2983b2fbd54SBarry Smith 2997cee066cSHong Zhang /* 3007cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 302040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3037cee066cSHong Zhang */ 3047cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3057cee066cSHong Zhang { 3067cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3077cee066cSHong Zhang PetscErrorCode ierr; 3087cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 309071fcb05SBarry Smith PetscInt nz = a->i[m],row,mr,col,tmp; 3107cee066cSHong Zhang PetscInt *cspidx; 311071fcb05SBarry Smith const PetscInt *jj; 3127cee066cSHong Zhang 3137cee066cSHong Zhang PetscFunctionBegin; 3147cee066cSHong Zhang *nn = n; 3157cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 316625f6d37SHong Zhang 317b9e7e5c1SBarry Smith ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr); 318854ce69bSBarry Smith ierr = 
PetscMalloc1(n+1,&cia);CHKERRQ(ierr); 319b9e7e5c1SBarry Smith ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr); 320b9e7e5c1SBarry Smith ierr = PetscMalloc1(nz,&cspidx);CHKERRQ(ierr); 3217cee066cSHong Zhang jj = a->j; 3227cee066cSHong Zhang for (i=0; i<nz; i++) { 3237cee066cSHong Zhang collengths[jj[i]]++; 3247cee066cSHong Zhang } 3257cee066cSHong Zhang cia[0] = oshift; 3267cee066cSHong Zhang for (i=0; i<n; i++) { 3277cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3287cee066cSHong Zhang } 329580bdb30SBarry Smith ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr); 3307cee066cSHong Zhang jj = a->j; 3317cee066cSHong Zhang for (row=0; row<m; row++) { 3327cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3337cee066cSHong Zhang for (i=0; i<mr; i++) { 3347cee066cSHong Zhang col = *jj++; 335071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 336071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 337071fcb05SBarry Smith cja[tmp] = row + oshift; 3387cee066cSHong Zhang } 3397cee066cSHong Zhang } 3407cee066cSHong Zhang ierr = PetscFree(collengths);CHKERRQ(ierr); 341071fcb05SBarry Smith *ia = cia; 342071fcb05SBarry Smith *ja = cja; 3437cee066cSHong Zhang *spidx = cspidx; 3447cee066cSHong Zhang PetscFunctionReturn(0); 3457cee066cSHong Zhang } 3467cee066cSHong Zhang 3477cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3487cee066cSHong Zhang { 3497cee066cSHong Zhang PetscErrorCode ierr; 3507cee066cSHong Zhang 3517cee066cSHong Zhang PetscFunctionBegin; 3525243ef75SHong Zhang ierr = MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done);CHKERRQ(ierr); 3537cee066cSHong Zhang ierr = PetscFree(*spidx);CHKERRQ(ierr); 3547cee066cSHong Zhang PetscFunctionReturn(0); 3557cee066cSHong Zhang } 3567cee066cSHong Zhang 35787d4246cSBarry Smith PetscErrorCode 
MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[])
{
  /*
     Overwrites the stored values of one row with v[].
     Exactly ai[row+1]-ai[row] values are copied, so v must supply that many.
     The nonzero pattern is not touched.
  */
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscInt       *ai = a->i;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = PetscArraycpy(a->a+ai[row],v,ai[row+1]-ai[row]);CHKERRQ(ierr);
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  /* a nonempty row was rewritten: mark the host copy as the current one */
  if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED && ai[row+1]-ai[row]) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}

/*
    MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions

      -   a single row of values is set with each call
      -   no row or column indices are negative or (in error) larger than the number of rows or columns
      -   the values are always added to the matrix, not set
      -   no new locations are introduced in the nonzero structure of the matrix

     This does NOT assume the global column indices are sorted

     Notes on the code below: only im[0] is read; m and is are not consulted except
     for m in the GPU-flag test. Indices are translated through the row and column
     mappings of A, which are dereferenced without a NULL check. A column that is
     not found in the row is skipped silently.
*/

#include <petsc/private/isimpl.h>
PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscInt       low,high,t,row,nrow,i,col,l;
  const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j;
  PetscInt       lastcol = -1;
  MatScalar      *ap,value,*aa = a->a;
  const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices;

  row  = ridx[im[0]];
  rp   = aj + ai[row];
  ap   = aa + ai[row];
  nrow = ailen[row];
  low  = 0;
  high = nrow;
  for (l=0; l<n; l++) { /* loop over added columns */
    col   = cidx[in[l]];
    value = v[l];

    /* keep the lower bound from the previous hit only while columns keep increasing */
    if (col <= lastcol) low = 0;
    else high = nrow;
    lastcol = col;
    /* bisect down to a window of at most 5 entries, then scan it linearly */
    while (high-low > 5) {
      t = (low+high)/2;
      if (rp[t] > col) high = t;
      else low = t;
    }
    for (i=low; i<high; i++) {
      if (rp[i] == col) {
        ap[i] += value;
        low = i + 1;
        break;
      }
    }
  }
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED && m*n) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU;
#endif
  return 0;
}

/*
   MatSetValues_SeqAIJ - Inserts or adds an m by n block of values.

   Input Parameters:
+  A  - the matrix
.  m  - number of rows, im[] their indices; negative row indices are skipped
.  n  - number of columns, in[] their indices; negative column indices are skipped
.  v  - the values, read as v[l + k*n] when a->roworiented is set and as v[k + l*m]
        otherwise; when v is NULL the value used is 0.0
-  is - ADD_VALUES adds to an existing entry, any other mode overwrites it

   Range checks on the upper bound of the indices are compiled only with PETSC_USE_DEBUG.

   A column that is not yet stored in the row is inserted unless
.    the value is 0.0, a->ignorezeroentries is set and the entry is off-diagonal, or
.    a->nonew is 1 (dropped silently) or -1 (error).
   When A->structure_only is set only the index arrays are maintained.

   NOTE(review): the local ii is not referenced in the visible code; presumably the
   MatSeqXAIJReallocateAIJ macros expect it (and ierr) in the enclosing scope -
   confirm in aij.h before renaming or removing locals.
*/
PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscInt       *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N;
  PetscInt       *imax = a->imax,*ai = a->i,*ailen = a->ilen;
  PetscErrorCode ierr;
  PetscInt       *aj = a->j,nonew = a->nonew,lastcol = -1;
  MatScalar      *ap=NULL,value=0.0,*aa = a->a;
  PetscBool      ignorezeroentries = a->ignorezeroentries;
  PetscBool      roworiented       = a->roworiented;
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  PetscBool      inserted          = PETSC_FALSE;
#endif

  PetscFunctionBegin;
  for (k=0; k<m; k++) { /* loop over added rows */
    row = im[k];
    if (row < 0) continue;
#if defined(PETSC_USE_DEBUG)
    if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1);
#endif
    rp   = aj + ai[row];
    if (!A->structure_only) ap = aa + ai[row];
    rmax = imax[row]; nrow = ailen[row];
    low  = 0;
    high = nrow;
    for (l=0; l<n; l++) { /* loop over added columns */
      if (in[l] < 0) continue;
#if defined(PETSC_USE_DEBUG)
      if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1);
#endif
      col = in[l];
      if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m];
      if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;

      /* keep the lower bound from the previous column only while columns keep increasing */
      if (col <= lastcol) low = 0;
      else high = nrow;
      lastcol = col;
      /* bisect down to a window of at most 5 entries, then scan it linearly */
      while (high-low > 5) {
        t = (low+high)/2;
        if (rp[t] > col) high = t;
        else low = t;
      }
      for (i=low; i<high; i++) {
        if (rp[i] > col) break;
        if (rp[i] == col) {
          if (!A->structure_only) {
            if (is == ADD_VALUES) {
              ap[i] += value;
              (void)PetscLogFlops(1.0);
            }
            else ap[i] = value;
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
            inserted = PETSC_TRUE;
#endif
          }
          low = i + 1;
          goto noinsert;
        }
      }
      /* not found: i is now the position at which the new column has to be inserted */
      if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
      if (nonew == 1) goto noinsert;
      if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col);
      if (A->structure_only) {
        MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar);
      } else {
        MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar);
      }
      N = nrow++ - 1; a->nz++; high++;
      /* shift up all the later entries in this row */
      ierr  = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr);
      rp[i] = col;
      if (!A->structure_only){
        ierr  = PetscArraymove(ap+i+1,ap+i,N-i+1);CHKERRQ(ierr);
        ap[i] = value;
      }
      low = i + 1;
      A->nonzerostate++;
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
      inserted = PETSC_TRUE;
#endif
noinsert:;
    }
    /* record the (possibly grown) number of entries used in this row */
    ailen[row] = nrow;
  }
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED && inserted) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}

/*
   MatSetValues_SeqAIJ_SortedFull - Variant of MatSetValues_SeqAIJ() that writes whole rows
   without searching.

   For every row im[k] the n column indices in[] are copied to the start of the row
   (only while A has not been assembled before) and n values are copied from v, which
   is then advanced by n; a NULL v zeroes the n values instead. The row length is set
   to n and a->nz is increased by n. No index is validated and is is not consulted.

   NOTE(review): judging by the name, in[] is expected to be sorted and to describe
   the complete row - confirm against the callers.
*/
PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscInt       *rp,k,row;
  PetscInt       *ai = a->i,*ailen = a->ilen;
  PetscErrorCode ierr;
  PetscInt       *aj = a->j;
  MatScalar      *aa = a->a,*ap;

  PetscFunctionBegin;
  for (k=0; k<m; k++) { /* loop over added rows */
    row  = im[k];
    rp   = aj + ai[row];
    ap   = aa + ai[row];
    if (!A->was_assembled) {
      ierr = PetscMemcpy(rp,in,n*sizeof(PetscInt));CHKERRQ(ierr);
    }
    if (!A->structure_only) {
      if (v) {
        ierr = PetscMemcpy(ap,v,n*sizeof(PetscScalar));CHKERRQ(ierr);
        v   += n;
      } else {
        ierr = PetscMemzero(ap,n*sizeof(PetscScalar));CHKERRQ(ierr);
      }
    }
    ailen[row] = n;
    a->nz      += n;
  }
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED && m*n) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}


/*
   MatGetValues_SeqAIJ - Reads an m by n block of values into v, row by row.

   Entries that are not stored are returned as 0.0. For a negative row index the n
   output slots of that row are skipped (left untouched); for a negative column
   index one slot is skipped. An index at or beyond the matrix dimension raises
   PETSC_ERR_ARG_OUTOFRANGE.
*/
PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[])
{
  Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
  PetscInt   *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j;
  PetscInt   *ai = a->i,*ailen = a->ilen;
  MatScalar  *ap,*aa = a->a;

  PetscFunctionBegin;
  for (k=0; k<m; k++) { /* loop over rows */
    row = im[k];
    if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */
    if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1);
    rp   = aj + ai[row]; ap = aa + ai[row];
    nrow = ailen[row];
    for (l=0; l<n; l++) { /* loop over columns */
      if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */
      if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1);
      col  = in[l];
      high = nrow; low = 0; /* assume unsorted */
      /* bisect down to a window of at most 5 entries, then scan it linearly */
      while (high-low > 5) {
        t = (low+high)/2;
        if (rp[t] > col) high = t;
        else low = t;
      }
      for (i=low; i<high; i++) {
        if (rp[i] > col) break;
        if (rp[i] == col) {
          *v++ = ap[i];
          goto finished;
        }
      }
      *v++ = 0.0;
finished:;
    }
  }
  PetscFunctionReturn(0);
}


/*
   MatView_SeqAIJ_Binary - Writes A through the file descriptor of a binary viewer.

   Written in this order: a header {MAT_FILE_CLASSID, rows, columns, a->nz} followed
   by the length of every row (one PetscBinaryWrite), the column indices a->j, and
   the values a->a. When the viewer provides an info file, a -matload_block_size
   line with the absolute value of the row block size is appended to it.
*/
PetscErrorCode MatView_SeqAIJ_Binary(Mat A,PetscViewer viewer)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       i,*col_lens;
  int            fd;
  FILE           *file;

  PetscFunctionBegin;
  ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr);
  /* despite its name col_lens holds the 4 header words followed by the row lengths */
  ierr = PetscMalloc1(4+A->rmap->n,&col_lens);CHKERRQ(ierr);

  col_lens[0] = MAT_FILE_CLASSID;
  col_lens[1] = A->rmap->n;
  col_lens[2] = A->cmap->n;
  col_lens[3] = a->nz;

  /* store lengths of each row and write (including header) to file */
  for (i=0; i<A->rmap->n; i++) {
    col_lens[4+i] = a->i[i+1] - a->i[i];
  }
  ierr = PetscBinaryWrite(fd,col_lens,4+A->rmap->n,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr);
  ierr = PetscFree(col_lens);CHKERRQ(ierr);

  /* store column indices (zero start index) */
  ierr = PetscBinaryWrite(fd,a->j,a->nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr);

  /* store nonzero values */
  ierr = PetscBinaryWrite(fd,a->a,a->nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr);

  ierr = PetscViewerBinaryGetInfoPointer(viewer,&file);CHKERRQ(ierr);
  if (file) {
    /* the return value of fprintf() is not checked */
    fprintf(file,"-matload_block_size %d\n",(int)PetscAbs(A->rmap->bs));
  }
  PetscFunctionReturn(0);
}

/*
   MatView_SeqAIJ_ASCII_structonly - Prints the nonzero pattern only: one line per row
   listing the stored column indices. Tab handling of the viewer is switched off for
   the duration of the output and switched on again afterwards.
*/
static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer)
{
  PetscErrorCode ierr;
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscInt       i,k,m=A->rmap->N;

  PetscFunctionBegin;
  ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
  for (i=0; i<m; i++) {
    ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr);
    for (k=a->i[i]; k<a->i[i+1]; k++) {
      ierr = PetscViewerASCIIPrintf(viewer," (%D) ",a->j[k]);CHKERRQ(ierr);
    }
    ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
  }
  ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer);

/* The definition below continues beyond this part of the file; only its visible head is annotated. */
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer)
{
  Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode    ierr;
  PetscInt          i,j,m = A->rmap->n;
  const char        *name;
  PetscViewerFormat format;

  PetscFunctionBegin;
  /* pattern-only matrices are printed by the dedicated routine */
  if (A->structure_only) {
    ierr = MatView_SeqAIJ_ASCII_structonly(A,viewer);CHKERRQ(ierr);
    PetscFunctionReturn(0);
  }

  ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
  if (format == PETSC_VIEWER_ASCII_MATLAB) {
    PetscInt nofinalvalue = 0;
    /* true when the last row is empty or the last stored entry is not in the last column */
    if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) {
      /* Need a dummy value to ensure the dimension of the matrix. */
      nofinalvalue = 1;
    }
    ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
    ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr);
    ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr);
#if defined(PETSC_USE_COMPLEX)
    ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,4);\n",a->nz+nofinalvalue);CHKERRQ(ierr);
#else
    ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr);
#endif
    ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr);

    /* one line per stored entry, with one-based row and column numbers */
    for (i=0; i<m; i++) {
      for (j=a->i[i]; j<a->i[i+1]; j++) {
#if defined(PETSC_USE_COMPLEX)
        ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
#else
        ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+1,(double)a->a[j]);CHKERRQ(ierr);
#endif
      }
    }
    if (nofinalvalue) {
#if defined(PETSC_USE_COMPLEX)
      ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",m,A->cmap->n,0.,0.);CHKERRQ(ierr);
691c337ccceSJed Brown #else 692d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 693c337ccceSJed Brown #endif 694d00d2cf4SBarry Smith } 695317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 696fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 697d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 69868369a75SKris Buschelman } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO) { 699cd155464SBarry Smith PetscFunctionReturn(0); 700fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 701d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 70244cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 70377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 70460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 705aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 70636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 70760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 70836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 70960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 71036db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 71160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 7126831982aSBarry Smith } 71344cd7ae7SLois Curfman McInnes #else 71460e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) 
",a->j[j],(double)a->a[j]);CHKERRQ(ierr);} 71544cd7ae7SLois Curfman McInnes #endif 71644cd7ae7SLois Curfman McInnes } 717b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 71844cd7ae7SLois Curfman McInnes } 719d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 720fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 72197f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 722d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 723854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&sptr);CHKERRQ(ierr); 724496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 725496be53dSLois Curfman McInnes sptr[i] = nzd+1; 72660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 727496be53dSLois Curfman McInnes if (a->j[j] >= i) { 728aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 72936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 730496be53dSLois Curfman McInnes #else 731496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 732496be53dSLois Curfman McInnes #endif 733496be53dSLois Curfman McInnes } 734496be53dSLois Curfman McInnes } 735496be53dSLois Curfman McInnes } 7362e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 73777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 7382e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 7392205254eSKarl Rupp if (i+4<m) { 7402205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr); 7412205254eSKarl Rupp } else if (i+3<m) { 7422205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr); 7432205254eSKarl Rupp } else if (i+2<m) { 7442205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr); 
7452205254eSKarl Rupp } else if (i+1<m) { 7462205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr); 7472205254eSKarl Rupp } else if (i<m) { 7482205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr); 7492205254eSKarl Rupp } else { 7502205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr); 7512205254eSKarl Rupp } 752496be53dSLois Curfman McInnes } 753b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 754606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 755496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 75660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 75777431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 758496be53dSLois Curfman McInnes } 759b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 760496be53dSLois Curfman McInnes } 761b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 762496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 76360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 764496be53dSLois Curfman McInnes if (a->j[j] >= i) { 765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 76760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 7686831982aSBarry Smith } 769496be53dSLois Curfman McInnes #else 77060e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j]);CHKERRQ(ierr);} 771496be53dSLois Curfman McInnes #endif 772496be53dSLois Curfman McInnes } 773496be53dSLois Curfman McInnes } 774b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 775496be53dSLois Curfman McInnes 
} 776d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 777fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 77897f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 77987828ca2SBarry Smith PetscScalar value; 78068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 78168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 78268f1ed48SBarry Smith 78368f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 78468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 78568f1ed48SBarry Smith realonly = PETSC_FALSE; 78668f1ed48SBarry Smith break; 78768f1ed48SBarry Smith } 78868f1ed48SBarry Smith } 78968f1ed48SBarry Smith #endif 79002594712SBarry Smith 791d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 79202594712SBarry Smith for (i=0; i<m; i++) { 79302594712SBarry Smith jcnt = 0; 794d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 795e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 79602594712SBarry Smith value = a->a[cnt++]; 797e24b481bSBarry Smith jcnt++; 79802594712SBarry Smith } else { 79902594712SBarry Smith value = 0.0; 80002594712SBarry Smith } 801aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80268f1ed48SBarry Smith if (realonly) { 80360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value));CHKERRQ(ierr); 80468f1ed48SBarry Smith } else { 80560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value));CHKERRQ(ierr); 80668f1ed48SBarry Smith } 80702594712SBarry Smith #else 80860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value);CHKERRQ(ierr); 80902594712SBarry Smith #endif 81002594712SBarry Smith } 811b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 81202594712SBarry Smith } 813d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8143c215bfdSMatthew 
Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 815150b93efSMatthew G. Knepley PetscInt fshift=1; 816d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 8173c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 81819303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n");CHKERRQ(ierr); 8193c215bfdSMatthew Knepley #else 82019303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n");CHKERRQ(ierr); 8213c215bfdSMatthew Knepley #endif 822d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 8233c215bfdSMatthew Knepley for (i=0; i<m; i++) { 82460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8253c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 826a9a0e077SKarl Rupp ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8273c215bfdSMatthew Knepley #else 828150b93efSMatthew G. 
Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j]);CHKERRQ(ierr); 8293c215bfdSMatthew Knepley #endif 8303c215bfdSMatthew Knepley } 8313c215bfdSMatthew Knepley } 832d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8333a40ed3dSBarry Smith } else { 834d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 835d5f3da31SBarry Smith if (A->factortype) { 83616cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 83716cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 83816cd7e1dSShri Abhyankar /* L part */ 83960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 84016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 84116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 84260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 84316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8446712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 84516cd7e1dSShri Abhyankar } else { 84660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 84716cd7e1dSShri Abhyankar } 84816cd7e1dSShri Abhyankar #else 84960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 85016cd7e1dSShri Abhyankar #endif 85116cd7e1dSShri Abhyankar } 85216cd7e1dSShri Abhyankar /* diagonal */ 85316cd7e1dSShri Abhyankar j = a->diag[i]; 85416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 85516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 85660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g 
i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 85716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8586712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])));CHKERRQ(ierr); 85916cd7e1dSShri Abhyankar } else { 86060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 86116cd7e1dSShri Abhyankar } 86216cd7e1dSShri Abhyankar #else 86360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)(1.0/a->a[j]));CHKERRQ(ierr); 86416cd7e1dSShri Abhyankar #endif 86516cd7e1dSShri Abhyankar 86616cd7e1dSShri Abhyankar /* U part */ 86760e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 86816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 86916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 87060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 87116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 87222ab088eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 87316cd7e1dSShri Abhyankar } else { 87460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 87516cd7e1dSShri Abhyankar } 87616cd7e1dSShri Abhyankar #else 87760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 87816cd7e1dSShri Abhyankar #endif 87916cd7e1dSShri Abhyankar } 88016cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 88116cd7e1dSShri Abhyankar } 88216cd7e1dSShri Abhyankar } else { 88317ab2063SBarry 
Smith for (i=0; i<m; i++) { 88477431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 88560e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 886aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 88736db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 88860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 88936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 89060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8913a40ed3dSBarry Smith } else { 89260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 89317ab2063SBarry Smith } 89417ab2063SBarry Smith #else 89560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 89617ab2063SBarry Smith #endif 89717ab2063SBarry Smith } 898b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 89917ab2063SBarry Smith } 90016cd7e1dSShri Abhyankar } 901d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 90217ab2063SBarry Smith } 903b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 9043a40ed3dSBarry Smith PetscFunctionReturn(0); 905416022c9SBarry Smith } 906416022c9SBarry Smith 9079804daf3SBarry Smith #include <petscdraw.h> 908dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 909416022c9SBarry Smith { 910480ef9eaSBarry Smith Mat A = (Mat) Aa; 911416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 912dfbe8321SBarry Smith PetscErrorCode ierr; 913383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 914383922c3SLisandro Dalcin int color; 915b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 
916b0a32e0cSBarry Smith PetscViewer viewer; 917f3ef73ceSBarry Smith PetscViewerFormat format; 918cddf8d76SBarry Smith 9193a40ed3dSBarry Smith PetscFunctionBegin; 920480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 921b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 922b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 923383922c3SLisandro Dalcin 924416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9250513a670SBarry Smith 926fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 927383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9280513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 929b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 930416022c9SBarry Smith for (i=0; i<m; i++) { 931cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 932bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 933bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 93436db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 935b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 936cddf8d76SBarry Smith } 937cddf8d76SBarry Smith } 938b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 939cddf8d76SBarry Smith for (i=0; i<m; i++) { 940cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 941bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 942bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 943cddf8d76SBarry Smith if (a->a[j] != 0.) 
continue; 944b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 945cddf8d76SBarry Smith } 946cddf8d76SBarry Smith } 947b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 948cddf8d76SBarry Smith for (i=0; i<m; i++) { 949cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 950bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 951bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 95236db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 953b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 954416022c9SBarry Smith } 955416022c9SBarry Smith } 956383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9570513a670SBarry Smith } else { 9580513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 9590513a670SBarry Smith /* first determine max of all nonzero values */ 960b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 961383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 962b0a32e0cSBarry Smith PetscDraw popup; 9630513a670SBarry Smith 9640513a670SBarry Smith for (i=0; i<nz; i++) { 9650513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 9660513a670SBarry Smith } 967383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 968b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 96945f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 970383922c3SLisandro Dalcin 971383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9720513a670SBarry Smith for (i=0; i<m; i++) { 973383922c3SLisandro Dalcin y_l = m - i - 1.0; 974383922c3SLisandro Dalcin y_r = y_l + 1.0; 975bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 976383922c3SLisandro Dalcin x_l = a->j[j]; 977383922c3SLisandro Dalcin x_r = x_l + 1.0; 978b05fc000SLisandro Dalcin color = 
PetscDrawRealToColor(PetscAbsScalar(a->a[count]),minv,maxv); 979b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 9800513a670SBarry Smith count++; 9810513a670SBarry Smith } 9820513a670SBarry Smith } 983383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9840513a670SBarry Smith } 985480ef9eaSBarry Smith PetscFunctionReturn(0); 986480ef9eaSBarry Smith } 987cddf8d76SBarry Smith 9889804daf3SBarry Smith #include <petscdraw.h> 989dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 990480ef9eaSBarry Smith { 991dfbe8321SBarry Smith PetscErrorCode ierr; 992b0a32e0cSBarry Smith PetscDraw draw; 99336db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 994ace3abfcSBarry Smith PetscBool isnull; 995480ef9eaSBarry Smith 996480ef9eaSBarry Smith PetscFunctionBegin; 997b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 998b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 999480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1000480ef9eaSBarry Smith 1001d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1002480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1003b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1004832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1005b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 10060298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1007832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 10083a40ed3dSBarry Smith PetscFunctionReturn(0); 1009416022c9SBarry Smith } 1010416022c9SBarry Smith 1011dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1012416022c9SBarry Smith { 1013dfbe8321SBarry Smith PetscErrorCode ierr; 
1014ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1015416022c9SBarry Smith 10163a40ed3dSBarry Smith PetscFunctionBegin; 1017251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1018251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1019251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 1020c45a1595SBarry Smith if (iascii) { 10213a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 10220f5bd95cSBarry Smith } else if (isbinary) { 10233a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 10240f5bd95cSBarry Smith } else if (isdraw) { 10253a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 102611aeaf0aSBarry Smith } 10274108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 10283a40ed3dSBarry Smith PetscFunctionReturn(0); 102917ab2063SBarry Smith } 103019bcc07fSBarry Smith 1031dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 103217ab2063SBarry Smith { 1033416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10346849ba73SBarry Smith PetscErrorCode ierr; 1035580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1036d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 103754f21887SBarry Smith MatScalar *aa = a->a,*ap; 10383447b6efSHong Zhang PetscReal ratio = 0.6; 103917ab2063SBarry Smith 10403a40ed3dSBarry Smith PetscFunctionBegin; 10413a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 1042071fcb05SBarry Smith ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1043071fcb05SBarry Smith if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) PetscFunctionReturn(0); 104417ab2063SBarry Smith 104543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most 
nonzeros */ 104617ab2063SBarry Smith for (i=1; i<m; i++) { 1047416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 104817ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 104994a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 105017ab2063SBarry Smith if (fshift) { 1051bfeeae90SHong Zhang ip = aj + ai[i]; 1052bfeeae90SHong Zhang ap = aa + ai[i]; 105317ab2063SBarry Smith N = ailen[i]; 1054580bdb30SBarry Smith ierr = PetscArraymove(ip-fshift,ip,N);CHKERRQ(ierr); 1055580bdb30SBarry Smith if (!A->structure_only) { 1056580bdb30SBarry Smith ierr = PetscArraymove(ap-fshift,ap,N);CHKERRQ(ierr); 105717ab2063SBarry Smith } 105817ab2063SBarry Smith } 105917ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 106017ab2063SBarry Smith } 106117ab2063SBarry Smith if (m) { 106217ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 106317ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 106417ab2063SBarry Smith } 10657b083b7cSBarry Smith 106617ab2063SBarry Smith /* reset ilen and imax for each row */ 10677b083b7cSBarry Smith a->nonzerorowcnt = 0; 1068396832f4SHong Zhang if (A->structure_only) { 1069071fcb05SBarry Smith ierr = PetscFree(a->imax);CHKERRQ(ierr); 1070071fcb05SBarry Smith ierr = PetscFree(a->ilen);CHKERRQ(ierr); 1071396832f4SHong Zhang } else { /* !A->structure_only */ 107217ab2063SBarry Smith for (i=0; i<m; i++) { 107317ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 10747b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 107517ab2063SBarry Smith } 1076396832f4SHong Zhang } 1077bfeeae90SHong Zhang a->nz = ai[m]; 107865e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 107917ab2063SBarry Smith 108009f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1081d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D 
used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 1082ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 1083ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 10842205254eSKarl Rupp 10858e58a170SBarry Smith A->info.mallocs += a->reallocs; 1086dd5f02e7SSatish Balay a->reallocs = 0; 10876712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 108836db0b34SBarry Smith a->rmax = rmax; 10894e220ebcSLois Curfman McInnes 1090396832f4SHong Zhang if (!A->structure_only) { 109111e456e1SBarry Smith ierr = MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 1092396832f4SHong Zhang } 10934108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 10943a40ed3dSBarry Smith PetscFunctionReturn(0); 109517ab2063SBarry Smith } 109617ab2063SBarry Smith 109799cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 109899cafbc1SBarry Smith { 109999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 110099cafbc1SBarry Smith PetscInt i,nz = a->nz; 110154f21887SBarry Smith MatScalar *aa = a->a; 1102acf2f550SJed Brown PetscErrorCode ierr; 110399cafbc1SBarry Smith 110499cafbc1SBarry Smith PetscFunctionBegin; 110599cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 1106acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1107e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1108e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 1109e2cf4d64SStefano Zampini #endif 111099cafbc1SBarry Smith PetscFunctionReturn(0); 111199cafbc1SBarry Smith } 111299cafbc1SBarry Smith 111399cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 111499cafbc1SBarry Smith { 111599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 111699cafbc1SBarry Smith PetscInt i,nz = a->nz; 
111754f21887SBarry Smith MatScalar *aa = a->a; 1118acf2f550SJed Brown PetscErrorCode ierr; 111999cafbc1SBarry Smith 112099cafbc1SBarry Smith PetscFunctionBegin; 112199cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 1122acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1123e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1124e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 1125e2cf4d64SStefano Zampini #endif 112699cafbc1SBarry Smith PetscFunctionReturn(0); 112799cafbc1SBarry Smith } 112899cafbc1SBarry Smith 1129dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 113017ab2063SBarry Smith { 1131416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1132dfbe8321SBarry Smith PetscErrorCode ierr; 11333a40ed3dSBarry Smith 11343a40ed3dSBarry Smith PetscFunctionBegin; 1135580bdb30SBarry Smith ierr = PetscArrayzero(a->a,a->i[A->rmap->n]);CHKERRQ(ierr); 1136acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1137e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1138e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 1139e2cf4d64SStefano Zampini #endif 11403a40ed3dSBarry Smith PetscFunctionReturn(0); 114117ab2063SBarry Smith } 1142416022c9SBarry Smith 1143dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 114417ab2063SBarry Smith { 1145416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1146dfbe8321SBarry Smith PetscErrorCode ierr; 1147d5d45c9bSBarry Smith 11483a40ed3dSBarry Smith PetscFunctionBegin; 1149aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1150d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 115117ab2063SBarry Smith #endif 1152e6b907acSBarry Smith ierr = 
MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 11536bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 11546bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 115505b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 1156d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 1157071fcb05SBarry Smith ierr = PetscFree(a->imax);CHKERRQ(ierr); 1158071fcb05SBarry Smith ierr = PetscFree(a->ilen);CHKERRQ(ierr); 1159846b4da1SFande Kong ierr = PetscFree(a->ipre);CHKERRQ(ierr); 116071f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 116105b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 11626bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 116305b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 11646bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 1165cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 11660b7e3e3dSHong Zhang ierr = PetscFree(a->matmult_abdense);CHKERRQ(ierr); 1167a30b2313SHong Zhang 11684108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 1169bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 1170901853e0SKris Buschelman 1171dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 1172bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL);CHKERRQ(ierr); 1173bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr); 1174bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr); 1175bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL);CHKERRQ(ierr); 1176bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL);CHKERRQ(ierr); 1177bdf89e91SBarry Smith 
ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL);CHKERRQ(ierr); 1178af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 1179af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL);CHKERRQ(ierr); 1180af8000cdSHong Zhang #endif 118163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 118263c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL);CHKERRQ(ierr); 11833dad0653Sstefano_zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMatMult_transpose_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 118463c07aadSStefano Zampini #endif 1185b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1186c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL);CHKERRQ(ierr); 1187c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL);CHKERRQ(ierr); 1188bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL);CHKERRQ(ierr); 1189bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL);CHKERRQ(ierr); 1190846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL);CHKERRQ(ierr); 1191bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr); 1192bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL);CHKERRQ(ierr); 119375d48cdbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatPtAP_is_seqaij_C",NULL);CHKERRQ(ierr); 11943a40ed3dSBarry Smith PetscFunctionReturn(0); 119517ab2063SBarry Smith } 119617ab2063SBarry Smith 1197ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 
119817ab2063SBarry Smith { 1199416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12004846f1f5SKris Buschelman PetscErrorCode ierr; 12013a40ed3dSBarry Smith 12023a40ed3dSBarry Smith PetscFunctionBegin; 1203a65d3064SKris Buschelman switch (op) { 1204a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 12054e0d8c25SBarry Smith a->roworiented = flg; 1206a65d3064SKris Buschelman break; 1207a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1208a9817697SBarry Smith a->keepnonzeropattern = flg; 1209a65d3064SKris Buschelman break; 1210512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1211512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1212a65d3064SKris Buschelman break; 1213a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 12144e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1215a65d3064SKris Buschelman break; 1216a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 12174e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1218a65d3064SKris Buschelman break; 121928b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 122028b2fa4aSMatthew Knepley a->nounused = (flg ? 
-1 : 0); 122128b2fa4aSMatthew Knepley break; 1222a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 12234e0d8c25SBarry Smith a->ignorezeroentries = flg; 12240df259c2SBarry Smith break; 12253d472b54SHong Zhang case MAT_SPD: 1226b1646e73SJed Brown case MAT_SYMMETRIC: 1227b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1228b1646e73SJed Brown case MAT_HERMITIAN: 1229b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1230957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 12315021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 12325021d80fSJed Brown break; 12334e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1234a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1235a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 1236290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 1237a65d3064SKris Buschelman break; 1238b87ac2d8SJed Brown case MAT_USE_INODES: 1239b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 1240b87ac2d8SJed Brown break; 1241c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1242c10200c1SHong Zhang A->submat_singleis = flg; 1243c10200c1SHong Zhang break; 1244071fcb05SBarry Smith case MAT_SORTED_FULL: 1245071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1246071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1247071fcb05SBarry Smith break; 1248a65d3064SKris Buschelman default: 1249e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1250a65d3064SKris Buschelman } 12514108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 12523a40ed3dSBarry Smith PetscFunctionReturn(0); 125317ab2063SBarry Smith } 125417ab2063SBarry Smith 1255dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 125617ab2063SBarry Smith { 1257416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12586849ba73SBarry Smith PetscErrorCode ierr; 1259fdc842d1SBarry Smith 
PetscInt i,j,n,*ai=a->i,*aj=a->j; 1260fdc842d1SBarry Smith PetscScalar *aa=a->a,*x; 126117ab2063SBarry Smith 12623a40ed3dSBarry Smith PetscFunctionBegin; 1263d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1264e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 126535e7444dSHong Zhang 1266d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1267d3e70bfaSHong Zhang PetscInt *diag=a->diag; 1268fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 12692c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 1270fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 127135e7444dSHong Zhang PetscFunctionReturn(0); 127235e7444dSHong Zhang } 127335e7444dSHong Zhang 1274fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 127535e7444dSHong Zhang for (i=0; i<n; i++) { 1276fdc842d1SBarry Smith x[i] = 0.0; 127735e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 127835e7444dSHong Zhang if (aj[j] == i) { 127935e7444dSHong Zhang x[i] = aa[j]; 128017ab2063SBarry Smith break; 128117ab2063SBarry Smith } 128217ab2063SBarry Smith } 128317ab2063SBarry Smith } 1284fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 12853a40ed3dSBarry Smith PetscFunctionReturn(0); 128617ab2063SBarry Smith } 128717ab2063SBarry Smith 1288c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1289dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 129017ab2063SBarry Smith { 1291416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1292d9ca1df4SBarry Smith PetscScalar *y; 1293d9ca1df4SBarry Smith const PetscScalar *x; 1294dfbe8321SBarry Smith PetscErrorCode ierr; 1295d0f46423SBarry Smith PetscInt m = A->rmap->n; 12965c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1297d9ca1df4SBarry Smith const MatScalar *v; 1298a77337e4SBarry 
Smith PetscScalar alpha; 1299d9ca1df4SBarry Smith PetscInt n,i,j; 1300d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 13013447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1302ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 13035c897100SBarry Smith #endif 130417ab2063SBarry Smith 13053a40ed3dSBarry Smith PetscFunctionBegin; 13062e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 1307d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13081ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13095c897100SBarry Smith 13105c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1311bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 13125c897100SBarry Smith #else 13133447b6efSHong Zhang if (usecprow) { 13143447b6efSHong Zhang m = cprow.nrows; 13153447b6efSHong Zhang ii = cprow.i; 13167b2bb3b9SHong Zhang ridx = cprow.rindex; 13173447b6efSHong Zhang } else { 13183447b6efSHong Zhang ii = a->i; 13193447b6efSHong Zhang } 132017ab2063SBarry Smith for (i=0; i<m; i++) { 13213447b6efSHong Zhang idx = a->j + ii[i]; 13223447b6efSHong Zhang v = a->a + ii[i]; 13233447b6efSHong Zhang n = ii[i+1] - ii[i]; 13243447b6efSHong Zhang if (usecprow) { 13257b2bb3b9SHong Zhang alpha = x[ridx[i]]; 13263447b6efSHong Zhang } else { 132717ab2063SBarry Smith alpha = x[i]; 13283447b6efSHong Zhang } 132904fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 133017ab2063SBarry Smith } 13315c897100SBarry Smith #endif 1332dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1333d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13341ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13353a40ed3dSBarry Smith PetscFunctionReturn(0); 133617ab2063SBarry Smith } 133717ab2063SBarry Smith 1338dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 13395c897100SBarry Smith { 1340dfbe8321SBarry Smith PetscErrorCode 
ierr; 13415c897100SBarry Smith 13425c897100SBarry Smith PetscFunctionBegin; 1343170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 13445c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 13455c897100SBarry Smith PetscFunctionReturn(0); 13465c897100SBarry Smith } 13475c897100SBarry Smith 1348c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 134978b84d54SShri Abhyankar 1350dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 135117ab2063SBarry Smith { 1352416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1353d9fead3dSBarry Smith PetscScalar *y; 135454f21887SBarry Smith const PetscScalar *x; 135554f21887SBarry Smith const MatScalar *aa; 1356dfbe8321SBarry Smith PetscErrorCode ierr; 1357003131ecSBarry Smith PetscInt m=A->rmap->n; 13580298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 13597b083b7cSBarry Smith PetscInt n,i; 1360362ced78SSatish Balay PetscScalar sum; 1361ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 136217ab2063SBarry Smith 1363b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 136497952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1365fee21e36SBarry Smith #endif 1366fee21e36SBarry Smith 13673a40ed3dSBarry Smith PetscFunctionBegin; 13683649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13691ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1370416022c9SBarry Smith ii = a->i; 13714eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 1372580bdb30SBarry Smith ierr = PetscArrayzero(y,m);CHKERRQ(ierr); 137397952fefSHong Zhang m = a->compressedrow.nrows; 137497952fefSHong Zhang ii = a->compressedrow.i; 137597952fefSHong Zhang ridx = a->compressedrow.rindex; 137697952fefSHong Zhang for (i=0; i<m; i++) { 137797952fefSHong Zhang n = ii[i+1] - ii[i]; 137897952fefSHong Zhang aj = a->j + ii[i]; 137997952fefSHong Zhang aa = a->a + ii[i]; 138097952fefSHong Zhang sum = 0.0; 1381003131ecSBarry Smith 
PetscSparseDensePlusDot(sum,x,aa,aj,n); 1382003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 138397952fefSHong Zhang y[*ridx++] = sum; 138497952fefSHong Zhang } 138597952fefSHong Zhang } else { /* do not use compressed row format */ 1386b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 13873d3eaba7SBarry Smith aj = a->j; 13883d3eaba7SBarry Smith aa = a->a; 1389b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1390b05257ddSBarry Smith #else 139117ab2063SBarry Smith for (i=0; i<m; i++) { 1392003131ecSBarry Smith n = ii[i+1] - ii[i]; 1393003131ecSBarry Smith aj = a->j + ii[i]; 1394003131ecSBarry Smith aa = a->a + ii[i]; 139517ab2063SBarry Smith sum = 0.0; 1396003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 139717ab2063SBarry Smith y[i] = sum; 139817ab2063SBarry Smith } 13998d195f9aSBarry Smith #endif 1400b05257ddSBarry Smith } 14017b083b7cSBarry Smith ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); 14023649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 14031ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 14043a40ed3dSBarry Smith PetscFunctionReturn(0); 140517ab2063SBarry Smith } 140617ab2063SBarry Smith 1407b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1408b434eb95SMatthew G. Knepley { 1409b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1410b434eb95SMatthew G. Knepley PetscScalar *y; 1411b434eb95SMatthew G. Knepley const PetscScalar *x; 1412b434eb95SMatthew G. Knepley const MatScalar *aa; 1413b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1414b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1415b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1416b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1417b434eb95SMatthew G. Knepley PetscScalar sum; 1418b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1419b434eb95SMatthew G. Knepley 1420b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1421b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1422b434eb95SMatthew G. Knepley #endif 1423b434eb95SMatthew G. Knepley 1424b434eb95SMatthew G. Knepley PetscFunctionBegin; 1425b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1426b434eb95SMatthew G. Knepley ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1427b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1428b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1429b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1430b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1431b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1432b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1433b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1434b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1435b434eb95SMatthew G. Knepley sum = 0.0; 1436b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1437b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1438b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1439b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1440b434eb95SMatthew G. Knepley } 1441b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 14423d3eaba7SBarry Smith ii = a->i; 1443b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1444b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1445b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1446b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1447b434eb95SMatthew G. Knepley sum = 0.0; 1448b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1449b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1450b434eb95SMatthew G. Knepley y[i] = sum; 1451b434eb95SMatthew G. Knepley } 1452b434eb95SMatthew G. Knepley } 1453b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 1454b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1455b434eb95SMatthew G. 
Knepley ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 1456b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1457b434eb95SMatthew G. Knepley } 1458b434eb95SMatthew G. Knepley 1459b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1460b434eb95SMatthew G. Knepley { 1461b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1462b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1463b434eb95SMatthew G. Knepley const PetscScalar *x; 1464b434eb95SMatthew G. Knepley const MatScalar *aa; 1465b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1466b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1467b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1468b434eb95SMatthew G. Knepley PetscScalar sum; 1469b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1470b434eb95SMatthew G. Knepley 1471b434eb95SMatthew G. Knepley PetscFunctionBegin; 1472b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1473d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1474b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1475b434eb95SMatthew G. Knepley if (zz != yy) { 1476580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 1477b434eb95SMatthew G. Knepley } 1478b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1479b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1480b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1481b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1482b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1483b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1484b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1485b434eb95SMatthew G. Knepley sum = y[*ridx]; 1486b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1487b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1488b434eb95SMatthew G. Knepley } 1489b434eb95SMatthew G. 
Knepley } else { /* do not use compressed row format */ 14903d3eaba7SBarry Smith ii = a->i; 1491b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1492b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1493b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1494b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1495b434eb95SMatthew G. Knepley sum = y[i]; 1496b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1497b434eb95SMatthew G. Knepley z[i] = sum; 1498b434eb95SMatthew G. Knepley } 1499b434eb95SMatthew G. Knepley } 1500b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1501b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1502d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1503b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1504b434eb95SMatthew G. Knepley } 1505b434eb95SMatthew G. Knepley 1506c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1507dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 150817ab2063SBarry Smith { 1509416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1510f15663dcSBarry Smith PetscScalar *y,*z; 1511f15663dcSBarry Smith const PetscScalar *x; 151254f21887SBarry Smith const MatScalar *aa; 1513dfbe8321SBarry Smith PetscErrorCode ierr; 1514d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1515d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1516362ced78SSatish Balay PetscScalar sum; 1517ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 15189ea0dfa2SSatish Balay 15193a40ed3dSBarry Smith PetscFunctionBegin; 1520f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1521d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15224eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 15234eb6d288SHong Zhang if (zz != yy) { 1524580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 15254eb6d288SHong Zhang } 152697952fefSHong 
Zhang m = a->compressedrow.nrows; 152797952fefSHong Zhang ii = a->compressedrow.i; 152897952fefSHong Zhang ridx = a->compressedrow.rindex; 152997952fefSHong Zhang for (i=0; i<m; i++) { 153097952fefSHong Zhang n = ii[i+1] - ii[i]; 153197952fefSHong Zhang aj = a->j + ii[i]; 153297952fefSHong Zhang aa = a->a + ii[i]; 153397952fefSHong Zhang sum = y[*ridx]; 1534f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 153597952fefSHong Zhang z[*ridx++] = sum; 153697952fefSHong Zhang } 153797952fefSHong Zhang } else { /* do not use compressed row format */ 15383d3eaba7SBarry Smith ii = a->i; 1539f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 15403d3eaba7SBarry Smith aj = a->j; 15413d3eaba7SBarry Smith aa = a->a; 1542f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1543f15663dcSBarry Smith #else 154417ab2063SBarry Smith for (i=0; i<m; i++) { 1545f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1546f15663dcSBarry Smith aj = a->j + ii[i]; 1547f15663dcSBarry Smith aa = a->a + ii[i]; 154817ab2063SBarry Smith sum = y[i]; 1549f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 155017ab2063SBarry Smith z[i] = sum; 155117ab2063SBarry Smith } 155202ab625aSSatish Balay #endif 1553f15663dcSBarry Smith } 1554dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1555f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1556d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15573a40ed3dSBarry Smith PetscFunctionReturn(0); 155817ab2063SBarry Smith } 155917ab2063SBarry Smith 156017ab2063SBarry Smith /* 156117ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
156217ab2063SBarry Smith */ 1563dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 156417ab2063SBarry Smith { 1565416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 15666849ba73SBarry Smith PetscErrorCode ierr; 1567d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 156817ab2063SBarry Smith 15693a40ed3dSBarry Smith PetscFunctionBegin; 157009f38230SBarry Smith if (!a->diag) { 1571785e854fSJed Brown ierr = PetscMalloc1(m,&a->diag);CHKERRQ(ierr); 15723bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt));CHKERRQ(ierr); 157309f38230SBarry Smith } 1574d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 157509f38230SBarry Smith a->diag[i] = a->i[i+1]; 1576bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1577bfeeae90SHong Zhang if (a->j[j] == i) { 157809f38230SBarry Smith a->diag[i] = j; 157917ab2063SBarry Smith break; 158017ab2063SBarry Smith } 158117ab2063SBarry Smith } 158217ab2063SBarry Smith } 15833a40ed3dSBarry Smith PetscFunctionReturn(0); 158417ab2063SBarry Smith } 158517ab2063SBarry Smith 158661ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 158761ecd0c6SBarry Smith { 158861ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 158961ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 159061ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 159161ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 159261ecd0c6SBarry Smith PetscErrorCode ierr; 159361ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 159461ecd0c6SBarry Smith 159561ecd0c6SBarry Smith PetscFunctionBegin; 159661ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 159761ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation(A,1,NULL);CHKERRQ(ierr); 159861ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 159961ecd0c6SBarry Smith PetscFunctionReturn(0); 160061ecd0c6SBarry Smith } 160161ecd0c6SBarry Smith 160261ecd0c6SBarry Smith if (a->diagonaldense) { 160361ecd0c6SBarry 
Smith cnt = 0; 160461ecd0c6SBarry Smith } else { 160561ecd0c6SBarry Smith ierr = PetscCalloc1(A->rmap->n,&mdiag);CHKERRQ(ierr); 160661ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 160761ecd0c6SBarry Smith if (diag[i] >= ii[i+1]) { 160861ecd0c6SBarry Smith cnt++; 160961ecd0c6SBarry Smith mdiag[i] = 1; 161061ecd0c6SBarry Smith } 161161ecd0c6SBarry Smith } 161261ecd0c6SBarry Smith } 161361ecd0c6SBarry Smith if (!cnt) { 161461ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 161561ecd0c6SBarry Smith } else { 1616b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1617b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 161861ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 161961ecd0c6SBarry Smith 162061ecd0c6SBarry Smith a->a = NULL; 162161ecd0c6SBarry Smith a->j = NULL; 162261ecd0c6SBarry Smith a->i = NULL; 162361ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 162461ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 162561ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 1626447d62f5SStefano Zampini a->imax[i] = PetscMin(a->imax[i],A->cmap->n); 162761ecd0c6SBarry Smith } 162861ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax);CHKERRQ(ierr); 162961ecd0c6SBarry Smith 163061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 163161ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 163261ecd0c6SBarry Smith ierr = MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES);CHKERRQ(ierr); 1633447d62f5SStefano Zampini if (i < A->cmap->n) { 163461ecd0c6SBarry Smith ierr = MatSetValue(A,i,i,v,ADD_VALUES);CHKERRQ(ierr); 163561ecd0c6SBarry Smith } 1636447d62f5SStefano Zampini } 163761ecd0c6SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 163861ecd0c6SBarry Smith ierr 
= MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 163961ecd0c6SBarry Smith if (singlemalloc) { 164061ecd0c6SBarry Smith ierr = PetscFree3(olda,oldj,oldi);CHKERRQ(ierr); 164161ecd0c6SBarry Smith } else { 164261ecd0c6SBarry Smith if (free_a) {ierr = PetscFree(olda);CHKERRQ(ierr);} 164361ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldj);CHKERRQ(ierr);} 164461ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldi);CHKERRQ(ierr);} 164561ecd0c6SBarry Smith } 164661ecd0c6SBarry Smith } 164761ecd0c6SBarry Smith ierr = PetscFree(mdiag);CHKERRQ(ierr); 164861ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 164961ecd0c6SBarry Smith PetscFunctionReturn(0); 165061ecd0c6SBarry Smith } 165161ecd0c6SBarry Smith 1652be5855fcSBarry Smith /* 1653be5855fcSBarry Smith Checks for missing diagonals 1654be5855fcSBarry Smith */ 1655ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1656be5855fcSBarry Smith { 1657be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16587734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1659994fe344SLisandro Dalcin PetscErrorCode ierr; 1660be5855fcSBarry Smith 1661be5855fcSBarry Smith PetscFunctionBegin; 166209f38230SBarry Smith *missing = PETSC_FALSE; 16637734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 166409f38230SBarry Smith *missing = PETSC_TRUE; 166509f38230SBarry Smith if (d) *d = 0; 1666994fe344SLisandro Dalcin ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr); 166709f38230SBarry Smith } else { 166801445905SHong Zhang PetscInt n; 166901445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1670f1e2ffcdSBarry Smith diag = a->diag; 167101445905SHong Zhang for (i=0; i<n; i++) { 16727734d3b5SMatthew G. 
Knepley if (diag[i] >= ii[i+1]) { 167309f38230SBarry Smith *missing = PETSC_TRUE; 167409f38230SBarry Smith if (d) *d = i; 1675994fe344SLisandro Dalcin ierr = PetscInfo1(A,"Matrix is missing diagonal number %D\n",i);CHKERRQ(ierr); 1676358d2f5dSShri Abhyankar break; 167709f38230SBarry Smith } 1678be5855fcSBarry Smith } 1679be5855fcSBarry Smith } 1680be5855fcSBarry Smith PetscFunctionReturn(0); 1681be5855fcSBarry Smith } 1682be5855fcSBarry Smith 16830da83c2eSBarry Smith #include <petscblaslapack.h> 16840da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 16850da83c2eSBarry Smith 16860da83c2eSBarry Smith /* 16870da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 16880da83c2eSBarry Smith */ 16890da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 16900da83c2eSBarry Smith { 16910da83c2eSBarry Smith PetscErrorCode ierr; 16920da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 16930da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 16940da83c2eSBarry Smith const PetscReal shift = 0.0; 16950da83c2eSBarry Smith PetscInt ipvt[5]; 16960da83c2eSBarry Smith PetscScalar work[25],*v_work; 16970da83c2eSBarry Smith 16980da83c2eSBarry Smith PetscFunctionBegin; 16990da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 17000da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 17010da83c2eSBarry Smith if (ncnt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %D doesn't match number matrix rows %D",ncnt,n); 17020da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17030da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 17040da83c2eSBarry Smith } 17050da83c2eSBarry Smith ierr = PetscMalloc1(bsizemax,&indx);CHKERRQ(ierr); 17060da83c2eSBarry Smith if (bsizemax > 7) { 17070da83c2eSBarry Smith ierr = 
PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots);CHKERRQ(ierr); 17080da83c2eSBarry Smith } 17090da83c2eSBarry Smith ncnt = 0; 17100da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17110da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 17120da83c2eSBarry Smith ierr = MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag);CHKERRQ(ierr); 17130da83c2eSBarry Smith switch (bsizes[i]) { 17140da83c2eSBarry Smith case 1: 17150da83c2eSBarry Smith *diag = 1.0/(*diag); 17160da83c2eSBarry Smith break; 17170da83c2eSBarry Smith case 2: 17180da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17190da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17200da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 17210da83c2eSBarry Smith break; 17220da83c2eSBarry Smith case 3: 17230da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17240da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17250da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 17260da83c2eSBarry Smith break; 17270da83c2eSBarry Smith case 4: 17280da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17290da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17300da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 17310da83c2eSBarry Smith break; 17320da83c2eSBarry Smith case 5: 17330da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17340da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17350da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 17360da83c2eSBarry 
Smith break; 17370da83c2eSBarry Smith case 6: 17380da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17390da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17400da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 17410da83c2eSBarry Smith break; 17420da83c2eSBarry Smith case 7: 17430da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17440da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17450da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 17460da83c2eSBarry Smith break; 17470da83c2eSBarry Smith default: 17480da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17490da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17500da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bsizes[i]);CHKERRQ(ierr); 17510da83c2eSBarry Smith } 17520da83c2eSBarry Smith ncnt += bsizes[i]; 17530da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 17540da83c2eSBarry Smith } 17550da83c2eSBarry Smith if (bsizemax > 7) { 17560da83c2eSBarry Smith ierr = PetscFree2(v_work,v_pivots);CHKERRQ(ierr); 17570da83c2eSBarry Smith } 17580da83c2eSBarry Smith ierr = PetscFree(indx);CHKERRQ(ierr); 17590da83c2eSBarry Smith PetscFunctionReturn(0); 17600da83c2eSBarry Smith } 17610da83c2eSBarry Smith 1762422a814eSBarry Smith /* 1763422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1764422a814eSBarry Smith */ 17657087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 176671f1c65dSBarry Smith { 176771f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 176871f1c65dSBarry 
Smith PetscErrorCode ierr; 1769d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 177054f21887SBarry Smith MatScalar *v = a->a; 177154f21887SBarry Smith PetscScalar *idiag,*mdiag; 177271f1c65dSBarry Smith 177371f1c65dSBarry Smith PetscFunctionBegin; 177471f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 177571f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 177671f1c65dSBarry Smith diag = a->diag; 177771f1c65dSBarry Smith if (!a->idiag) { 1778dcca6d9dSJed Brown ierr = PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work);CHKERRQ(ierr); 17793bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 178071f1c65dSBarry Smith v = a->a; 178171f1c65dSBarry Smith } 178271f1c65dSBarry Smith mdiag = a->mdiag; 178371f1c65dSBarry Smith idiag = a->idiag; 178471f1c65dSBarry Smith 1785422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 178671f1c65dSBarry Smith for (i=0; i<m; i++) { 178771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1788899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1789899639b0SHong Zhang if (PetscRealPart(fshift)) { 1790899639b0SHong Zhang ierr = PetscInfo1(A,"Zero diagonal on row %D\n",i);CHKERRQ(ierr); 17917b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17927b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 17937b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 1794a6fa060aSHong Zhang } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 1795899639b0SHong Zhang } 179671f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 179771f1c65dSBarry Smith } 179871f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 179971f1c65dSBarry Smith } else { 180071f1c65dSBarry Smith for (i=0; i<m; i++) { 180171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 180271f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 180371f1c65dSBarry Smith } 1804dc0b31edSSatish Balay ierr = 
#include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h>
/*
   MatSOR_SeqAIJ - SOR-type relaxation kernels for the SeqAIJ format.

   bb is the right-hand side (read only) and xx the iterate, which is updated in place.
   omega and fshift are handed to MatInvertDiagonal_SeqAIJ(), which caches the diagonal in
   a->mdiag and its scaled inverse in a->idiag; the cache is rebuilt whenever either value
   differs from the one used on the previous call.  its*lits sweeps are performed in total.

   Depending on flag the routine
     - SOR_APPLY_UPPER:  applies (U + D/omega) to bb and returns;
     - SOR_APPLY_LOWER:  is not implemented and raises PETSC_ERR_SUP;
     - SOR_EISENSTAT:    applies (L + E)^{-1} A (U + E)^{-1} with E = D/omega and returns;
     - otherwise:        runs forward and/or backward sweeps, the first of which is specialised
                         when SOR_ZERO_INITIAL_GUESS is set.

   a->ssor_work (t) is used as scratch space; after a forward sweep it holds b minus the
   lower-triangular product so that an immediately following backward sweep only has to
   apply the upper triangle.
*/
PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx)
{
  Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
  PetscScalar       *x,d,sum,*t,scale;
  const MatScalar   *v,*idiag=0,*mdiag;
  const PetscScalar *b, *bs,*xb, *ts;
  PetscErrorCode    ierr;
  PetscInt          n,m = A->rmap->n,i;
  const PetscInt    *idx,*diag;

  PetscFunctionBegin;
  /* global and local iteration counts are simply multiplied together */
  its = its*lits;

  if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
  if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);}
  a->fshift = fshift;
  a->omega  = omega;

  /* these are only read after MatInvertDiagonal_SeqAIJ() has had the chance to (re)build them */
  diag  = a->diag;
  t     = a->ssor_work;
  idiag = a->idiag;
  mdiag = a->mdiag;

  ierr = VecGetArray(xx,&x);CHKERRQ(ierr);
  ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr);
  /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
  if (flag == SOR_APPLY_UPPER) {
    /* apply (U + D/omega) to the vector */
    bs = b;
    for (i=0; i<m; i++) {
      d   = fshift + mdiag[i];
      /* entries strictly to the right of the diagonal in row i */
      n   = a->i[i+1] - diag[i] - 1;
      idx = a->j + diag[i] + 1;
      v   = a->a + diag[i] + 1;
      sum = b[i]*d/omega;
      PetscSparseDensePlusDot(sum,bs,v,idx,n);
      x[i] = sum;
    }
    ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
    ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
    ierr = PetscLogFlops(a->nz);CHKERRQ(ierr);
    PetscFunctionReturn(0);
  }

  if (flag == SOR_APPLY_LOWER) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented");
  else if (flag & SOR_EISENSTAT) {
    /* Let  A = L + U + D; where L is lower triangular,
       U is upper triangular, E = D/omega; This routine applies

            (L + E)^{-1} A (U + E)^{-1}

       to a vector efficiently using Eisenstat's trick.
    */
    scale = (2.0/omega) - 1.0;

    /*  x = (E + U)^{-1} b */
    for (i=m-1; i>=0; i--) {
      n   = a->i[i+1] - diag[i] - 1;
      idx = a->j + diag[i] + 1;
      v   = a->a + diag[i] + 1;
      sum = b[i];
      PetscSparseDenseMinusDot(sum,x,v,idx,n);
      x[i] = sum*idiag[i];
    }

    /*  t = b - (2*E - D)x */
    v = a->a;
    /* note: this loop advances the local diag pointer; it is reset from a->diag just below */
    for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i];

    /*  t = (E + L)^{-1}t */
    ts   = t;
    diag = a->diag;
    for (i=0; i<m; i++) {
      /* entries strictly to the left of the diagonal in row i */
      n   = diag[i] - a->i[i];
      idx = a->j + a->i[i];
      v   = a->a + a->i[i];
      sum = t[i];
      PetscSparseDenseMinusDot(sum,ts,v,idx,n);
      t[i] = sum*idiag[i];
      /*  x = x + t */
      x[i] += t[i];
    }

    ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr);
    ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
    ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
    PetscFunctionReturn(0);
  }
  if (flag & SOR_ZERO_INITIAL_GUESS) {
    /* first sweep with x == 0: the forward pass only touches the lower triangle and the
       backward pass only the upper triangle; this sweep is counted against its */
    if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
      for (i=0; i<m; i++) {
        n   = diag[i] - a->i[i];
        idx = a->j + a->i[i];
        v   = a->a + a->i[i];
        sum = b[i];
        PetscSparseDenseMinusDot(sum,x,v,idx,n);
        t[i] = sum;
        x[i] = sum*idiag[i];
      }
      /* the backward pass below starts from the saved lower-triangular result */
      xb   = t;
      ierr = PetscLogFlops(a->nz);CHKERRQ(ierr);
    } else xb = b;
    if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
      for (i=m-1; i>=0; i--) {
        n   = a->i[i+1] - diag[i] - 1;
        idx = a->j + diag[i] + 1;
        v   = a->a + diag[i] + 1;
        sum = xb[i];
        PetscSparseDenseMinusDot(sum,x,v,idx,n);
        if (xb == b) {
          /* no forward pass was done, so x[i] carries no previous value to blend in */
          x[i] = sum*idiag[i];
        } else {
          x[i] = (1-omega)*x[i] + sum*idiag[i];  /* omega in idiag */
        }
      }
      ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */
    }
    its--;
  }
  while (its--) {
    if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
      for (i=0; i<m; i++) {
        /* lower */
        n   = diag[i] - a->i[i];
        idx = a->j + a->i[i];
        v   = a->a + a->i[i];
        sum = b[i];
        PetscSparseDenseMinusDot(sum,x,v,idx,n);
        t[i] = sum; /* save application of the lower-triangular part */
        /* upper */
        n   = a->i[i+1] - diag[i] - 1;
        idx = a->j + diag[i] + 1;
        v   = a->a + diag[i] + 1;
        PetscSparseDenseMinusDot(sum,x,v,idx,n);
        x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */
      }
      xb   = t;
      ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
    } else xb = b;
    if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
      for (i=m-1; i>=0; i--) {
        sum = xb[i];
        if (xb == b) {
          /* whole matrix (no checkpointing available) */
          n   = a->i[i+1] - a->i[i];
          idx = a->j + a->i[i];
          v   = a->a + a->i[i];
          PetscSparseDenseMinusDot(sum,x,v,idx,n);
          /* the full-row product also subtracted the diagonal term, so add it back */
          x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i];
        } else { /* lower-triangular part has been saved, so only apply upper-triangular */
          n   = a->i[i+1] - diag[i] - 1;
          idx = a->j + diag[i] + 1;
          v   = a->a + diag[i] + 1;
          PetscSparseDenseMinusDot(sum,x,v,idx,n);
          x[i] = (1. - omega)*x[i] + sum*idiag[i];  /* omega in idiag */
        }
      }
      if (xb == b) {
        ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
      } else {
        ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */
      }
    }
  }
  ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
  ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 196617ab2063SBarry Smith } 1967b19a5dc2SMark Adams } 1968b19a5dc2SMark Adams if (xb == b) { 19699f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1970b19a5dc2SMark Adams } else { 1971b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 1972b19a5dc2SMark Adams } 197317ab2063SBarry Smith } 197417ab2063SBarry Smith } 19751ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19763649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1977365a8a9eSBarry Smith PetscFunctionReturn(0); 197817ab2063SBarry Smith } 197917ab2063SBarry Smith 19802af78befSBarry Smith 1981dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 198217ab2063SBarry Smith { 1983416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 19844e220ebcSLois Curfman McInnes 19853a40ed3dSBarry Smith PetscFunctionBegin; 19864e220ebcSLois Curfman McInnes info->block_size = 1.0; 19874e220ebcSLois Curfman McInnes info->nz_allocated = (double)a->maxnz; 19884e220ebcSLois Curfman McInnes info->nz_used = (double)a->nz; 19894e220ebcSLois Curfman McInnes info->nz_unneeded = (double)(a->maxnz - a->nz); 19904e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 19918e58a170SBarry Smith info->mallocs = (double)A->info.mallocs; 19927adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 1993d5f3da31SBarry Smith if (A->factortype) { 19944e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 19954e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 19964e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 19974e220ebcSLois Curfman McInnes } else { 19984e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 19994e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 20004e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 20014e220ebcSLois Curfman 
McInnes } 20023a40ed3dSBarry Smith PetscFunctionReturn(0); 200317ab2063SBarry Smith } 200417ab2063SBarry Smith 20052b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 200617ab2063SBarry Smith { 2007416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2008c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 20096849ba73SBarry Smith PetscErrorCode ierr; 201097b48c8fSBarry Smith const PetscScalar *xx; 201197b48c8fSBarry Smith PetscScalar *bb; 2012c7da8527SEric Chamberland PetscInt d = 0; 201317ab2063SBarry Smith 20143a40ed3dSBarry Smith PetscFunctionBegin; 201597b48c8fSBarry Smith if (x && b) { 201697b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 201797b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 201897b48c8fSBarry Smith for (i=0; i<N; i++) { 201997b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2020447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 202197b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 202297b48c8fSBarry Smith } 202397b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 202497b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 202597b48c8fSBarry Smith } 202697b48c8fSBarry Smith 2027a9817697SBarry Smith if (a->keepnonzeropattern) { 2028f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2029e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2030580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 2031f1e2ffcdSBarry Smith } 2032f4df32b1SMatthew Knepley if (diag != 0.0) { 2033c7da8527SEric Chamberland for (i=0; i<N; i++) { 2034c7da8527SEric Chamberland d = rows[i]; 2035447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2036c7da8527SEric Chamberland if (a->diag[d] >= a->i[d+1]) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %D",d); 2037c7da8527SEric Chamberland } 2038f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2039447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2040f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 2041f1e2ffcdSBarry Smith } 2042f1e2ffcdSBarry Smith } 2043f1e2ffcdSBarry Smith } else { 2044f4df32b1SMatthew Knepley if (diag != 0.0) { 204517ab2063SBarry Smith for (i=0; i<N; i++) { 2046e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 20477ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2048447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2049447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2050447d62f5SStefano Zampini } else { 2051416022c9SBarry Smith a->ilen[rows[i]] = 1; 2052f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 2053bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2054447d62f5SStefano Zampini } 2055447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 2056f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 205717ab2063SBarry Smith } 205817ab2063SBarry Smith } 20593a40ed3dSBarry Smith } else { 206017ab2063SBarry Smith for (i=0; i<N; i++) { 2061e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2062416022c9SBarry Smith a->ilen[rows[i]] = 0; 206317ab2063SBarry Smith } 206417ab2063SBarry Smith } 2065e56f5c9eSBarry Smith A->nonzerostate++; 2066f1e2ffcdSBarry Smith } 2067e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2068e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 2069e2cf4d64SStefano Zampini #endif 20704099cc6bSBarry Smith ierr = 
(*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20713a40ed3dSBarry Smith PetscFunctionReturn(0); 207217ab2063SBarry Smith } 207317ab2063SBarry Smith 20746e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 20756e169961SBarry Smith { 20766e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 20776e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 20786e169961SBarry Smith PetscErrorCode ierr; 20792b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 20806e169961SBarry Smith const PetscScalar *xx; 20816e169961SBarry Smith PetscScalar *bb; 20826e169961SBarry Smith 20836e169961SBarry Smith PetscFunctionBegin; 20846e169961SBarry Smith if (x && b) { 20856e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 20866e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 20872b40b63fSBarry Smith vecs = PETSC_TRUE; 20886e169961SBarry Smith } 20891795a4d1SJed Brown ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr); 20906e169961SBarry Smith for (i=0; i<N; i++) { 20916e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2092580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 20932205254eSKarl Rupp 20946e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 20956e169961SBarry Smith } 20966e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 20976e169961SBarry Smith if (!zeroed[i]) { 20986e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 20994cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 21002b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 21016e169961SBarry Smith a->a[j] = 0.0; 21026e169961SBarry Smith } 21036e169961SBarry Smith } 21044cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 21056e169961SBarry Smith } 21066e169961SBarry Smith if (x && b) { 
21076e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 21086e169961SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 21096e169961SBarry Smith } 21106e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 21116e169961SBarry Smith if (diag != 0.0) { 21126e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 21131d5a398dSstefano_zampini if (missing) { 21141d5a398dSstefano_zampini for (i=0; i<N; i++) { 21154cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 21164cf107fdSStefano Zampini if (a->nonew && rows[i] >= d) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D (%D)",d,rows[i]); 21171d5a398dSstefano_zampini ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 21181d5a398dSstefano_zampini } 21191d5a398dSstefano_zampini } else { 21206e169961SBarry Smith for (i=0; i<N; i++) { 21216e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 21226e169961SBarry Smith } 21236e169961SBarry Smith } 21241d5a398dSstefano_zampini } 2125e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2126e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 2127e2cf4d64SStefano Zampini #endif 21284099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 21296e169961SBarry Smith PetscFunctionReturn(0); 21306e169961SBarry Smith } 21316e169961SBarry Smith 2132a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 213317ab2063SBarry Smith { 2134416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 213597f1f81fSBarry Smith PetscInt *itmp; 213617ab2063SBarry Smith 21373a40ed3dSBarry Smith PetscFunctionBegin; 2138e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 213917ab2063SBarry Smith 
2140416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 2141bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 214217ab2063SBarry Smith if (idx) { 2143bfeeae90SHong Zhang itmp = a->j + a->i[row]; 214426fbe8dcSKarl Rupp if (*nz) *idx = itmp; 214517ab2063SBarry Smith else *idx = 0; 214617ab2063SBarry Smith } 21473a40ed3dSBarry Smith PetscFunctionReturn(0); 214817ab2063SBarry Smith } 214917ab2063SBarry Smith 2150bfeeae90SHong Zhang /* remove this function? */ 2151a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 215217ab2063SBarry Smith { 21533a40ed3dSBarry Smith PetscFunctionBegin; 21543a40ed3dSBarry Smith PetscFunctionReturn(0); 215517ab2063SBarry Smith } 215617ab2063SBarry Smith 2157dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 215817ab2063SBarry Smith { 2159416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 216054f21887SBarry Smith MatScalar *v = a->a; 216136db0b34SBarry Smith PetscReal sum = 0.0; 21626849ba73SBarry Smith PetscErrorCode ierr; 216397f1f81fSBarry Smith PetscInt i,j; 216417ab2063SBarry Smith 21653a40ed3dSBarry Smith PetscFunctionBegin; 216617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2167570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2168570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 2169570b7f6dSBarry Smith *nrm = BLASnrm2_(&nz,v,&one); 2170570b7f6dSBarry Smith #else 2171416022c9SBarry Smith for (i=0; i<a->nz; i++) { 217236db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 217317ab2063SBarry Smith } 21748f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2175570b7f6dSBarry Smith #endif 217651f70360SJed Brown ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 21773a40ed3dSBarry Smith } else if (type == NORM_1) { 217836db0b34SBarry Smith PetscReal *tmp; 217997f1f81fSBarry Smith PetscInt *jj = a->j; 21801795a4d1SJed Brown ierr = PetscCalloc1(A->cmap->n+1,&tmp);CHKERRQ(ierr); 2181064f8208SBarry Smith *nrm = 
0.0; 2182416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2183bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 218417ab2063SBarry Smith } 2185d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2186064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 218717ab2063SBarry Smith } 2188606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 218951f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 21903a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2191064f8208SBarry Smith *nrm = 0.0; 2192d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 2193bfeeae90SHong Zhang v = a->a + a->i[j]; 219417ab2063SBarry Smith sum = 0.0; 2195416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 2196cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 219717ab2063SBarry Smith } 2198064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 219917ab2063SBarry Smith } 220051f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 2201f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 22023a40ed3dSBarry Smith PetscFunctionReturn(0); 220317ab2063SBarry Smith } 220417ab2063SBarry Smith 22054e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? 
*/ 22064e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 22074e938277SHong Zhang { 22084e938277SHong Zhang PetscErrorCode ierr; 22094e938277SHong Zhang PetscInt i,j,anzj; 22104e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 22114e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 22124e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 22134e938277SHong Zhang 22144e938277SHong Zhang PetscFunctionBegin; 22154e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 2216854ce69bSBarry Smith ierr = PetscCalloc1(an+1,&ati);CHKERRQ(ierr); 2217785e854fSJed Brown ierr = PetscMalloc1(ai[am],&atj);CHKERRQ(ierr); 2218785e854fSJed Brown ierr = PetscMalloc1(an,&atfill);CHKERRQ(ierr); 22194e938277SHong Zhang 22204e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 22214e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 222226fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 22234e938277SHong Zhang /* Form ati for csr format of A^T. */ 222426fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 22254e938277SHong Zhang 22264e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 2227580bdb30SBarry Smith ierr = PetscArraycpy(atfill,ati,an);CHKERRQ(ierr); 22284e938277SHong Zhang 22294e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 22304e938277SHong Zhang for (i=0;i<am;i++) { 22314e938277SHong Zhang anzj = ai[i+1] - ai[i]; 22324e938277SHong Zhang for (j=0;j<anzj;j++) { 22334e938277SHong Zhang atj[atfill[*aj]] = i; 22344e938277SHong Zhang atfill[*aj++] += 1; 22354e938277SHong Zhang } 22364e938277SHong Zhang } 22374e938277SHong Zhang 22384e938277SHong Zhang /* Clean up temporary space and complete requests. 
*/ 22394e938277SHong Zhang ierr = PetscFree(atfill);CHKERRQ(ierr); 2240ce94432eSBarry Smith ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B);CHKERRQ(ierr); 224133d57670SJed Brown ierr = MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs));CHKERRQ(ierr); 2242b5bb3eecSMark Adams ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2243a2f3521dSMark F. Adams 22444e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 22454e938277SHong Zhang b->free_a = PETSC_FALSE; 22464e938277SHong Zhang b->free_ij = PETSC_TRUE; 22474e938277SHong Zhang b->nonew = 0; 22484e938277SHong Zhang PetscFunctionReturn(0); 22494e938277SHong Zhang } 22504e938277SHong Zhang 22517087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2252cd0d46ebSvictorle { 22533d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 225454f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 225554f21887SBarry Smith MatScalar *va,*vb; 22566849ba73SBarry Smith PetscErrorCode ierr; 225797f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2258cd0d46ebSvictorle 2259cd0d46ebSvictorle PetscFunctionBegin; 2260cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 2261cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 22625485867bSBarry Smith if (ma!=nb || na!=mb) { 22635485867bSBarry Smith *f = PETSC_FALSE; 22645485867bSBarry Smith PetscFunctionReturn(0); 22655485867bSBarry Smith } 2266cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2267cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 2268cd0d46ebSvictorle va = aij->a; vb = bij->a; 2269785e854fSJed Brown ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2270785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 2271cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2272cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2273cd0d46ebSvictorle 2274cd0d46ebSvictorle *f = PETSC_TRUE; 2275cd0d46ebSvictorle for (i=0; 
i<ma; i++) { 2276cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 227797f1f81fSBarry Smith PetscInt idc,idr; 22785485867bSBarry Smith PetscScalar vc,vr; 2279cd0d46ebSvictorle /* column/row index/value */ 22805485867bSBarry Smith idc = adx[aptr[i]]; 22815485867bSBarry Smith idr = bdx[bptr[idc]]; 22825485867bSBarry Smith vc = va[aptr[i]]; 22835485867bSBarry Smith vr = vb[bptr[idc]]; 22845485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 22855485867bSBarry Smith *f = PETSC_FALSE; 22865485867bSBarry Smith goto done; 2287cd0d46ebSvictorle } else { 22885485867bSBarry Smith aptr[i]++; 22895485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2290cd0d46ebSvictorle } 2291cd0d46ebSvictorle } 2292cd0d46ebSvictorle } 2293cd0d46ebSvictorle done: 2294cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 22953aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 2296cd0d46ebSvictorle PetscFunctionReturn(0); 2297cd0d46ebSvictorle } 2298cd0d46ebSvictorle 22997087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 23001cbb95d3SBarry Smith { 23013d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 230254f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 230354f21887SBarry Smith MatScalar *va,*vb; 23041cbb95d3SBarry Smith PetscErrorCode ierr; 23051cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 23061cbb95d3SBarry Smith 23071cbb95d3SBarry Smith PetscFunctionBegin; 23081cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 23091cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 23101cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 23111cbb95d3SBarry Smith *f = PETSC_FALSE; 23121cbb95d3SBarry Smith PetscFunctionReturn(0); 23131cbb95d3SBarry Smith } 23141cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 23151cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 23161cbb95d3SBarry Smith va = aij->a; vb = bij->a; 2317785e854fSJed Brown ierr = 
/*
   MatIsSymmetric_SeqAIJ - sets *f by asking MatIsTranspose_SeqAIJ() whether A is its own
   transpose within tolerance tol.
*/
PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   MatIsHermitian_SeqAIJ - sets *f by asking MatIsHermitianTranspose_SeqAIJ() whether A is its
   own conjugate transpose within tolerance tol.
*/
PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

23611cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 23621cbb95d3SBarry Smith PetscFunctionReturn(0); 23631cbb95d3SBarry Smith } 23641cbb95d3SBarry Smith 2365dfbe8321SBarry Smith /* MatDiagonalScale_SeqAIJ - scales the stored values of A in place: row i is multiplied by ll[i] when ll is non-NULL, and every entry in column j by rr[j] when rr is non-NULL. Raises PETSC_ERR_ARG_SIZ when a vector's local size does not match the matrix. The cached diagonal is invalidated afterwards. */ PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 236617ab2063SBarry Smith { 2367416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2368fff8e43fSBarry Smith const PetscScalar *l,*r; 2369fff8e43fSBarry Smith PetscScalar x; 237054f21887SBarry Smith MatScalar *v; 2371dfbe8321SBarry Smith PetscErrorCode ierr; 2372fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2373fff8e43fSBarry Smith const PetscInt *jj; 237417ab2063SBarry Smith 23753a40ed3dSBarry Smith PetscFunctionBegin; 237617ab2063SBarry Smith if (ll) { 23773ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 23783ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2379e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2380e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 2381fff8e43fSBarry Smith ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 2382416022c9SBarry Smith v = a->a; 238317ab2063SBarry Smith for (i=0; i<m; i++) { 238417ab2063SBarry Smith x = l[i]; 2385416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 23862205254eSKarl Rupp /* v advances sequentially through the value array, so the next M entries are exactly row i */ for (j=0; j<M; j++) (*v++) *= x; 238717ab2063SBarry Smith } 2388fff8e43fSBarry Smith ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 2389efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 239017ab2063SBarry Smith } 239117ab2063SBarry Smith if (rr) { 2392e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2393e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 2394fff8e43fSBarry Smith ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 2395416022c9SBarry Smith v = a->a; jj = a->j; 23962205254eSKarl Rupp for (i=0; i<nz; i++)
(*v++) *= r[*jj++]; 2397fff8e43fSBarry Smith ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 2398efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 239917ab2063SBarry Smith } 2400acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 2401e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2402e2cf4d64SStefano Zampini if (A->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) A->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 2403e2cf4d64SStefano Zampini #endif 24043a40ed3dSBarry Smith PetscFunctionReturn(0); 240517ab2063SBarry Smith } 240617ab2063SBarry Smith 24077dae84e0SHong Zhang /* MatCreateSubMatrix_SeqAIJ - builds in *B the submatrix of A formed by the rows listed in isrow and the columns listed in iscol. With scall == MAT_REUSE_MATRIX the existing *B is refilled and must have matching sizes (and, on the general path, matching row lengths); otherwise a new matrix of A's type is created and preallocated. csize is not referenced in this routine. Two paths: a fast one when iscol is a stride IS with step 1, and a general one that maps old column to new column + 1 through smap. */ PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 240817ab2063SBarry Smith { 2409db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 24106849ba73SBarry Smith PetscErrorCode ierr; 2411d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 241297f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 24135d0c19d7SBarry Smith const PetscInt *irow,*icol; 24145d0c19d7SBarry Smith PetscInt nrows,ncols; 241597f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 241654f21887SBarry Smith MatScalar *a_new,*mat_a; 2417416022c9SBarry Smith Mat C; 2418cdc6f3adSToby Isaac PetscBool stride; 241917ab2063SBarry Smith 24203a40ed3dSBarry Smith PetscFunctionBegin; 242199141d43SSatish Balay 242217ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2423b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2424b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 242517ab2063SBarry Smith 2426251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2427ff718158SBarry Smith if (stride) { 2428ff718158SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 2429ff718158SBarry Smith } else {
2430ff718158SBarry Smith first = 0; 2431ff718158SBarry Smith step = 0; 2432ff718158SBarry Smith } 2433fee21e36SBarry Smith if (stride && step == 1) { 243402834360SBarry Smith /* special case: iscol is a stride-1 range, so the selected columns are contiguous */ 2435dcca6d9dSJed Brown ierr = PetscMalloc2(nrows,&lens,nrows,&starts);CHKERRQ(ierr); 243602834360SBarry Smith /* loop over new rows determining lens and starting points */ 243702834360SBarry Smith for (i=0; i<nrows; i++) { 2438bfeeae90SHong Zhang kstart = ai[irow[i]]; 2439a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2440a91a9bebSLisandro Dalcin starts[i] = kstart; 244102834360SBarry Smith for (k=kstart; k<kend; k++) { 2442bfeeae90SHong Zhang if (aj[k] >= first) { 244302834360SBarry Smith starts[i] = k; 244402834360SBarry Smith break; 244502834360SBarry Smith } 244602834360SBarry Smith } 2447a2744918SBarry Smith sum = 0; 244802834360SBarry Smith while (k < kend) { 2449bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2450a2744918SBarry Smith sum++; 245102834360SBarry Smith } 2452a2744918SBarry Smith lens[i] = sum; 245302834360SBarry Smith } 245402834360SBarry Smith /* create submatrix */ 2455cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 245697f1f81fSBarry Smith PetscInt n_cols,n_rows; 245708480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2458e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2459d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 246008480c60SBarry Smith C = *B; 24613a40ed3dSBarry Smith } else { 24623bef6203SJed Brown PetscInt rbs,cbs; 2463ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2464f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 24653bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 24663bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 24673bef6203SJed Brown ierr
= MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 24687adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2469ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 247008480c60SBarry Smith } 2471db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2472db02288aSLois Curfman McInnes 247302834360SBarry Smith /* loop over rows inserting into submatrix */ 2474db02288aSLois Curfman McInnes a_new = c->a; 2475db02288aSLois Curfman McInnes j_new = c->j; 2476db02288aSLois Curfman McInnes i_new = c->i; 2477bfeeae90SHong Zhang 247802834360SBarry Smith for (i=0; i<nrows; i++) { 2479a2744918SBarry Smith ii = starts[i]; 2480a2744918SBarry Smith lensi = lens[i]; 2481a2744918SBarry Smith for (k=0; k<lensi; k++) { 2482a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 248302834360SBarry Smith } 2484580bdb30SBarry Smith ierr = PetscArraycpy(a_new,a->a + starts[i],lensi);CHKERRQ(ierr); 2485a2744918SBarry Smith a_new += lensi; 2486a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2487a2744918SBarry Smith c->ilen[i] = lensi; 248802834360SBarry Smith } 24890e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 24903a40ed3dSBarry Smith } else { 249102834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 24921795a4d1SJed Brown ierr = PetscCalloc1(oldcols,&smap);CHKERRQ(ierr); 2493854ce69bSBarry Smith ierr = PetscMalloc1(1+nrows,&lens);CHKERRQ(ierr); 24944dcab191SBarry Smith for (i=0; i<ncols; i++) { 24954dcab191SBarry Smith #if defined(PETSC_USE_DEBUG) 24964dcab191SBarry Smith if (icol[i] >= oldcols) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D >= A->cmap->n %D",i,icol[i],oldcols); 24974dcab191SBarry Smith #endif 24984dcab191SBarry Smith /* smap holds new index + 1 so that the calloc'ed 0 can mean "column not selected" */ smap[icol[i]] = i+1; 24994dcab191SBarry Smith } 25004dcab191SBarry Smith 250102834360SBarry Smith /* determine lens of each row */ 250202834360SBarry Smith for (i=0; i<nrows; i++) { 2503bfeeae90SHong Zhang
kstart = ai[irow[i]]; 250402834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 250502834360SBarry Smith lens[i] = 0; 250602834360SBarry Smith for (k=kstart; k<kend; k++) { 2507bfeeae90SHong Zhang if (smap[aj[k]]) { 250802834360SBarry Smith lens[i]++; 250902834360SBarry Smith } 251002834360SBarry Smith } 251102834360SBarry Smith } 251217ab2063SBarry Smith /* Create and fill new matrix */ 2513a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2514ace3abfcSBarry Smith PetscBool equal; 25150f5bd95cSBarry Smith 251699141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2517e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2518580bdb30SBarry Smith ierr = PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal);CHKERRQ(ierr); 2519f23aa3ddSBarry Smith if (!equal) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 2520580bdb30SBarry Smith ierr = PetscArrayzero(c->ilen,(*B)->rmap->n);CHKERRQ(ierr); 252108480c60SBarry Smith C = *B; 25223a40ed3dSBarry Smith } else { 25233bef6203SJed Brown PetscInt rbs,cbs; 2524ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2525f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 25263bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 25273bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 25283bef6203SJed Brown ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 25297adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2530ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 253108480c60SBarry Smith } 253299141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 253317ab2063SBarry Smith for (i=0; i<nrows; i++) { 253499141d43SSatish Balay row = irow[i]; 2535bfeeae90SHong Zhang kstart = ai[row]; 253699141d43SSatish Balay kend =
kstart + a->ilen[row]; 2537bfeeae90SHong Zhang mat_i = c->i[i]; 253899141d43SSatish Balay mat_j = c->j + mat_i; 253999141d43SSatish Balay mat_a = c->a + mat_i; 254099141d43SSatish Balay mat_ilen = c->ilen + i; 254117ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2542bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2543ed480e8bSBarry Smith *mat_j++ = tcol - 1; 254499141d43SSatish Balay *mat_a++ = a->a[k]; 254599141d43SSatish Balay (*mat_ilen)++; 254699141d43SSatish Balay 254717ab2063SBarry Smith } 254817ab2063SBarry Smith } 254917ab2063SBarry Smith } 255002834360SBarry Smith /* Free work space */ 255102834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2552606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2553606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 2554cdc6f3adSToby Isaac /* sort */ 2555cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2556cdc6f3adSToby Isaac PetscInt ilen; 2557cdc6f3adSToby Isaac 2558cdc6f3adSToby Isaac mat_i = c->i[i]; 2559cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2560cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2561cdc6f3adSToby Isaac ilen = c->ilen[i]; 2562390e1bf2SBarry Smith ierr = PetscSortIntWithScalarArray(ilen,mat_j,mat_a);CHKERRQ(ierr); 2563cdc6f3adSToby Isaac } 256402834360SBarry Smith } 25656d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 25666d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 256717ab2063SBarry Smith 256817ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2569416022c9SBarry Smith *B = C; 25703a40ed3dSBarry Smith PetscFunctionReturn(0); 257117ab2063SBarry Smith } 257217ab2063SBarry Smith 2573fc08c53fSHong Zhang /* MatGetMultiProcBlock_SeqAIJ - for MAT_INITIAL_MATRIX creates a MATSEQAIJ matrix on subComm with the same sizes as mat and duplicates mat (values included) into it; for any other scall copies mat into the existing *subMat with SAME_NONZERO_PATTERN. */ PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 257482d44351SHong Zhang { 257582d44351SHong Zhang PetscErrorCode ierr; 257682d44351SHong Zhang Mat B; 257782d44351SHong Zhang 257882d44351SHong Zhang PetscFunctionBegin; 2579c2d650bdSHong
Zhang if (scall == MAT_INITIAL_MATRIX) { 258082d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 258182d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 258233d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,mat,mat);CHKERRQ(ierr); 258382d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 258482d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 258582d44351SHong Zhang *subMat = B; 2586c2d650bdSHong Zhang } else { 2587c2d650bdSHong Zhang ierr = MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2588c2d650bdSHong Zhang } 258982d44351SHong Zhang PetscFunctionReturn(0); 259082d44351SHong Zhang } 259182d44351SHong Zhang 25929a625307SHong Zhang /* MatILUFactor_SeqAIJ - in-place ILU factorization of inA; only info->levels == 0 is accepted (PETSC_ERR_SUP otherwise). Takes a reference on row and col and stores them in the matrix together with the inverse of col, allocates solve_work if it is not already present, marks the diagonal, and then runs the in-place numeric factorization, using the permutation-free kernel when both orderings are identities. */ PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2593a871dcd8SBarry Smith { 259463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2595dfbe8321SBarry Smith PetscErrorCode ierr; 259663b91edcSBarry Smith Mat outA; 2597ace3abfcSBarry Smith PetscBool row_identity,col_identity; 259863b91edcSBarry Smith 25993a40ed3dSBarry Smith PetscFunctionBegin; 2600e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 26011df811f5SHong Zhang 2602b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2603b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2604a871dcd8SBarry Smith 260563b91edcSBarry Smith outA = inA; 2606d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2607f6224b95SHong Zhang ierr = PetscFree(inA->solvertype);CHKERRQ(ierr); 2608f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr); 26092205254eSKarl Rupp 2610c38d4ed2SBarry Smith /* reference the new IS before destroying the old one, so passing a->row back in is safe */ ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 26116bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 26122205254eSKarl Rupp
2613c3122656SLisandro Dalcin a->row = row; 26142205254eSKarl Rupp 2615c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 26166bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 26172205254eSKarl Rupp 2618c3122656SLisandro Dalcin a->col = col; 261963b91edcSBarry Smith 262036db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26216bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 26224c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 26233bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr); 2624f0ec6fceSSatish Balay 262594a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2626854ce69bSBarry Smith ierr = PetscMalloc1(inA->rmap->n+1,&a->solve_work);CHKERRQ(ierr); 26273bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 262894a9d846SBarry Smith } 262963b91edcSBarry Smith 2630f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2631137fb511SHong Zhang if (row_identity && col_identity) { 2632ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2633137fb511SHong Zhang } else { 2634719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2635137fb511SHong Zhang } 26363a40ed3dSBarry Smith PetscFunctionReturn(0); 2637a871dcd8SBarry Smith } 2638a871dcd8SBarry Smith 2639f4df32b1SMatthew Knepley /* MatScale_SeqAIJ - multiplies all a->nz stored values of inA by alpha with a single BLAS scal call, logs the flops and invalidates the cached diagonal. */ PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2640f0b747eeSBarry Smith { 2641f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2642f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2643efee365bSSatish Balay PetscErrorCode ierr; 2644c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 26453a40ed3dSBarry Smith 26463a40ed3dSBarry Smith PetscFunctionBegin; 2647c5df96a5SBarry Smith
ierr = PetscBLASIntCast(a->nz,&bnz);CHKERRQ(ierr); 26488b83055fSJed Brown PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&oalpha,a->a,&one)); 2649efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 2650acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(inA);CHKERRQ(ierr); 2651e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2652e2cf4d64SStefano Zampini if (inA->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) inA->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 2653e2cf4d64SStefano Zampini #endif 26543a40ed3dSBarry Smith PetscFunctionReturn(0); 2655f0b747eeSBarry Smith } 2656f0b747eeSBarry Smith 2657f68bb481SHong Zhang /* MatDestroySubMatrix_Private - frees the buffers and index maps held by a Mat_SubSppt and finally the struct itself. The send/receive buffers in the first branch are released only when submatj->id is 0; the row/column maps are freed for every id (as tables or plain arrays depending on PETSC_USE_CTABLE). */ PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 265816b64355SHong Zhang { 265916b64355SHong Zhang PetscErrorCode ierr; 266016b64355SHong Zhang PetscInt i; 266116b64355SHong Zhang 266216b64355SHong Zhang PetscFunctionBegin; 266316b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 266416b64355SHong Zhang ierr = PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr);CHKERRQ(ierr); 266516b64355SHong Zhang 266616b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 266716b64355SHong Zhang ierr = PetscFree(submatj->sbuf2[i]);CHKERRQ(ierr); 266816b64355SHong Zhang } 266916b64355SHong Zhang ierr = PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1);CHKERRQ(ierr); 267016b64355SHong Zhang 267116b64355SHong Zhang if (submatj->rbuf1) { 267216b64355SHong Zhang ierr = PetscFree(submatj->rbuf1[0]);CHKERRQ(ierr); 267316b64355SHong Zhang ierr = PetscFree(submatj->rbuf1);CHKERRQ(ierr); 267416b64355SHong Zhang } 267516b64355SHong Zhang 267616b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 267716b64355SHong Zhang ierr = PetscFree(submatj->rbuf3[i]);CHKERRQ(ierr); 267816b64355SHong Zhang } 267916b64355SHong Zhang ierr = PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3);CHKERRQ(ierr); 268016b64355SHong Zhang ierr =
PetscFree(submatj->pa);CHKERRQ(ierr); 268116b64355SHong Zhang } 268216b64355SHong Zhang 268316b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 268416b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->rmap);CHKERRQ(ierr); 268516b64355SHong Zhang if (submatj->cmap_loc) {ierr = PetscFree(submatj->cmap_loc);CHKERRQ(ierr);} 268616b64355SHong Zhang ierr = PetscFree(submatj->rmap_loc);CHKERRQ(ierr); 268716b64355SHong Zhang #else 268816b64355SHong Zhang ierr = PetscFree(submatj->rmap);CHKERRQ(ierr); 268916b64355SHong Zhang #endif 269016b64355SHong Zhang 269116b64355SHong Zhang if (!submatj->allcolumns) { 269216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 269316b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->cmap);CHKERRQ(ierr); 269416b64355SHong Zhang #else 269516b64355SHong Zhang ierr = PetscFree(submatj->cmap);CHKERRQ(ierr); 269616b64355SHong Zhang #endif 269716b64355SHong Zhang } 269816b64355SHong Zhang ierr = PetscFree(submatj->row2proc);CHKERRQ(ierr); 269916b64355SHong Zhang 270016b64355SHong Zhang ierr = PetscFree(submatj);CHKERRQ(ierr); 270116b64355SHong Zhang PetscFunctionReturn(0); 270216b64355SHong Zhang } 270316b64355SHong Zhang 27040fb991dcSHong Zhang /* MatDestroySubMatrix_SeqAIJ - runs the destroy callback saved in c->submatis1 on C, then frees the Mat_SubSppt data with MatDestroySubMatrix_Private. */ PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 270516b64355SHong Zhang { 270616b64355SHong Zhang PetscErrorCode ierr; 270716b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 27085c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 270916b64355SHong Zhang 271016b64355SHong Zhang PetscFunctionBegin; 271134136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2712f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 271316b64355SHong Zhang PetscFunctionReturn(0); 271416b64355SHong Zhang } 271516b64355SHong Zhang 27162d033e1fSHong Zhang /* MatDestroySubMatrices_SeqAIJ - destroys the n matrices in *mat and frees the array itself. A matrix carrying submatis1 data has its reference count decremented and, once that reaches zero, is torn down by hand (destroy callback, Mat_SubSppt data, layouts, header); any other matrix goes through MatDestroy(). */ PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 27172d033e1fSHong Zhang { 27182d033e1fSHong Zhang PetscErrorCode ierr; 27192d033e1fSHong Zhang PetscInt i; 27200fb991dcSHong Zhang
Mat C; 27210fb991dcSHong Zhang Mat_SeqAIJ *c; 27220fb991dcSHong Zhang Mat_SubSppt *submatj; 27232d033e1fSHong Zhang 27242d033e1fSHong Zhang PetscFunctionBegin; 27252d033e1fSHong Zhang for (i=0; i<n; i++) { 27260fb991dcSHong Zhang C = (*mat)[i]; 27270fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 27280fb991dcSHong Zhang submatj = c->submatis1; 27292d033e1fSHong Zhang if (submatj) { 2730682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 273134136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2732f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 273334136279SStefano Zampini ierr = PetscFree(C->defaultvectype);CHKERRQ(ierr); 27342d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->rmap);CHKERRQ(ierr); 27352d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->cmap);CHKERRQ(ierr); 27362d033e1fSHong Zhang ierr = PetscHeaderDestroy(&C);CHKERRQ(ierr); 2737682e4c99SStefano Zampini } 27382d033e1fSHong Zhang } else { 27392d033e1fSHong Zhang ierr = MatDestroy(&C);CHKERRQ(ierr); 27402d033e1fSHong Zhang } 27412d033e1fSHong Zhang } 274286e85357SHong Zhang 274363a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 274463a75b2aSHong Zhang ierr = MatDestroySubMatrices_Dummy(n,mat);CHKERRQ(ierr); 274563a75b2aSHong Zhang 27462d033e1fSHong Zhang ierr = PetscFree(*mat);CHKERRQ(ierr); 27472d033e1fSHong Zhang PetscFunctionReturn(0); 27482d033e1fSHong Zhang } 27492d033e1fSHong Zhang 27507dae84e0SHong Zhang /* MatCreateSubMatrices_SeqAIJ - extracts n submatrices of A, one per (irow[i],icol[i]) pair, by calling MatCreateSubMatrix_SeqAIJ for each. For MAT_INITIAL_MATRIX the output array *B is allocated here with n+1 zeroed slots; for any other scall *B must already exist. */ PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2751cddf8d76SBarry Smith { 2752dfbe8321SBarry Smith PetscErrorCode ierr; 275397f1f81fSBarry Smith PetscInt i; 2754cddf8d76SBarry Smith 27553a40ed3dSBarry Smith PetscFunctionBegin; 2756cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2757df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2758cddf8d76SBarry Smith } 2759cddf8d76SBarry Smith 2760cddf8d76SBarry Smith for (i=0; i<n; i++) {
27617dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2762cddf8d76SBarry Smith } 27633a40ed3dSBarry Smith PetscFunctionReturn(0); 2764cddf8d76SBarry Smith } 2765cddf8d76SBarry Smith 276697f1f81fSBarry Smith /* MatIncreaseOverlap_SeqAIJ - grows each of the is_max index sets in is[] by ov levels of overlap: at every level the column indices stored in the rows added so far are appended, with a bit table of size m suppressing duplicates. Each is[i] is destroyed and replaced by a newly created IS. A negative ov raises PETSC_ERR_ARG_OUTOFRANGE. NOTE(review): column indices are used both as bit-table positions and as row numbers, which presumably assumes a square matrix - confirm. */ PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 27674dcbc457SBarry Smith { 2768e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 27696849ba73SBarry Smith PetscErrorCode ierr; 27705d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 27715d0c19d7SBarry Smith const PetscInt *idx; 277297f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2773f1af5d2fSBarry Smith PetscBT table; 2774bbd702dbSSatish Balay 27753a40ed3dSBarry Smith PetscFunctionBegin; 2776d0f46423SBarry Smith m = A->rmap->n; 2777e4d965acSSatish Balay ai = a->i; 2778bfeeae90SHong Zhang aj = a->j; 27798a047759SSatish Balay 2780e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 278106763907SSatish Balay 2782854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&nidx);CHKERRQ(ierr); 278353b8de81SBarry Smith ierr = PetscBTCreate(m,&table);CHKERRQ(ierr); 278406763907SSatish Balay 2785e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2786b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2787e4d965acSSatish Balay isz = 0; 27886831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2789e4d965acSSatish Balay 2790e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 27914dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2792b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2793e4d965acSSatish Balay 2794dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays.
I.e., mark table[row], enter row into new index */ 2795e4d965acSSatish Balay for (j=0; j<n; ++j) { 27962205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 27974dcbc457SBarry Smith } 279806763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 27996bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2800e4d965acSSatish Balay 280104a348a9SBarry Smith k = 0; 280204a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 280304a348a9SBarry Smith n = isz; 280406763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2805e4d965acSSatish Balay row = nidx[k]; 2806e4d965acSSatish Balay start = ai[row]; 2807e4d965acSSatish Balay end = ai[row+1]; 280804a348a9SBarry Smith for (l = start; l<end; l++) { 2809efb16452SHong Zhang val = aj[l]; 28102205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2811e4d965acSSatish Balay } 2812e4d965acSSatish Balay } 2813e4d965acSSatish Balay } 281470b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2815e4d965acSSatish Balay } 281694bacf5dSBarry Smith ierr = PetscBTDestroy(&table);CHKERRQ(ierr); 2817606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 28183a40ed3dSBarry Smith PetscFunctionReturn(0); 28194dcbc457SBarry Smith } 282017ab2063SBarry Smith 28210513a670SBarry Smith /* -------------------------------------------------------------- */ 2822dfbe8321SBarry Smith /* MatPermute_SeqAIJ - creates *B as A with its rows and columns renumbered: the inverses of rowp and colp are formed, and old row i is inserted as row row[i] with each old column j mapped to col[j], where row/col are the indices of those inverse permutations. *B has A's type and sizes and is assembled before returning. */ PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 28230513a670SBarry Smith { 28240513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28256849ba73SBarry Smith PetscErrorCode ierr; 28263b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 28275d0c19d7SBarry Smith const PetscInt *row,*col; 28285d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 282956cd22aeSBarry Smith IS icolp,irowp; 28300298fd71SBarry Smith PetscInt *cwork = NULL; 28310298fd71SBarry Smith PetscScalar *vwork
= NULL; 28320513a670SBarry Smith 28333a40ed3dSBarry Smith PetscFunctionBegin; 28344c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 283556cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 28364c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 283756cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 28380513a670SBarry Smith 28390513a670SBarry Smith /* determine lengths of permuted rows */ 2840854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&lens);CHKERRQ(ierr); 28412205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 2842ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 2843f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 284433d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 28457adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2846ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2847606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 28480513a670SBarry Smith 2849785e854fSJed Brown ierr = PetscMalloc1(n,&cnew);CHKERRQ(ierr); 28500513a670SBarry Smith for (i=0; i<m; i++) { 285132ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28522205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 2853cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 285432ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28550513a670SBarry Smith } 2856606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 28572205254eSKarl Rupp 28583c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28592205254eSKarl Rupp 28600513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28610513a670SBarry Smith ierr =
MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 286256cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 286356cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 28646bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 28656bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 28663a40ed3dSBarry Smith PetscFunctionReturn(0); 28670513a670SBarry Smith } 28680513a670SBarry Smith 2869dfbe8321SBarry Smith /* MatCopy_SeqAIJ - copies A into B. When str is SAME_NONZERO_PATTERN and both matrices share the same copy implementation, only the value array is copied (after checking that the nonzero counts agree, else PETSC_ERR_ARG_INCOMP) and B's object state is increased; otherwise falls back to MatCopy_Basic. */ PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2870cb5b572fSBarry Smith { 2871dfbe8321SBarry Smith PetscErrorCode ierr; 2872cb5b572fSBarry Smith 2873cb5b572fSBarry Smith PetscFunctionBegin; 287433f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 287533f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2876be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2877be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2878be6bf707SBarry Smith 2879700c5bfcSBarry Smith if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 2880580bdb30SBarry Smith ierr = PetscArraycpy(b->a,a->a,a->i[A->rmap->n]);CHKERRQ(ierr); 2881cdc753b6SBarry Smith ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr); 2882cb5b572fSBarry Smith } else { 2883cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2884cb5b572fSBarry Smith } 2885cb5b572fSBarry Smith PetscFunctionReturn(0); 2886cb5b572fSBarry Smith } 2887cb5b572fSBarry Smith 28884994cf47SJed Brown /* MatSetUp_SeqAIJ - sets up A by calling MatSeqAIJSetPreallocation_SeqAIJ with PETSC_DEFAULT nonzeros per row and no per-row array. */ PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2889273d9f13SBarry Smith { 2890dfbe8321SBarry Smith PetscErrorCode ierr; 2891273d9f13SBarry Smith 2892273d9f13SBarry Smith PetscFunctionBegin; 2893ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2894273d9f13SBarry Smith PetscFunctionReturn(0); 2895273d9f13SBarry Smith } 2896273d9f13SBarry Smith
28978c778c55SBarry Smith /* MatSeqAIJGetArray_SeqAIJ - stores in *array a pointer to the matrix's own value array (no copy is made). */ PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 28986c0721eeSBarry Smith { 28996c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29006e111a19SKarl Rupp 29016c0721eeSBarry Smith PetscFunctionBegin; 29026c0721eeSBarry Smith *array = a->a; 29036c0721eeSBarry Smith PetscFunctionReturn(0); 29046c0721eeSBarry Smith } 29056c0721eeSBarry Smith 29068c778c55SBarry Smith /* MatSeqAIJRestoreArray_SeqAIJ - counterpart of MatSeqAIJGetArray_SeqAIJ; does nothing in this implementation. */ PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 29076c0721eeSBarry Smith { 29086c0721eeSBarry Smith PetscFunctionBegin; 29096c0721eeSBarry Smith PetscFunctionReturn(0); 29106c0721eeSBarry Smith } 2911273d9f13SBarry Smith 29128229c054SShri Abhyankar /* 29138229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29148229c054SShri Abhyankar have different nonzero structure. 29158229c054SShri Abhyankar */ 2916b264fe52SHong Zhang /* For each of the m rows, nnz[i] receives the number of distinct column indices found in row i of X (xi/xj) or row i of Y (yi/yj), counted with a two-cursor merge. NOTE(review): the merge presumably requires column indices sorted within each row - confirm. */ PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 2917ec7775f6SShri Abhyankar { 2918b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 2919ec7775f6SShri Abhyankar 2920ec7775f6SShri Abhyankar PetscFunctionBegin; 2921ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2922ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 2923b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 2924b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 2925b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 29268af7cee1SJed Brown nnz[i] = 0; 29278af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 2928b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2929b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 29308af7cee1SJed Brown nnz[i]++; 29318af7cee1SJed Brown } 29328af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2933ec7775f6SShri Abhyankar } 2934ec7775f6SShri Abhyankar PetscFunctionReturn(0);
2935ec7775f6SShri Abhyankar } 2936ec7775f6SShri Abhyankar 2937b264fe52SHong Zhang /* MatAXPYGetPreallocation_SeqAIJ - SeqAIJ wrapper: passes Y's global row count and the i/j arrays of X and Y to MatAXPYGetPreallocation_SeqX_private, which fills nnz. */ PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 2938b264fe52SHong Zhang { 2939b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2940b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2941b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2942b264fe52SHong Zhang PetscErrorCode ierr; 2943b264fe52SHong Zhang 2944b264fe52SHong Zhang PetscFunctionBegin; 2945b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 2946b264fe52SHong Zhang ierr = MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr); 2947b264fe52SHong Zhang PetscFunctionReturn(0); 2948b264fe52SHong Zhang } 2949b264fe52SHong Zhang 2950f4df32b1SMatthew Knepley /* MatAXPY_SeqAIJ - computes Y = Y + a*X. SAME_NONZERO_PATTERN uses one BLAS axpy over the two value arrays and invalidates Y's cached diagonal; SUBSET_NONZERO_PATTERN defers to MatAXPY_Basic; any other str builds a new matrix B preallocated for the merged pattern, fills it with MatAXPY_BasicWithPreallocation and swaps it into Y with MatHeaderReplace. */ PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2951ac90fabeSBarry Smith { 2952dfbe8321SBarry Smith PetscErrorCode ierr; 2953ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 2954c5df96a5SBarry Smith PetscBLASInt one=1,bnz; 2955ac90fabeSBarry Smith 2956ac90fabeSBarry Smith PetscFunctionBegin; 2957c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->nz,&bnz);CHKERRQ(ierr); 2958ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 2959f4df32b1SMatthew Knepley PetscScalar alpha = a; 29608b83055fSJed Brown PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one)); 2961acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 2962a3fa217bSJose E.
Roman ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 2963e2cf4d64SStefano Zampini /* the MatAXPY_Basic* subroutines calls MatAssembly, so the matrix on the GPU 2964e2cf4d64SStefano Zampini will be updated */ 2965e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2966e2cf4d64SStefano Zampini if (Y->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) { 2967e2cf4d64SStefano Zampini Y->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 2968e2cf4d64SStefano Zampini } 2969e2cf4d64SStefano Zampini #endif 2970ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2971ab784542SHong Zhang ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 2972ac90fabeSBarry Smith } else { 29738229c054SShri Abhyankar Mat B; 29748229c054SShri Abhyankar PetscInt *nnz; 2975785e854fSJed Brown ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr); 2976ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr); 2977bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 29784aa94f47SShri Abhyankar ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 297933d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr); 2980176df525SBarry Smith ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr); 29818229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 2982ecd8bba6SJed Brown ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr); 2983ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 298428be2f97SBarry Smith ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 29858229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 2986ac90fabeSBarry Smith } 2987ac90fabeSBarry Smith PetscFunctionReturn(0); 2988ac90fabeSBarry Smith } 2989ac90fabeSBarry Smith 29907087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 
2991354c94deSBarry Smith { 2992354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 2993354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 2994354c94deSBarry Smith PetscInt i,nz; 2995354c94deSBarry Smith PetscScalar *a; 2996354c94deSBarry Smith 2997354c94deSBarry Smith PetscFunctionBegin; 2998354c94deSBarry Smith nz = aij->nz; 2999354c94deSBarry Smith a = aij->a; 30002205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 3001e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 3002e2cf4d64SStefano Zampini if (mat->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) mat->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 3003e2cf4d64SStefano Zampini #endif 3004354c94deSBarry Smith #else 3005354c94deSBarry Smith PetscFunctionBegin; 3006354c94deSBarry Smith #endif 3007354c94deSBarry Smith PetscFunctionReturn(0); 3008354c94deSBarry Smith } 3009354c94deSBarry Smith 3010985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3011e34fafa9SBarry Smith { 3012e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3013e34fafa9SBarry Smith PetscErrorCode ierr; 3014d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3015e34fafa9SBarry Smith PetscReal atmp; 3016985db425SBarry Smith PetscScalar *x; 3017e34fafa9SBarry Smith MatScalar *aa; 3018e34fafa9SBarry Smith 3019e34fafa9SBarry Smith PetscFunctionBegin; 3020e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3021e34fafa9SBarry Smith aa = a->a; 3022e34fafa9SBarry Smith ai = a->i; 3023e34fafa9SBarry Smith aj = a->j; 3024e34fafa9SBarry Smith 3025985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3026e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3027e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3028e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3029e34fafa9SBarry Smith for 
(i=0; i<m; i++) { 3030e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 30319189402eSHong Zhang x[i] = 0.0; 3032e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3033985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3034985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3035985db425SBarry Smith aa++; aj++; 3036985db425SBarry Smith } 3037985db425SBarry Smith } 3038985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3039985db425SBarry Smith PetscFunctionReturn(0); 3040985db425SBarry Smith } 3041985db425SBarry Smith 3042985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3043985db425SBarry Smith { 3044985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3045985db425SBarry Smith PetscErrorCode ierr; 3046d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3047985db425SBarry Smith PetscScalar *x; 3048985db425SBarry Smith MatScalar *aa; 3049985db425SBarry Smith 3050985db425SBarry Smith PetscFunctionBegin; 3051e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3052985db425SBarry Smith aa = a->a; 3053985db425SBarry Smith ai = a->i; 3054985db425SBarry Smith aj = a->j; 3055985db425SBarry Smith 3056985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3057985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3058985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3059e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3060985db425SBarry Smith for (i=0; i<m; i++) { 3061985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3062d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3063985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3064985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3065985db425SBarry Smith x[i] = 0.0; 3066985db425SBarry Smith if (idx) { 
3067985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3068985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 3069985db425SBarry Smith if (aj[j] > j) { 3070985db425SBarry Smith idx[i] = j; 3071985db425SBarry Smith break; 3072985db425SBarry Smith } 3073985db425SBarry Smith } 3074985db425SBarry Smith } 3075985db425SBarry Smith } 3076985db425SBarry Smith for (j=0; j<ncols; j++) { 3077985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3078985db425SBarry Smith aa++; aj++; 3079985db425SBarry Smith } 3080985db425SBarry Smith } 3081985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3082985db425SBarry Smith PetscFunctionReturn(0); 3083985db425SBarry Smith } 3084985db425SBarry Smith 3085c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3086c87e5d42SMatthew Knepley { 3087c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3088c87e5d42SMatthew Knepley PetscErrorCode ierr; 3089c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3090c87e5d42SMatthew Knepley PetscReal atmp; 3091c87e5d42SMatthew Knepley PetscScalar *x; 3092c87e5d42SMatthew Knepley MatScalar *aa; 3093c87e5d42SMatthew Knepley 3094c87e5d42SMatthew Knepley PetscFunctionBegin; 3095e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3096c87e5d42SMatthew Knepley aa = a->a; 3097c87e5d42SMatthew Knepley ai = a->i; 3098c87e5d42SMatthew Knepley aj = a->j; 3099c87e5d42SMatthew Knepley 3100c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 3101c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3102c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 310360e0710aSBarry Smith if (n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %D vs. 
%D rows", A->rmap->n, n); 3104c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3105c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3106289a08f5SMatthew Knepley if (ncols) { 3107289a08f5SMatthew Knepley /* Get first nonzero */ 3108289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3109289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 31102205254eSKarl Rupp if (atmp > 1.0e-12) { 31112205254eSKarl Rupp x[i] = atmp; 31122205254eSKarl Rupp if (idx) idx[i] = aj[j]; 31132205254eSKarl Rupp break; 31142205254eSKarl Rupp } 3115289a08f5SMatthew Knepley } 311612431cb0SMatthew G Knepley if (j == ncols) {x[i] = PetscAbsScalar(*aa); if (idx) idx[i] = *aj;} 3117289a08f5SMatthew Knepley } else { 3118289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 3119289a08f5SMatthew Knepley } 3120c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 3121c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 3122289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3123c87e5d42SMatthew Knepley aa++; aj++; 3124c87e5d42SMatthew Knepley } 3125c87e5d42SMatthew Knepley } 3126c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3127c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3128c87e5d42SMatthew Knepley } 3129c87e5d42SMatthew Knepley 3130985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3131985db425SBarry Smith { 3132985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3133985db425SBarry Smith PetscErrorCode ierr; 3134d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3135d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3136985db425SBarry Smith PetscScalar *x; 3137d9ca1df4SBarry Smith const MatScalar *aa; 3138985db425SBarry Smith 3139985db425SBarry Smith PetscFunctionBegin; 3140e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3141985db425SBarry Smith aa = a->a; 3142985db425SBarry Smith ai = 
a->i; 3143985db425SBarry Smith aj = a->j; 3144985db425SBarry Smith 3145985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3146985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3147985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3148e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3149985db425SBarry Smith for (i=0; i<m; i++) { 3150985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3151d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3152985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3153985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3154985db425SBarry Smith x[i] = 0.0; 3155985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3156985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3157985db425SBarry Smith for (j=0; j<ncols; j++) { 3158985db425SBarry Smith if (aj[j] > j) { 3159985db425SBarry Smith idx[i] = j; 3160985db425SBarry Smith break; 3161985db425SBarry Smith } 3162985db425SBarry Smith } 3163985db425SBarry Smith } 3164985db425SBarry Smith } 3165985db425SBarry Smith for (j=0; j<ncols; j++) { 3166985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3167985db425SBarry Smith aa++; aj++; 3168e34fafa9SBarry Smith } 3169e34fafa9SBarry Smith } 3170e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3171e34fafa9SBarry Smith PetscFunctionReturn(0); 3172e34fafa9SBarry Smith } 3173bbead8a2SBarry Smith 3174713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3175bbead8a2SBarry Smith { 3176bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 3177bbead8a2SBarry Smith PetscErrorCode ierr; 317833d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3179bbead8a2SBarry Smith MatScalar 
*diag,work[25],*v_work; 31800da83c2eSBarry Smith const PetscReal shift = 0.0; 31811a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3182bbead8a2SBarry Smith 3183bbead8a2SBarry Smith PetscFunctionBegin; 3184a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 31854a0d0026SBarry Smith if (a->ibdiagvalid) { 31864a0d0026SBarry Smith if (values) *values = a->ibdiag; 31874a0d0026SBarry Smith PetscFunctionReturn(0); 31884a0d0026SBarry Smith } 3189bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 3190bbead8a2SBarry Smith if (!a->ibdiag) { 3191785e854fSJed Brown ierr = PetscMalloc1(bs2*mbs,&a->ibdiag);CHKERRQ(ierr); 31923bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 3193bbead8a2SBarry Smith } 3194bbead8a2SBarry Smith diag = a->ibdiag; 3195bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3196bbead8a2SBarry Smith /* factor and invert each block */ 3197bbead8a2SBarry Smith switch (bs) { 3198bbead8a2SBarry Smith case 1: 3199bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3200bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 3201ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3202ec1892c8SHong Zhang if (allowzeropivot) { 32037b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32047b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32057b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32067b6c816cSBarry Smith ierr = PetscInfo3(A,"Zero pivot, row %D pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);CHKERRQ(ierr); 32077b6c816cSBarry Smith } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3208ec1892c8SHong Zhang } 3209bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 
3210bbead8a2SBarry Smith } 3211bbead8a2SBarry Smith break; 3212bbead8a2SBarry Smith case 2: 3213bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3214bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 3215bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 3216a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 321896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 3219bbead8a2SBarry Smith diag += 4; 3220bbead8a2SBarry Smith } 3221bbead8a2SBarry Smith break; 3222bbead8a2SBarry Smith case 3: 3223bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3224bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 3225bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 3226a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32277b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 322896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 3229bbead8a2SBarry Smith diag += 9; 3230bbead8a2SBarry Smith } 3231bbead8a2SBarry Smith break; 3232bbead8a2SBarry Smith case 4: 3233bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3234bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 3235bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 3236a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32377b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 323896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 3239bbead8a2SBarry Smith diag += 16; 3240bbead8a2SBarry Smith } 3241bbead8a2SBarry Smith break; 3242bbead8a2SBarry Smith case 5: 
3243bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3244bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 3245bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 3246a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32477b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 324896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 3249bbead8a2SBarry Smith diag += 25; 3250bbead8a2SBarry Smith } 3251bbead8a2SBarry Smith break; 3252bbead8a2SBarry Smith case 6: 3253bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3254bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 3255bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 3256a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32577b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 325896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 3259bbead8a2SBarry Smith diag += 36; 3260bbead8a2SBarry Smith } 3261bbead8a2SBarry Smith break; 3262bbead8a2SBarry Smith case 7: 3263bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3264bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3265bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3266a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32677b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 326896b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 3269bbead8a2SBarry Smith diag += 49; 3270bbead8a2SBarry 
Smith } 3271bbead8a2SBarry Smith break; 3272bbead8a2SBarry Smith default: 3273dcca6d9dSJed Brown ierr = PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ);CHKERRQ(ierr); 3274bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3275bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3276bbead8a2SBarry Smith IJ[j] = bs*i + j; 3277bbead8a2SBarry Smith } 3278bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 32795f8bbccaSHong Zhang ierr = PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32807b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 328196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr); 3282bbead8a2SBarry Smith diag += bs2; 3283bbead8a2SBarry Smith } 3284bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3285bbead8a2SBarry Smith } 3286bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3287bbead8a2SBarry Smith PetscFunctionReturn(0); 3288bbead8a2SBarry Smith } 3289bbead8a2SBarry Smith 329073a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 329173a71a0fSBarry Smith { 329273a71a0fSBarry Smith PetscErrorCode ierr; 329373a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 329473a71a0fSBarry Smith PetscScalar a; 329573a71a0fSBarry Smith PetscInt m,n,i,j,col; 329673a71a0fSBarry Smith 329773a71a0fSBarry Smith PetscFunctionBegin; 329873a71a0fSBarry Smith if (!x->assembled) { 329973a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 330073a71a0fSBarry Smith for (i=0; i<m; i++) { 330173a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 330273a71a0fSBarry Smith ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 330373a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 330473a71a0fSBarry Smith ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 330573a71a0fSBarry Smith } 330673a71a0fSBarry Smith } 3307e2ce353bSJunchao Zhang } else { 
3308e2ce353bSJunchao Zhang for (i=0; i<aij->nz; i++) {ierr = PetscRandomGetValue(rctx,aij->a+i);CHKERRQ(ierr);} 3309e2ce353bSJunchao Zhang } 331073a71a0fSBarry Smith ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 331173a71a0fSBarry Smith ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 331273a71a0fSBarry Smith PetscFunctionReturn(0); 331373a71a0fSBarry Smith } 331473a71a0fSBarry Smith 3315679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3316679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3317679944adSJunchao Zhang { 3318679944adSJunchao Zhang PetscErrorCode ierr; 3319679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3320679944adSJunchao Zhang PetscScalar a; 3321679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3322679944adSJunchao Zhang 3323679944adSJunchao Zhang PetscFunctionBegin; 3324679944adSJunchao Zhang nskip = high - low; 3325679944adSJunchao Zhang ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 3326679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3327679944adSJunchao Zhang for (i=0; i<m; i++) { 3328679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 3329679944adSJunchao Zhang ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 3330679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3331679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 3332679944adSJunchao Zhang ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 3333679944adSJunchao Zhang } 3334e2ce353bSJunchao Zhang } 3335679944adSJunchao Zhang ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3336679944adSJunchao Zhang ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3337679944adSJunchao Zhang PetscFunctionReturn(0); 3338679944adSJunchao Zhang } 3339679944adSJunchao Zhang 3340679944adSJunchao Zhang 
3341682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 33420a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3343cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3344cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3345cb5b572fSBarry Smith MatMult_SeqAIJ, 334697304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 33477c922b88SBarry Smith MatMultTranspose_SeqAIJ, 33487c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3349db4efbfdSBarry Smith 0, 3350db4efbfdSBarry Smith 0, 3351db4efbfdSBarry Smith 0, 3352db4efbfdSBarry Smith /* 10*/ 0, 3353cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3354cb5b572fSBarry Smith 0, 335541f059aeSBarry Smith MatSOR_SeqAIJ, 335691e9d3e2SHong Zhang MatTranspose_SeqAIJ, 335797304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3358cb5b572fSBarry Smith MatEqual_SeqAIJ, 3359cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3360cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3361cb5b572fSBarry Smith MatNorm_SeqAIJ, 336297304618SKris Buschelman /* 20*/ 0, 3363cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3364cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3365cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3366d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3367db4efbfdSBarry Smith 0, 3368db4efbfdSBarry Smith 0, 3369db4efbfdSBarry Smith 0, 3370db4efbfdSBarry Smith 0, 33714994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3372db4efbfdSBarry Smith 0, 3373db4efbfdSBarry Smith 0, 33748c778c55SBarry Smith 0, 33758c778c55SBarry Smith 0, 3376d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3377cb5b572fSBarry Smith 0, 3378cb5b572fSBarry Smith 0, 3379cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3380cb5b572fSBarry Smith 0, 3381d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 33827dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3383cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3384cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3385cb5b572fSBarry Smith MatCopy_SeqAIJ, 3386d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 
3387cb5b572fSBarry Smith MatScale_SeqAIJ, 33887d68702bSBarry Smith MatShift_SeqAIJ, 338979299369SBarry Smith MatDiagonalSet_SeqAIJ, 33906e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 339173a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 33923b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 33933b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 33943b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3395a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 339693dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3397b9617806SBarry Smith 0, 33980513a670SBarry Smith 0, 3399cda55fadSBarry Smith MatPermute_SeqAIJ, 3400cda55fadSBarry Smith 0, 3401d519adbfSMatthew Knepley /* 59*/ 0, 3402b9b97703SBarry Smith MatDestroy_SeqAIJ, 3403b9b97703SBarry Smith MatView_SeqAIJ, 3404357abbc8SBarry Smith 0, 3405321b30b9SSatish Balay MatMatMatMult_SeqAIJ_SeqAIJ_SeqAIJ, 3406321b30b9SSatish Balay /* 64*/ MatMatMatMultSymbolic_SeqAIJ_SeqAIJ_SeqAIJ, 3407321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3408ee4f033dSBarry Smith 0, 3409ee4f033dSBarry Smith 0, 3410ee4f033dSBarry Smith 0, 3411d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3412c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3413ee4f033dSBarry Smith 0, 3414dcf5cc72SBarry Smith 0, 34152c93a97aSBarry Smith 0, 34162c93a97aSBarry Smith /* 74*/ 0, 34173acb8795SBarry Smith MatFDColoringApply_AIJ, 341897304618SKris Buschelman 0, 341997304618SKris Buschelman 0, 342097304618SKris Buschelman 0, 34216ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 342297304618SKris Buschelman 0, 342397304618SKris Buschelman 0, 342497304618SKris Buschelman 0, 3425bc011b1eSHong Zhang MatLoad_SeqAIJ, 3426d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 34271cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 34286284ec50SHong Zhang 0, 34296284ec50SHong Zhang 0, 3430bc011b1eSHong Zhang 0, 3431d519adbfSMatthew Knepley /* 89*/ MatMatMult_SeqAIJ_SeqAIJ, 343226be0446SHong Zhang MatMatMultSymbolic_SeqAIJ_SeqAIJ, 343326be0446SHong Zhang 
MatMatMultNumeric_SeqAIJ_SeqAIJ, 343465e8a0caSHong Zhang MatPtAP_SeqAIJ_SeqAIJ, 34358fa4b5a6SHong Zhang MatPtAPSymbolic_SeqAIJ_SeqAIJ_SparseAxpy, 34368fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 34376fc122caSHong Zhang MatMatTransposeMult_SeqAIJ_SeqAIJ, 34386fc122caSHong Zhang MatMatTransposeMultSymbolic_SeqAIJ_SeqAIJ, 34396fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 34402121bac1SHong Zhang 0, 34412121bac1SHong Zhang /* 99*/ 0, 3442609c6c4dSKris Buschelman 0, 3443609c6c4dSKris Buschelman 0, 344487d4246cSBarry Smith MatConjugate_SeqAIJ, 344587d4246cSBarry Smith 0, 3446d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 344799cafbc1SBarry Smith MatRealPart_SeqAIJ, 3448f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3449f5edf698SHong Zhang 0, 34502bebee5dSHong Zhang 0, 3451cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3452985db425SBarry Smith 0, 34532af78befSBarry Smith MatGetRowMin_SeqAIJ, 34542af78befSBarry Smith 0, 3455599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3456d519adbfSMatthew Knepley /*114*/ 0, 3457599ef60dSHong Zhang 0, 34583c2a7987SHong Zhang 0, 3459fe97e370SBarry Smith 0, 3460fbdbba38SShri Abhyankar 0, 3461fbdbba38SShri Abhyankar /*119*/ 0, 3462fbdbba38SShri Abhyankar 0, 3463fbdbba38SShri Abhyankar 0, 346482d44351SHong Zhang 0, 3465b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 34660716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3467bbead8a2SBarry Smith MatGetColumnNorms_SeqAIJ, 346837868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 34690da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 347037868618SMatthew G Knepley 0, 34715df89d91SHong Zhang /*129*/ 0, 347275648e8dSHong Zhang MatTransposeMatMult_SeqAIJ_SeqAIJ, 347375648e8dSHong Zhang MatTransposeMatMultSymbolic_SeqAIJ_SeqAIJ, 347475648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3475b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3476b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 
34772b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 34782b8ad9a3SHong Zhang MatRARt_SeqAIJ_SeqAIJ, 34792b8ad9a3SHong Zhang MatRARtSymbolic_SeqAIJ_SeqAIJ, 34803964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 34813964eb88SJed Brown /*139*/0, 3482f9426fe0SMark Adams 0, 34831919a2e2SJed Brown 0, 34843a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 34859c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 34862d033e1fSHong Zhang /*144*/MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 34872d033e1fSHong Zhang MatDestroySubMatrices_SeqAIJ 34889e29f15eSvictorle }; 348917ab2063SBarry Smith 34907087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3491bef8e0ddSBarry Smith { 3492bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 349397f1f81fSBarry Smith PetscInt i,nz,n; 3494bef8e0ddSBarry Smith 3495bef8e0ddSBarry Smith PetscFunctionBegin; 3496bef8e0ddSBarry Smith nz = aij->maxnz; 3497d0f46423SBarry Smith n = mat->rmap->n; 3498bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3499bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3500bef8e0ddSBarry Smith } 3501bef8e0ddSBarry Smith aij->nz = nz; 3502bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3503bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3504bef8e0ddSBarry Smith } 3505bef8e0ddSBarry Smith PetscFunctionReturn(0); 3506bef8e0ddSBarry Smith } 3507bef8e0ddSBarry Smith 3508a3bb6f32SFande Kong /* 3509e8b528d9SFande Kong * When a sparse matrix has many zero columns, we should compact them out to save the space 3510a3bb6f32SFande Kong * This happens in MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3511a3bb6f32SFande Kong * */ 3512a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3513a3bb6f32SFande Kong { 3514a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3515a3bb6f32SFande Kong PetscTable gid1_lid1; 3516a3bb6f32SFande Kong PetscTablePosition tpos; 3517a3bb6f32SFande Kong PetscInt gid,lid,i,j,ncols,ec; 
3518a3bb6f32SFande Kong PetscInt *garray; 3519a3bb6f32SFande Kong PetscErrorCode ierr; 3520a3bb6f32SFande Kong 3521a3bb6f32SFande Kong PetscFunctionBegin; 3522a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3523a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3524a3bb6f32SFande Kong /* use a table */ 3525a3bb6f32SFande Kong ierr = PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr); 3526a3bb6f32SFande Kong ec = 0; 3527a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3528a3bb6f32SFande Kong ncols = aij->i[i+1] - aij->i[i]; 3529a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3530a3bb6f32SFande Kong PetscInt data,gid1 = aij->j[aij->i[i] + j] + 1; 3531a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr); 3532a3bb6f32SFande Kong if (!data) { 3533a3bb6f32SFande Kong /* one based table */ 3534a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr); 3535a3bb6f32SFande Kong } 3536a3bb6f32SFande Kong } 3537a3bb6f32SFande Kong } 3538a3bb6f32SFande Kong /* form array of columns we need */ 3539a3bb6f32SFande Kong ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr); 3540a3bb6f32SFande Kong ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr); 3541a3bb6f32SFande Kong while (tpos) { 3542a3bb6f32SFande Kong ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr); 3543a3bb6f32SFande Kong gid--; 3544a3bb6f32SFande Kong lid--; 3545a3bb6f32SFande Kong garray[lid] = gid; 3546a3bb6f32SFande Kong } 3547a3bb6f32SFande Kong ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */ 3548a3bb6f32SFande Kong ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr); 3549a3bb6f32SFande Kong for (i=0; i<ec; i++) { 3550a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr); 3551a3bb6f32SFande Kong } 3552a3bb6f32SFande Kong /* compact out the extra columns in B */ 3553a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3554a3bb6f32SFande 
Kong ncols = aij->i[i+1] - aij->i[i]; 3555a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3556a3bb6f32SFande Kong PetscInt gid1 = aij->j[aij->i[i] + j] + 1; 3557a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr); 3558a3bb6f32SFande Kong lid--; 3559a3bb6f32SFande Kong aij->j[aij->i[i] + j] = lid; 3560a3bb6f32SFande Kong } 3561a3bb6f32SFande Kong } 3562a3bb6f32SFande Kong mat->cmap->n = mat->cmap->N = ec; 3563a3bb6f32SFande Kong mat->cmap->bs = 1; 3564a3bb6f32SFande Kong 3565a3bb6f32SFande Kong ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr); 3566a3bb6f32SFande Kong ierr = PetscLayoutSetUp((mat->cmap));CHKERRQ(ierr); 3567a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping);CHKERRQ(ierr); 3568a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH);CHKERRQ(ierr); 3569a3bb6f32SFande Kong PetscFunctionReturn(0); 3570a3bb6f32SFande Kong } 3571a3bb6f32SFande Kong 3572bef8e0ddSBarry Smith /*@ 3573bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3574bef8e0ddSBarry Smith in the matrix. 3575bef8e0ddSBarry Smith 3576bef8e0ddSBarry Smith Input Parameters: 3577bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3578bef8e0ddSBarry Smith - indices - the column indices 3579bef8e0ddSBarry Smith 358015091d37SBarry Smith Level: advanced 358115091d37SBarry Smith 3582bef8e0ddSBarry Smith Notes: 3583bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3584bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3585bef8e0ddSBarry Smith of the MatSetValues() operation. 3586bef8e0ddSBarry Smith 3587bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3588d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 
3589bef8e0ddSBarry Smith 3590bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3591bef8e0ddSBarry Smith 3592b9617806SBarry Smith The indices should start with zero, not one. 3593b9617806SBarry Smith 3594bef8e0ddSBarry Smith @*/ 35957087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3596bef8e0ddSBarry Smith { 35974ac538c5SBarry Smith PetscErrorCode ierr; 3598bef8e0ddSBarry Smith 3599bef8e0ddSBarry Smith PetscFunctionBegin; 36000700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 36014482741eSBarry Smith PetscValidPointer(indices,2); 36024ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr); 3603bef8e0ddSBarry Smith PetscFunctionReturn(0); 3604bef8e0ddSBarry Smith } 3605bef8e0ddSBarry Smith 3606be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3607be6bf707SBarry Smith 36087087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3609be6bf707SBarry Smith { 3610be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 36116849ba73SBarry Smith PetscErrorCode ierr; 3612d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3613be6bf707SBarry Smith 3614be6bf707SBarry Smith PetscFunctionBegin; 3615169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3616be6bf707SBarry Smith 3617be6bf707SBarry Smith /* allocate space for values if not already there */ 3618be6bf707SBarry Smith if (!aij->saved_values) { 3619854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr); 36203bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3621be6bf707SBarry Smith } 3622be6bf707SBarry Smith 3623be6bf707SBarry Smith /* copy values over */ 3624580bdb30SBarry Smith ierr = 
PetscArraycpy(aij->saved_values,aij->a,nz);CHKERRQ(ierr); 3625be6bf707SBarry Smith PetscFunctionReturn(0); 3626be6bf707SBarry Smith } 3627be6bf707SBarry Smith 3628be6bf707SBarry Smith /*@ 3629be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3630be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3631be6bf707SBarry Smith nonlinear portion. 3632be6bf707SBarry Smith 3633be6bf707SBarry Smith Collect on Mat 3634be6bf707SBarry Smith 3635be6bf707SBarry Smith Input Parameters: 36360e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3637be6bf707SBarry Smith 363815091d37SBarry Smith Level: advanced 363915091d37SBarry Smith 3640be6bf707SBarry Smith Common Usage, with SNESSolve(): 3641be6bf707SBarry Smith $ Create Jacobian matrix 3642be6bf707SBarry Smith $ Set linear terms into matrix 3643be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3644be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3645be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3646512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3647be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3648be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3649be6bf707SBarry Smith $ In your Jacobian routine 3650be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3651be6bf707SBarry Smith $ Set nonlinear terms in matrix 3652be6bf707SBarry Smith 3653be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself: 3654be6bf707SBarry Smith $ // build linear portion of Jacobian 3655512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3656be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3657be6bf707SBarry Smith $ loop over nonlinear iterations 3658be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3659be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3660be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3661be6bf707SBarry Smith $ Solve linear system with Jacobian 3662be6bf707SBarry Smith $ endloop 3663be6bf707SBarry Smith 3664be6bf707SBarry Smith Notes: 3665be6bf707SBarry Smith Matrix must already be assembled before calling this routine 3666512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3667be6bf707SBarry Smith calling this routine. 3668be6bf707SBarry Smith 36690c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 36700c468ba9SBarry Smith and does not allocate additional space. 
36710c468ba9SBarry Smith 3672be6bf707SBarry Smith .seealso: MatRetrieveValues() 3673be6bf707SBarry Smith 3674be6bf707SBarry Smith @*/ 36757087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3676be6bf707SBarry Smith { 36774ac538c5SBarry Smith PetscErrorCode ierr; 3678be6bf707SBarry Smith 3679be6bf707SBarry Smith PetscFunctionBegin; 36800700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3681e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3682e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 36834ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3684be6bf707SBarry Smith PetscFunctionReturn(0); 3685be6bf707SBarry Smith } 3686be6bf707SBarry Smith 36877087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3688be6bf707SBarry Smith { 3689be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 36906849ba73SBarry Smith PetscErrorCode ierr; 3691d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3692be6bf707SBarry Smith 3693be6bf707SBarry Smith PetscFunctionBegin; 3694169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3695f23aa3ddSBarry Smith if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3696be6bf707SBarry Smith /* copy values over */ 3697580bdb30SBarry Smith ierr = PetscArraycpy(aij->a,aij->saved_values,nz);CHKERRQ(ierr); 3698be6bf707SBarry Smith PetscFunctionReturn(0); 3699be6bf707SBarry Smith } 3700be6bf707SBarry Smith 3701be6bf707SBarry Smith /*@ 3702be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3703be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3704be6bf707SBarry Smith nonlinear portion. 
3705be6bf707SBarry Smith 3706be6bf707SBarry Smith Collect on Mat 3707be6bf707SBarry Smith 3708be6bf707SBarry Smith Input Parameters: 3709386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3710be6bf707SBarry Smith 371115091d37SBarry Smith Level: advanced 371215091d37SBarry Smith 3713be6bf707SBarry Smith .seealso: MatStoreValues() 3714be6bf707SBarry Smith 3715be6bf707SBarry Smith @*/ 37167087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3717be6bf707SBarry Smith { 37184ac538c5SBarry Smith PetscErrorCode ierr; 3719be6bf707SBarry Smith 3720be6bf707SBarry Smith PetscFunctionBegin; 37210700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3722e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3723e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 37244ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3725be6bf707SBarry Smith PetscFunctionReturn(0); 3726be6bf707SBarry Smith } 3727be6bf707SBarry Smith 3728f83d6046SBarry Smith 3729be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 373017ab2063SBarry Smith /*@C 3731682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 37320d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 37336e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 373451c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 37352bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 
373617ab2063SBarry Smith 3737d083f849SBarry Smith Collective 3738db81eaa0SLois Curfman McInnes 373917ab2063SBarry Smith Input Parameters: 3740db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 374117ab2063SBarry Smith . m - number of rows 374217ab2063SBarry Smith . n - number of columns 374317ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 374451c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 37450298fd71SBarry Smith (possibly different for each row) or NULL 374617ab2063SBarry Smith 374717ab2063SBarry Smith Output Parameter: 3748416022c9SBarry Smith . A - the matrix 374917ab2063SBarry Smith 3750175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3751f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3752175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3753175b88e8SBarry Smith 3754b259b22eSLois Curfman McInnes Notes: 375549a6f317SBarry Smith If nnz is given then nz is ignored 375649a6f317SBarry Smith 375717ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 375817ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 37590002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 376044cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 376117ab2063SBarry Smith 376217ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 37630298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 37643d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 37656da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 
376617ab2063SBarry Smith 3767682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 37684fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3769682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 37706c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 37716c7ebb05SLois Curfman McInnes 37726c7ebb05SLois Curfman McInnes Options Database Keys: 3773698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 37749db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 377517ab2063SBarry Smith 3776027ccd11SLois Curfman McInnes Level: intermediate 3777027ccd11SLois Curfman McInnes 377869b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 377936db0b34SBarry Smith 378017ab2063SBarry Smith @*/ 37817087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 378217ab2063SBarry Smith { 3783dfbe8321SBarry Smith PetscErrorCode ierr; 37846945ee14SBarry Smith 37853a40ed3dSBarry Smith PetscFunctionBegin; 3786f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3787117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3788c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3789d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3790273d9f13SBarry Smith PetscFunctionReturn(0); 3791273d9f13SBarry Smith } 3792273d9f13SBarry Smith 3793273d9f13SBarry Smith /*@C 3794273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3795273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3796273d9f13SBarry Smith (or the array nnz). 
By setting these parameters accurately, performance 3797273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3798273d9f13SBarry Smith 3799d083f849SBarry Smith Collective 3800273d9f13SBarry Smith 3801273d9f13SBarry Smith Input Parameters: 38021c4f3114SJed Brown + B - The matrix 3803273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3804273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38050298fd71SBarry Smith (possibly different for each row) or NULL 3806273d9f13SBarry Smith 3807273d9f13SBarry Smith Notes: 380849a6f317SBarry Smith If nnz is given then nz is ignored 380949a6f317SBarry Smith 3810273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3811273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3812273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3813273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3814273d9f13SBarry Smith 3815273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38160298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3817273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3818273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3819273d9f13SBarry Smith 3820aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3821aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3822aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3823aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3824aa95bbe8SBarry Smith 3825a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3826a96a251dSBarry Smith entries or columns indices 3827a96a251dSBarry Smith 3828273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3829273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3830273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3831273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3832273d9f13SBarry Smith 3833273d9f13SBarry Smith Options Database Keys: 3834698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 383547b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3836273d9f13SBarry Smith 3837273d9f13SBarry Smith Level: intermediate 3838273d9f13SBarry Smith 383969b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3840273d9f13SBarry Smith 3841273d9f13SBarry Smith @*/ 38427087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3843273d9f13SBarry Smith { 38444ac538c5SBarry Smith PetscErrorCode ierr; 3845a23d5eceSKris Buschelman 3846a23d5eceSKris Buschelman PetscFunctionBegin; 38476ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 38486ba663aaSJed Brown PetscValidType(B,1); 38494ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3850a23d5eceSKris Buschelman PetscFunctionReturn(0); 3851a23d5eceSKris Buschelman } 3852a23d5eceSKris Buschelman 38537087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3854a23d5eceSKris Buschelman { 3855273d9f13SBarry Smith Mat_SeqAIJ *b; 38562576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 
38576849ba73SBarry Smith PetscErrorCode ierr; 385897f1f81fSBarry Smith PetscInt i; 3859273d9f13SBarry Smith 3860273d9f13SBarry Smith PetscFunctionBegin; 38612576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3862a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3863c461c341SBarry Smith skipallocation = PETSC_TRUE; 3864c461c341SBarry Smith nz = 0; 3865c461c341SBarry Smith } 386626283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 386726283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3868899cda47SBarry Smith 3869435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 387060e0710aSBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz); 3871071fcb05SBarry Smith #if defined(PETSC_USE_DEBUG) 3872b73539f3SBarry Smith if (nnz) { 3873d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 387460e0710aSBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]); 387560e0710aSBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %D value %d rowlength %D",i,nnz[i],B->cmap->n); 3876b73539f3SBarry Smith } 3877b73539f3SBarry Smith } 3878071fcb05SBarry Smith #endif 3879b73539f3SBarry Smith 3880273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 38812205254eSKarl Rupp 3882273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3883273d9f13SBarry Smith 3884ab93d7beSBarry Smith if (!skipallocation) { 38852ee49352SLisandro Dalcin if (!b->imax) { 3886071fcb05SBarry Smith ierr = PetscMalloc1(B->rmap->n,&b->imax);CHKERRQ(ierr); 3887071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3888071fcb05SBarry Smith } 3889071fcb05SBarry Smith if (!b->ilen) { 3890071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 3891071fcb05SBarry Smith ierr = PetscCalloc1(B->rmap->n,&b->ilen);CHKERRQ(ierr); 3892071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3893071fcb05SBarry Smith } else { 3894071fcb05SBarry Smith ierr = PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 38952ee49352SLisandro Dalcin } 3896846b4da1SFande Kong if (!b->ipre) { 3897846b4da1SFande Kong ierr = PetscMalloc1(B->rmap->n,&b->ipre);CHKERRQ(ierr); 3898846b4da1SFande Kong ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3899846b4da1SFande Kong } 3900273d9f13SBarry Smith if (!nnz) { 3901435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3902c62bd62aSJed Brown else if (nz < 0) nz = 1; 39035d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 3904d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3905d0f46423SBarry Smith nz = nz*B->rmap->n; 3906273d9f13SBarry Smith } else { 3907c73702f5SBarry Smith PetscInt64 nz64 = 0; 3908c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 3909c73702f5SBarry Smith ierr = PetscIntCast(nz64,&nz);CHKERRQ(ierr); 3910273d9f13SBarry Smith } 3911ab93d7beSBarry Smith 3912273d9f13SBarry Smith /* allocate the matrix space */ 391353dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39142ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3915396832f4SHong Zhang if (B->structure_only) { 39165848002fSHong Zhang ierr = PetscMalloc1(nz,&b->j);CHKERRQ(ierr); 39175848002fSHong Zhang ierr = PetscMalloc1(B->rmap->n+1,&b->i);CHKERRQ(ierr); 3918396832f4SHong Zhang ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt));CHKERRQ(ierr); 3919396832f4SHong Zhang } else { 3920dcca6d9dSJed Brown ierr = PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i);CHKERRQ(ierr); 39213bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3922396832f4SHong Zhang } 3923bfeeae90SHong Zhang b->i[0] = 0; 3924d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 39255da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 39265da197adSKris Buschelman } 3927396832f4SHong Zhang if (B->structure_only) { 3928396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3929396832f4SHong Zhang b->free_a = PETSC_FALSE; 3930396832f4SHong Zhang } else { 3931273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3932e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3933396832f4SHong Zhang } 3934e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3935c461c341SBarry Smith } else { 3936e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3937e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3938c461c341SBarry Smith } 3939273d9f13SBarry Smith 3940846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3941846b4da1SFande Kong /* reserve user-requested sparsity */ 3942580bdb30SBarry Smith ierr = PetscArraycpy(b->ipre,b->imax,B->rmap->n);CHKERRQ(ierr); 3943846b4da1SFande Kong } 3944846b4da1SFande Kong 3945846b4da1SFande Kong 3946273d9f13SBarry Smith b->nz = 0; 3947273d9f13SBarry Smith b->maxnz = nz; 3948273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 39492205254eSKarl Rupp if (realalloc) { 39502205254eSKarl Rupp ierr = 
MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 39512205254eSKarl Rupp } 3952cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 3953cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 3954273d9f13SBarry Smith PetscFunctionReturn(0); 3955273d9f13SBarry Smith } 3956273d9f13SBarry Smith 3957846b4da1SFande Kong 3958846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 3959846b4da1SFande Kong { 3960846b4da1SFande Kong Mat_SeqAIJ *a; 3961a5bbaf83SFande Kong PetscInt i; 3962846b4da1SFande Kong PetscErrorCode ierr; 3963846b4da1SFande Kong 3964846b4da1SFande Kong PetscFunctionBegin; 3965846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 396614d0e64fSAlex Lindsay 396714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 396814d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 396914d0e64fSAlex Lindsay 3970846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 39712c814fdeSFande Kong /* if no saved info, we error out */ 3972fb4dc15dSAlex Lindsay if (!a->ipre) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info \n"); 39732c814fdeSFande Kong 3974fb4dc15dSAlex Lindsay if (!a->i || !a->j || !a->a || !a->imax || !a->ilen) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation \n"); 39752c814fdeSFande Kong 3976580bdb30SBarry Smith ierr = PetscArraycpy(a->imax,a->ipre,A->rmap->n);CHKERRQ(ierr); 3977580bdb30SBarry Smith ierr = PetscArrayzero(a->ilen,A->rmap->n);CHKERRQ(ierr); 3978846b4da1SFande Kong a->i[0] = 0; 3979846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 3980846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 3981846b4da1SFande Kong } 3982846b4da1SFande Kong A->preallocated = PETSC_TRUE; 3983846b4da1SFande Kong a->nz = 0; 3984846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 3985846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 3986846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 3987846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 3988846b4da1SFande Kong PetscFunctionReturn(0); 3989846b4da1SFande Kong } 3990846b4da1SFande Kong 399158d36128SBarry Smith /*@ 3992a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 3993a1661176SMatthew Knepley 3994a1661176SMatthew Knepley Input Parameters: 3995a1661176SMatthew Knepley + B - the matrix 3996a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 3997a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 3998a1661176SMatthew Knepley - v - optional values in the matrix 3999a1661176SMatthew Knepley 4000a1661176SMatthew Knepley Level: developer 4001a1661176SMatthew Knepley 400258d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 400358d36128SBarry Smith 4004c1c1d628SHong Zhang .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ 4005a1661176SMatthew Knepley @*/ 4006a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4007a1661176SMatthew Knepley { 4008a1661176SMatthew Knepley PetscErrorCode ierr; 4009a1661176SMatthew Knepley 4010a1661176SMatthew Knepley PetscFunctionBegin; 40110700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 40126ba663aaSJed Brown PetscValidType(B,1); 40134ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 4014a1661176SMatthew Knepley PetscFunctionReturn(0); 4015a1661176SMatthew Knepley } 4016a1661176SMatthew Knepley 40177087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4018a1661176SMatthew Knepley { 4019a1661176SMatthew Knepley PetscInt 
i; 4020a1661176SMatthew Knepley PetscInt m,n; 4021a1661176SMatthew Knepley PetscInt nz; 4022a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 4023a1661176SMatthew Knepley PetscErrorCode ierr; 4024a1661176SMatthew Knepley 4025a1661176SMatthew Knepley PetscFunctionBegin; 402665e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 4027779a8d59SSatish Balay 4028779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 4029779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 4030779a8d59SSatish Balay 4031779a8d59SSatish Balay ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 4032854ce69bSBarry Smith ierr = PetscMalloc1(m+1, &nnz);CHKERRQ(ierr); 4033a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4034b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 4035a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 403665e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 4037a1661176SMatthew Knepley nnz[i] = nz; 4038a1661176SMatthew Knepley } 4039a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 4040a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 4041a1661176SMatthew Knepley 4042a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4043071fcb05SBarry Smith ierr = MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? 
v + Ii[i] : NULL, INSERT_VALUES);CHKERRQ(ierr); 4044a1661176SMatthew Knepley } 4045a1661176SMatthew Knepley 4046a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4047a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4048a1661176SMatthew Knepley 40497827cd58SJed Brown ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 4050a1661176SMatthew Knepley PetscFunctionReturn(0); 4051a1661176SMatthew Knepley } 4052a1661176SMatthew Knepley 4053c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4054af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4055170fe5c8SBarry Smith 4056170fe5c8SBarry Smith /* 4057170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4058170fe5c8SBarry Smith 4059170fe5c8SBarry Smith n p p 4060170fe5c8SBarry Smith ( ) ( ) ( ) 4061170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 4062170fe5c8SBarry Smith ( ) ( ) ( ) 4063170fe5c8SBarry Smith 4064170fe5c8SBarry Smith */ 4065170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4066170fe5c8SBarry Smith { 4067170fe5c8SBarry Smith PetscErrorCode ierr; 4068170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4069170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4070170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 40711de00fd4SBarry Smith PetscInt i,n,m,q,p; 4072170fe5c8SBarry Smith const PetscInt *ii,*idx; 4073170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4074170fe5c8SBarry Smith PetscScalar *c,*c_q; 4075170fe5c8SBarry Smith 4076170fe5c8SBarry Smith PetscFunctionBegin; 4077d0f46423SBarry Smith m = A->rmap->n; 4078d0f46423SBarry Smith n = A->cmap->n; 4079d0f46423SBarry Smith p = B->cmap->n; 4080170fe5c8SBarry Smith a = sub_a->v; 4081170fe5c8SBarry Smith b = sub_b->a; 4082170fe5c8SBarry Smith c = sub_c->v; 4083580bdb30SBarry Smith ierr = PetscArrayzero(c,m*p);CHKERRQ(ierr); 
4084170fe5c8SBarry Smith 4085170fe5c8SBarry Smith ii = sub_b->i; 4086170fe5c8SBarry Smith idx = sub_b->j; 4087170fe5c8SBarry Smith for (i=0; i<n; i++) { 4088170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4089170fe5c8SBarry Smith while (q-->0) { 4090170fe5c8SBarry Smith c_q = c + m*(*idx); 4091170fe5c8SBarry Smith a_q = a + m*i; 4092854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4093170fe5c8SBarry Smith idx++; 4094170fe5c8SBarry Smith b++; 4095170fe5c8SBarry Smith } 4096170fe5c8SBarry Smith } 4097170fe5c8SBarry Smith PetscFunctionReturn(0); 4098170fe5c8SBarry Smith } 4099170fe5c8SBarry Smith 4100170fe5c8SBarry Smith PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat *C) 4101170fe5c8SBarry Smith { 4102170fe5c8SBarry Smith PetscErrorCode ierr; 4103d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 4104170fe5c8SBarry Smith Mat Cmat; 4105170fe5c8SBarry Smith 4106170fe5c8SBarry Smith PetscFunctionBegin; 410760e0710aSBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %D != B->rmap->n %D\n",A->cmap->n,B->rmap->n); 4108ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Cmat);CHKERRQ(ierr); 4109170fe5c8SBarry Smith ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 411033d57670SJed Brown ierr = MatSetBlockSizesFromMats(Cmat,A,B);CHKERRQ(ierr); 4111170fe5c8SBarry Smith ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 41120298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(Cmat,NULL);CHKERRQ(ierr); 4113d73949e8SHong Zhang 4114d73949e8SHong Zhang Cmat->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 41152205254eSKarl Rupp 4116170fe5c8SBarry Smith *C = Cmat; 4117170fe5c8SBarry Smith PetscFunctionReturn(0); 4118170fe5c8SBarry Smith } 4119170fe5c8SBarry Smith 4120170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 4121150d2497SBarry Smith PETSC_INTERN PetscErrorCode MatMatMult_SeqDense_SeqAIJ(Mat A,Mat B,MatReuse scall,PetscReal 
fill,Mat *C) 4122170fe5c8SBarry Smith { 4123170fe5c8SBarry Smith PetscErrorCode ierr; 4124170fe5c8SBarry Smith 4125170fe5c8SBarry Smith PetscFunctionBegin; 4126170fe5c8SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 41273ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 4128170fe5c8SBarry Smith ierr = MatMatMultSymbolic_SeqDense_SeqAIJ(A,B,fill,C);CHKERRQ(ierr); 41293ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr); 4130170fe5c8SBarry Smith } 41313ff4c91cSHong Zhang ierr = PetscLogEventBegin(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 4132170fe5c8SBarry Smith ierr = MatMatMultNumeric_SeqDense_SeqAIJ(A,B,*C);CHKERRQ(ierr); 41333ff4c91cSHong Zhang ierr = PetscLogEventEnd(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr); 4134170fe5c8SBarry Smith PetscFunctionReturn(0); 4135170fe5c8SBarry Smith } 4136170fe5c8SBarry Smith 4137170fe5c8SBarry Smith 41380bad9183SKris Buschelman /*MC 4139fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 41400bad9183SKris Buschelman based on compressed sparse row format. 41410bad9183SKris Buschelman 41420bad9183SKris Buschelman Options Database Keys: 41430bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 41440bad9183SKris Buschelman 41450bad9183SKris Buschelman Level: beginner 41460bad9183SKris Buschelman 4147*0cd7f59aSBarry Smith Notes: 4148*0cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 4149*0cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 4150*0cd7f59aSBarry Smith in the matrix 4151*0cd7f59aSBarry Smith 4152*0cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored

  Developer Notes:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to MATSEQAIJ when constructed with a single process communicator,
   and MATMPIAIJ otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions()

  Developer Notes:
    Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when
   enough exist.
4176ccd284c7SBarry Smith 4177ccd284c7SBarry Smith Level: beginner 4178ccd284c7SBarry Smith 4179ccd284c7SBarry Smith .seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ,MATMPIAIJ 4180ccd284c7SBarry Smith M*/ 4181ccd284c7SBarry Smith 4182ccd284c7SBarry Smith /*MC 4183ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4184ccd284c7SBarry Smith 4185ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4186ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4187ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4188ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4189ccd284c7SBarry Smith the above preallocation routines for simplicity. 4190ccd284c7SBarry Smith 4191ccd284c7SBarry Smith Options Database Keys: 4192ccd284c7SBarry Smith . 
-mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions()

  Level: beginner

.seealso: MatCreateMPIAIJCRL, MATSEQAIJCRL, MATMPIAIJCRL
M*/

/*
   Prototypes for conversion and product routines that MatCreate_SeqAIJ() composes
   onto every SeqAIJ matrix under string keys such as "MatConvert_seqaij_seqdense_C".
   The Elemental and hypre entries are only declared when PETSc is configured with
   the corresponding package.
*/
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*);
#if defined(PETSC_HAVE_ELEMENTAL)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*);
#endif
#if defined(PETSC_HAVE_HYPRE)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*);
PETSC_INTERN PetscErrorCode MatMatMatMult_Transpose_AIJ_AIJ(Mat,Mat,Mat,MatReuse,PetscReal,Mat*);
#endif
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat,MatType,MatReuse,Mat*);

PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*);
PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*);
PETSC_INTERN PetscErrorCode MatPtAP_IS_XAIJ(Mat,Mat,MatReuse,PetscReal,Mat*);

/*@C
   MatSeqAIJGetArray - gives access to the array where the data for a MATSEQAIJ matrix is stored

   Not Collective

   Input Parameter:
.  A - a MATSEQAIJ matrix

   Output Parameter:
.
array - pointer to the data

   Level: intermediate

.seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90()
@*/
PetscErrorCode  MatSeqAIJGetArray(Mat A,PetscScalar **array)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* dispatch to whatever routine is composed on A under "MatSeqAIJGetArray_C" */
  ierr = PetscUseMethod(A,"MatSeqAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row

   Not Collective

   Input Parameter:
.  A - a MATSEQAIJ matrix

   Output Parameter:
.
nz - the maximum number of nonzeros in any row

   Level: intermediate

.seealso: MatSeqAIJSetPreallocation(), MatCreateSeqAIJ()
@*/
PetscErrorCode  MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz)
{
  /* A->data is read as a Mat_SeqAIJ without a type check; the caller must pass a SeqAIJ matrix */
  Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)A->data;

  PetscFunctionBegin;
  *nz = aij->rmax;
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray()

   Not Collective

   Input Parameters:
+  A - a MATSEQAIJ matrix
-  array - pointer to the data

   Level: intermediate

.seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90()
@*/
PetscErrorCode  MatSeqAIJRestoreArray(Mat A,PetscScalar **array)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* dispatch to whatever routine is composed on A under "MatSeqAIJRestoreArray_C" */
  ierr = PetscUseMethod(A,"MatSeqAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#if defined(PETSC_HAVE_CUDA)
/* NOTE(review): declared with a single Mat argument, yet MatCreate_SeqAIJ() composes it as
   "MatConvert_seqaij_seqaijcusparse_C" next to converters declared as (Mat,MatType,MatReuse,Mat*)
   -- confirm the prototype matches the definition */
PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat);
#endif

PETSC_EXTERN PetscErrorCode
MatCreate_SeqAIJ(Mat B) 4288273d9f13SBarry Smith { 4289273d9f13SBarry Smith Mat_SeqAIJ *b; 4290dfbe8321SBarry Smith PetscErrorCode ierr; 429138baddfdSBarry Smith PetscMPIInt size; 4292273d9f13SBarry Smith 4293273d9f13SBarry Smith PetscFunctionBegin; 4294ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 4295e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4296273d9f13SBarry Smith 4297b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 42982205254eSKarl Rupp 4299b0a32e0cSBarry Smith B->data = (void*)b; 43002205254eSKarl Rupp 4301549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 4302071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 43032205254eSKarl Rupp 4304416022c9SBarry Smith b->row = 0; 4305416022c9SBarry Smith b->col = 0; 430682bf6240SBarry Smith b->icol = 0; 4307b810aeb4SBarry Smith b->reallocs = 0; 430836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4309f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4310416022c9SBarry Smith b->nonew = 0; 4311416022c9SBarry Smith b->diag = 0; 4312416022c9SBarry Smith b->solve_work = 0; 43132a1b7f2aSHong Zhang B->spptr = 0; 4314be6bf707SBarry Smith b->saved_values = 0; 4315d7f994e1SBarry Smith b->idiag = 0; 431671f1c65dSBarry Smith b->mdiag = 0; 431771f1c65dSBarry Smith b->ssor_work = 0; 431871f1c65dSBarry Smith b->omega = 1.0; 431971f1c65dSBarry Smith b->fshift = 0.0; 432071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4321bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4322a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 432317ab2063SBarry Smith 432435d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 4325bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJGetArray_C",MatSeqAIJGetArray_SeqAIJ);CHKERRQ(ierr); 4326bdf89e91SBarry 
Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJRestoreArray_C",MatSeqAIJRestoreArray_SeqAIJ);CHKERRQ(ierr); 43278c778c55SBarry Smith 4328b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 4329bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 4330bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 4331b3866ffcSBarry Smith #endif 433217f1a0eaSHong Zhang 4333bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 4334bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 4335bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 4336bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 4337bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 4338bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 43394dfdc2d9SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 43409779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 43414a2a386eSRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4342191b95cbSRichard Tran Mills #endif 434334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 434402fe1965SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE);CHKERRQ(ierr); 434502fe1965SBarry Smith #endif 4346bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 4347af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 4348af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental);CHKERRQ(ierr); 4349af8000cdSHong Zhang #endif 435063c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 435163c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE);CHKERRQ(ierr); 43523dad0653Sstefano_zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMatMult_transpose_seqaij_seqaij_C",MatMatMatMult_Transpose_AIJ_AIJ);CHKERRQ(ierr); 435363c07aadSStefano Zampini #endif 4354b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense);CHKERRQ(ierr); 4355d4002b98SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL);CHKERRQ(ierr); 4356c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS);CHKERRQ(ierr); 4357bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4358bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4359bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 4360846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ);CHKERRQ(ierr); 4361bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 4362bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 4363bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMult_seqdense_seqaij_C",MatMatMult_SeqDense_SeqAIJ);CHKERRQ(ierr); 4364bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr); 4365bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr); 436675d48cdbSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatPtAP_is_seqaij_C",MatPtAP_IS_XAIJ);CHKERRQ(ierr); 43674108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 436817667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 43694099cc6bSBarry Smith ierr = MatSeqAIJSetTypeFromOptions(B);CHKERRQ(ierr); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 43703a40ed3dSBarry Smith PetscFunctionReturn(0); 437117ab2063SBarry Smith } 437217ab2063SBarry Smith 4373b24902e0SBarry Smith /* 4374b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4375b24902e0SBarry Smith */ 4376ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 437717ab2063SBarry Smith { 4378416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 43796849ba73SBarry Smith PetscErrorCode ierr; 4380071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 438117ab2063SBarry Smith 43823a40ed3dSBarry Smith PetscFunctionBegin; 4383273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 4384273d9f13SBarry Smith 4385d5f3da31SBarry Smith C->factortype = 
A->factortype; 4386416022c9SBarry Smith c->row = 0; 4387416022c9SBarry Smith c->col = 0; 438882bf6240SBarry Smith c->icol = 0; 43896ad4291fSHong Zhang c->reallocs = 0; 439017ab2063SBarry Smith 43916ad4291fSHong Zhang C->assembled = PETSC_TRUE; 439217ab2063SBarry Smith 4393aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 4394aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 4395eec197d1SBarry Smith 4396071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->imax);CHKERRQ(ierr); 4397071fcb05SBarry Smith ierr = PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt));CHKERRQ(ierr); 4398071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->ilen);CHKERRQ(ierr); 4399071fcb05SBarry Smith ierr = PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt));CHKERRQ(ierr); 44003bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 440117ab2063SBarry Smith 440217ab2063SBarry Smith /* allocate the matrix space */ 4403f77e22a1SHong Zhang if (mallocmatspace) { 4404dcca6d9dSJed Brown ierr = PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i);CHKERRQ(ierr); 44053bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 44062205254eSKarl Rupp 4407f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 44082205254eSKarl Rupp 4409580bdb30SBarry Smith ierr = PetscArraycpy(c->i,a->i,m+1);CHKERRQ(ierr); 441017ab2063SBarry Smith if (m > 0) { 4411580bdb30SBarry Smith ierr = PetscArraycpy(c->j,a->j,a->i[m]);CHKERRQ(ierr); 4412be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 4413580bdb30SBarry Smith ierr = PetscArraycpy(c->a,a->a,a->i[m]);CHKERRQ(ierr); 4414be6bf707SBarry Smith } else { 4415580bdb30SBarry Smith ierr = PetscArrayzero(c->a,a->i[m]);CHKERRQ(ierr); 441617ab2063SBarry Smith } 441708480c60SBarry Smith } 4418f77e22a1SHong Zhang } 441917ab2063SBarry Smith 44206ad4291fSHong Zhang c->ignorezeroentries = 
a->ignorezeroentries; 4421416022c9SBarry Smith c->roworiented = a->roworiented; 4422416022c9SBarry Smith c->nonew = a->nonew; 4423416022c9SBarry Smith if (a->diag) { 4424854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&c->diag);CHKERRQ(ierr); 4425071fcb05SBarry Smith ierr = PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt));CHKERRQ(ierr); 44263bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 4427071fcb05SBarry Smith } else c->diag = NULL; 44282205254eSKarl Rupp 44296ad4291fSHong Zhang c->solve_work = 0; 44306ad4291fSHong Zhang c->saved_values = 0; 44316ad4291fSHong Zhang c->idiag = 0; 443271f1c65dSBarry Smith c->ssor_work = 0; 4433a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4434e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4435e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 44366ad4291fSHong Zhang 4437893ad86cSHong Zhang c->rmax = a->rmax; 4438416022c9SBarry Smith c->nz = a->nz; 44398ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4440273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 4441754ec7b1SSatish Balay 44426ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 44436ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4444cd6b891eSBarry Smith if (a->compressedrow.use) { 44456ad4291fSHong Zhang i = a->compressedrow.nrows; 4446dcca6d9dSJed Brown ierr = PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex);CHKERRQ(ierr); 4447580bdb30SBarry Smith ierr = PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1);CHKERRQ(ierr); 4448580bdb30SBarry Smith ierr = PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i);CHKERRQ(ierr); 444927ea64f8SHong Zhang } else { 445027ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 44510298fd71SBarry Smith c->compressedrow.i = NULL; 44520298fd71SBarry Smith c->compressedrow.rindex = NULL; 44536ad4291fSHong Zhang } 4454ea632784SBarry Smith c->nonzerorowcnt = 
a->nonzerorowcnt; 4455e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 44564846f1f5SKris Buschelman 44572205254eSKarl Rupp ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 4458140e18c1SBarry Smith ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 44593a40ed3dSBarry Smith PetscFunctionReturn(0); 446017ab2063SBarry Smith } 446117ab2063SBarry Smith 4462b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4463b24902e0SBarry Smith { 4464b24902e0SBarry Smith PetscErrorCode ierr; 4465b24902e0SBarry Smith 4466b24902e0SBarry Smith PetscFunctionBegin; 4467ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 44684b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4469cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 447033d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 4471cfd3f464SBarry Smith } 4472a54f2f98SBarry Smith ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 4473f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 4474b24902e0SBarry Smith PetscFunctionReturn(0); 4475b24902e0SBarry Smith } 4476b24902e0SBarry Smith 4477112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4478fbdbba38SShri Abhyankar { 447952f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 448052f91c60SVaclav Hapla PetscErrorCode ierr; 448152f91c60SVaclav Hapla 448252f91c60SVaclav Hapla PetscFunctionBegin; 448352f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 448452f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4485c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 4486c27b3999SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 448752f91c60SVaclav Hapla ierr 
= PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 448852f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 448952f91c60SVaclav Hapla if (isbinary) { 449052f91c60SVaclav Hapla ierr = MatLoad_SeqAIJ_Binary(newMat,viewer);CHKERRQ(ierr); 449152f91c60SVaclav Hapla } else if (ishdf5) { 449252f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 449352f91c60SVaclav Hapla ierr = MatLoad_AIJ_HDF5(newMat,viewer);CHKERRQ(ierr); 449452f91c60SVaclav Hapla #else 449552f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 449652f91c60SVaclav Hapla #endif 449752f91c60SVaclav Hapla } else { 449852f91c60SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 449952f91c60SVaclav Hapla } 450052f91c60SVaclav Hapla PetscFunctionReturn(0); 450152f91c60SVaclav Hapla } 450252f91c60SVaclav Hapla 450352f91c60SVaclav Hapla PetscErrorCode MatLoad_SeqAIJ_Binary(Mat newMat, PetscViewer viewer) 450452f91c60SVaclav Hapla { 4505fbdbba38SShri Abhyankar Mat_SeqAIJ *a; 4506fbdbba38SShri Abhyankar PetscErrorCode ierr; 4507fbdbba38SShri Abhyankar PetscInt i,sum,nz,header[4],*rowlengths = 0,M,N,rows,cols; 4508fbdbba38SShri Abhyankar int fd; 4509fbdbba38SShri Abhyankar PetscMPIInt size; 4510fbdbba38SShri Abhyankar MPI_Comm comm; 45113059b6faSBarry Smith PetscInt bs = newMat->rmap->bs; 4512fbdbba38SShri Abhyankar 4513fbdbba38SShri Abhyankar PetscFunctionBegin; 4514fbdbba38SShri Abhyankar ierr = PetscObjectGetComm((PetscObject)viewer,&comm);CHKERRQ(ierr); 4515fbdbba38SShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 4516fbdbba38SShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"view must have one processor"); 4517bbead8a2SBarry Smith 
45180298fd71SBarry Smith ierr = PetscOptionsBegin(comm,NULL,"Options for loading SEQAIJ matrix","Mat");CHKERRQ(ierr); 45190298fd71SBarry Smith ierr = PetscOptionsInt("-matload_block_size","Set the blocksize used to store the matrix","MatLoad",bs,&bs,NULL);CHKERRQ(ierr); 4520bbead8a2SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 45213059b6faSBarry Smith if (bs < 0) bs = 1; 45223059b6faSBarry Smith ierr = MatSetBlockSize(newMat,bs);CHKERRQ(ierr); 4523bbead8a2SBarry Smith 4524fbdbba38SShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 45259860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 4526fbdbba38SShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"not matrix object in file"); 4527fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 4528fbdbba38SShri Abhyankar 4529bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk,cannot load as SeqAIJ"); 4530fbdbba38SShri Abhyankar 4531fbdbba38SShri Abhyankar /* read in row lengths */ 4532785e854fSJed Brown ierr = PetscMalloc1(M,&rowlengths);CHKERRQ(ierr); 45339860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,rowlengths,M,NULL,PETSC_INT);CHKERRQ(ierr); 4534fbdbba38SShri Abhyankar 4535fbdbba38SShri Abhyankar /* check if sum of rowlengths is same as nz */ 4536fbdbba38SShri Abhyankar for (i=0,sum=0; i< M; i++) sum +=rowlengths[i]; 453760e0710aSBarry Smith if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_READ,"Inconsistant matrix data in file. 
no-nonzeros = %dD, sum-row-lengths = %D\n",nz,sum); 4538fbdbba38SShri Abhyankar 4539fbdbba38SShri Abhyankar /* set global size if not set already*/ 4540f501eaabSShri Abhyankar if (newMat->rmap->n < 0 && newMat->rmap->N < 0 && newMat->cmap->n < 0 && newMat->cmap->N < 0) { 4541fbdbba38SShri Abhyankar ierr = MatSetSizes(newMat,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 4542aabbc4fbSShri Abhyankar } else { 45439d36ed5fSBarry Smith /* if sizes and type are already set, check if the matrix global sizes are correct */ 4544fbdbba38SShri Abhyankar ierr = MatGetSize(newMat,&rows,&cols);CHKERRQ(ierr); 45454c5b953cSHong Zhang if (rows < 0 && cols < 0) { /* user might provide local size instead of global size */ 45464c5b953cSHong Zhang ierr = MatGetLocalSize(newMat,&rows,&cols);CHKERRQ(ierr); 45474c5b953cSHong Zhang } 454860e0710aSBarry Smith if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 4549aabbc4fbSShri Abhyankar } 4550fbdbba38SShri Abhyankar ierr = MatSeqAIJSetPreallocation_SeqAIJ(newMat,0,rowlengths);CHKERRQ(ierr); 4551fbdbba38SShri Abhyankar a = (Mat_SeqAIJ*)newMat->data; 4552fbdbba38SShri Abhyankar 45539860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,a->j,nz,NULL,PETSC_INT);CHKERRQ(ierr); 4554fbdbba38SShri Abhyankar 4555fbdbba38SShri Abhyankar /* read in nonzero values */ 45569860990eSLisandro Dalcin ierr = PetscBinaryRead(fd,a->a,nz,NULL,PETSC_SCALAR);CHKERRQ(ierr); 4557fbdbba38SShri Abhyankar 4558fbdbba38SShri Abhyankar /* set matrix "i" values */ 4559fbdbba38SShri Abhyankar a->i[0] = 0; 4560fbdbba38SShri Abhyankar for (i=1; i<= M; i++) { 4561fbdbba38SShri Abhyankar a->i[i] = a->i[i-1] + rowlengths[i-1]; 4562fbdbba38SShri Abhyankar a->ilen[i-1] = rowlengths[i-1]; 4563fbdbba38SShri Abhyankar } 4564fbdbba38SShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 4565fbdbba38SShri Abhyankar 4566fbdbba38SShri Abhyankar ierr = 
MatAssemblyBegin(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4567fbdbba38SShri Abhyankar ierr = MatAssemblyEnd(newMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4568fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4569fbdbba38SShri Abhyankar } 4570fbdbba38SShri Abhyankar 4571ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 45727264ac53SSatish Balay { 45737264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 4574dfbe8321SBarry Smith PetscErrorCode ierr; 4575eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4576eeffb40dSHong Zhang PetscInt k; 4577eeffb40dSHong Zhang #endif 45787264ac53SSatish Balay 45793a40ed3dSBarry Smith PetscFunctionBegin; 4580bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4581d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4582ca44d042SBarry Smith *flg = PETSC_FALSE; 4583ca44d042SBarry Smith PetscFunctionReturn(0); 4584bcd2baecSBarry Smith } 45857264ac53SSatish Balay 45867264ac53SSatish Balay /* if the a->i are the same */ 4587580bdb30SBarry Smith ierr = PetscArraycmp(a->i,b->i,A->rmap->n+1,flg);CHKERRQ(ierr); 4588abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 45897264ac53SSatish Balay 45907264ac53SSatish Balay /* if a->j are the same */ 4591580bdb30SBarry Smith ierr = PetscArraycmp(a->j,b->j,a->nz,flg);CHKERRQ(ierr); 4592abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4593bcd2baecSBarry Smith 4594bcd2baecSBarry Smith /* if a->a are the same */ 4595eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4596eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 4597eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])) { 4598eeffb40dSHong Zhang *flg = PETSC_FALSE; 45993a40ed3dSBarry Smith PetscFunctionReturn(0); 4600eeffb40dSHong Zhang } 4601eeffb40dSHong Zhang } 4602eeffb40dSHong Zhang #else 4603580bdb30SBarry Smith 
ierr = PetscArraycmp(a->a,b->a,a->nz,flg);CHKERRQ(ierr); 4604eeffb40dSHong Zhang #endif 4605eeffb40dSHong Zhang PetscFunctionReturn(0); 46067264ac53SSatish Balay } 460736db0b34SBarry Smith 460805869f15SSatish Balay /*@ 460936db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 461036db0b34SBarry Smith provided by the user. 461136db0b34SBarry Smith 4612d083f849SBarry Smith Collective 461336db0b34SBarry Smith 461436db0b34SBarry Smith Input Parameters: 461536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 461636db0b34SBarry Smith . m - number of rows 461736db0b34SBarry Smith . n - number of columns 4618483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 461936db0b34SBarry Smith . j - column indices 462036db0b34SBarry Smith - a - matrix values 462136db0b34SBarry Smith 462236db0b34SBarry Smith Output Parameter: 462336db0b34SBarry Smith . mat - the matrix 462436db0b34SBarry Smith 462536db0b34SBarry Smith Level: intermediate 462636db0b34SBarry Smith 462736db0b34SBarry Smith Notes: 46280551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4629292fb18eSBarry Smith once the matrix is destroyed and not before 463036db0b34SBarry Smith 463136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 463236db0b34SBarry Smith 4633bfeeae90SHong Zhang The i and j indices are 0 based 463436db0b34SBarry Smith 4635a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4636a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 46378eef79e4SBarry Smith as shown 4638a4552177SSatish Balay 46398eef79e4SBarry Smith $ 1 0 0 46408eef79e4SBarry Smith $ 2 0 3 46418eef79e4SBarry Smith $ 4 5 6 46428eef79e4SBarry Smith $ 46438eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 46448eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 46458eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 4646a4552177SSatish Balay 46479985e31cSBarry Smith 464869b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 464936db0b34SBarry Smith 465036db0b34SBarry Smith @*/ 4651c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 465236db0b34SBarry Smith { 4653dfbe8321SBarry Smith PetscErrorCode ierr; 4654cbcfb4deSHong Zhang PetscInt ii; 465536db0b34SBarry Smith Mat_SeqAIJ *aij; 4656cbcfb4deSHong Zhang #if defined(PETSC_USE_DEBUG) 4657cbcfb4deSHong Zhang PetscInt jj; 4658cbcfb4deSHong Zhang #endif 465936db0b34SBarry Smith 466036db0b34SBarry Smith PetscFunctionBegin; 466141096f02SStefano Zampini if (m > 0 && i[0]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 4662f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4663f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4664a2f3521dSMark F. 
Adams /* ierr = MatSetBlockSizes(*mat,,);CHKERRQ(ierr); */ 4665ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4666ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4667ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 4668071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->imax);CHKERRQ(ierr); 4669071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->ilen);CHKERRQ(ierr); 4670ab93d7beSBarry Smith 467136db0b34SBarry Smith aij->i = i; 467236db0b34SBarry Smith aij->j = j; 467336db0b34SBarry Smith aij->a = a; 467436db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 467536db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4676e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4677e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 467836db0b34SBarry Smith 467936db0b34SBarry Smith for (ii=0; ii<m; ii++) { 468036db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 46812515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 468260e0710aSBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %D length = %D",ii,i[ii+1] - i[ii]); 46839985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4684a061629eSStefano Zampini if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4685a061629eSStefano Zampini if (j[jj] == j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 46869985e31cSBarry Smith } 468736db0b34SBarry Smith #endif 468836db0b34SBarry Smith } 46892515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 469036db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 469160e0710aSBarry Smith if (j[ii] < 0) 
SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %D index = %D",ii,j[ii]); 469260e0710aSBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %D index = %D",ii,j[ii]); 469336db0b34SBarry Smith } 469436db0b34SBarry Smith #endif 469536db0b34SBarry Smith 4696b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4697b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 469836db0b34SBarry Smith PetscFunctionReturn(0); 469936db0b34SBarry Smith } 470080ef6e79SMatthew G Knepley /*@C 4701d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 47028a0b0e6bSVictor Minden provided by the user. 47038a0b0e6bSVictor Minden 4704d083f849SBarry Smith Collective 47058a0b0e6bSVictor Minden 47068a0b0e6bSVictor Minden Input Parameters: 47078a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 47088a0b0e6bSVictor Minden . m - number of rows 47098a0b0e6bSVictor Minden . n - number of columns 47108a0b0e6bSVictor Minden . i - row indices 47118a0b0e6bSVictor Minden . j - column indices 47121230e6d1SVictor Minden . a - matrix values 47131230e6d1SVictor Minden . nz - number of nonzeros 47141230e6d1SVictor Minden - idx - 0 or 1 based 47158a0b0e6bSVictor Minden 47168a0b0e6bSVictor Minden Output Parameter: 47178a0b0e6bSVictor Minden . mat - the matrix 47188a0b0e6bSVictor Minden 47198a0b0e6bSVictor Minden Level: intermediate 47208a0b0e6bSVictor Minden 47218a0b0e6bSVictor Minden Notes: 47228a0b0e6bSVictor Minden The i and j indices are 0 based 47238a0b0e6bSVictor Minden 47248a0b0e6bSVictor Minden The format which is used for the sparse matrix input, is equivalent to a 47258a0b0e6bSVictor Minden row-major ordering.. 
i.e for the following matrix, the input data expected is 47268a0b0e6bSVictor Minden as shown: 47278a0b0e6bSVictor Minden 47288a0b0e6bSVictor Minden 1 0 0 47298a0b0e6bSVictor Minden 2 0 3 47308a0b0e6bSVictor Minden 4 5 6 47318a0b0e6bSVictor Minden 47328a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 47338a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 47348a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 47358a0b0e6bSVictor Minden 47368a0b0e6bSVictor Minden 473769b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 47388a0b0e6bSVictor Minden 47398a0b0e6bSVictor Minden @*/ 4740c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 47418a0b0e6bSVictor Minden { 47428a0b0e6bSVictor Minden PetscErrorCode ierr; 4743d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 47448a0b0e6bSVictor Minden 47458a0b0e6bSVictor Minden 47468a0b0e6bSVictor Minden PetscFunctionBegin; 47471795a4d1SJed Brown ierr = PetscCalloc1(m,&nnz);CHKERRQ(ierr); 47481230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 4749c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 47501230e6d1SVictor Minden } 47518a0b0e6bSVictor Minden ierr = MatCreate(comm,mat);CHKERRQ(ierr); 47528a0b0e6bSVictor Minden ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 47538a0b0e6bSVictor Minden ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 47541230e6d1SVictor Minden ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr); 47551230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 47561230e6d1SVictor Minden if (idx) { 47571230e6d1SVictor Minden row = i[ii] - 1; 47581230e6d1SVictor Minden col = j[ii] - 1; 47591230e6d1SVictor Minden } else { 47601230e6d1SVictor Minden row = i[ii]; 47611230e6d1SVictor Minden col = j[ii]; 47628a0b0e6bSVictor Minden } 47631230e6d1SVictor Minden ierr = 
MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr); 47648a0b0e6bSVictor Minden } 47658a0b0e6bSVictor Minden ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 47668a0b0e6bSVictor Minden ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4767d021a1c5SVictor Minden ierr = PetscFree(nnz);CHKERRQ(ierr); 47688a0b0e6bSVictor Minden PetscFunctionReturn(0); 47698a0b0e6bSVictor Minden } 477036db0b34SBarry Smith 4771acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 4772acf2f550SJed Brown { 4773acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 4774acf2f550SJed Brown PetscErrorCode ierr; 4775acf2f550SJed Brown 4776acf2f550SJed Brown PetscFunctionBegin; 4777acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 4778acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 47792205254eSKarl Rupp 4780acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal_Inode(A);CHKERRQ(ierr); 4781acf2f550SJed Brown PetscFunctionReturn(0); 4782acf2f550SJed Brown } 4783acf2f550SJed Brown 47849c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 47859c8f2541SHong Zhang { 47869c8f2541SHong Zhang PetscErrorCode ierr; 47878761c3d6SHong Zhang PetscMPIInt size; 47889c8f2541SHong Zhang 47899c8f2541SHong Zhang PetscFunctionBegin; 47908761c3d6SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 47917bbdc51dSHong Zhang if (size == 1) { 47927bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 47937bbdc51dSHong Zhang ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 47947bbdc51dSHong Zhang } else { 47958761c3d6SHong Zhang ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 47967bbdc51dSHong Zhang } 47978761c3d6SHong Zhang } else { 47989c8f2541SHong Zhang ierr = MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 47998761c3d6SHong Zhang } 48009c8f2541SHong Zhang PetscFunctionReturn(0); 48019c8f2541SHong Zhang } 
48029c8f2541SHong Zhang 480381824310SBarry Smith /* 480453dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 480553dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 480653dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 480753dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 480853dd7562SDmitry Karpeev */ 480953dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 481053dd7562SDmitry Karpeev { 481153dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 481253dd7562SDmitry Karpeev PetscErrorCode ierr; 481353dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 481453dd7562SDmitry Karpeev PetscBool seqaij; 481553dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 481653dd7562SDmitry Karpeev PetscScalar v; 481753dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 481853dd7562SDmitry Karpeev 481953dd7562SDmitry Karpeev PetscFunctionBegin; 482053dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 482153dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 48224099cc6bSBarry Smith ierr = PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij);CHKERRQ(ierr); 482353dd7562SDmitry Karpeev if (!seqaij) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 482453dd7562SDmitry Karpeev if (rowemb) { 482553dd7562SDmitry Karpeev ierr = ISGetLocalSize(rowemb,&m);CHKERRQ(ierr); 482653dd7562SDmitry Karpeev if (m != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %D is incompatible with matrix row size %D",m,B->rmap->n); 482753dd7562SDmitry Karpeev } else { 48286c4ed002SBarry Smith if (C->rmap->n != B->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 482953dd7562SDmitry Karpeev } 483053dd7562SDmitry Karpeev if (colemb) { 483153dd7562SDmitry Karpeev ierr = ISGetLocalSize(colemb,&n);CHKERRQ(ierr); 483253dd7562SDmitry Karpeev if (n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %D is incompatible with input matrix col size %D",n,B->cmap->n); 483353dd7562SDmitry Karpeev } else { 483453dd7562SDmitry Karpeev if (C->cmap->n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 483553dd7562SDmitry Karpeev } 483653dd7562SDmitry Karpeev 483753dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 483853dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 483953dd7562SDmitry Karpeev ierr = PetscMalloc1(B->rmap->n,&nz);CHKERRQ(ierr); 484053dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 484153dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 484253dd7562SDmitry Karpeev } 484353dd7562SDmitry Karpeev ierr = MatSeqAIJSetPreallocation(C,0,nz);CHKERRQ(ierr); 484453dd7562SDmitry Karpeev ierr = PetscFree(nz);CHKERRQ(ierr); 484553dd7562SDmitry Karpeev } 484653dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 484753dd7562SDmitry Karpeev ierr = MatZeroEntries(C);CHKERRQ(ierr); 484853dd7562SDmitry Karpeev } 484953dd7562SDmitry 
Karpeev count = 0; 485053dd7562SDmitry Karpeev rowindices = NULL; 485153dd7562SDmitry Karpeev colindices = NULL; 485253dd7562SDmitry Karpeev if (rowemb) { 485353dd7562SDmitry Karpeev ierr = ISGetIndices(rowemb,&rowindices);CHKERRQ(ierr); 485453dd7562SDmitry Karpeev } 485553dd7562SDmitry Karpeev if (colemb) { 485653dd7562SDmitry Karpeev ierr = ISGetIndices(colemb,&colindices);CHKERRQ(ierr); 485753dd7562SDmitry Karpeev } 485853dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 485953dd7562SDmitry Karpeev PetscInt row; 486053dd7562SDmitry Karpeev row = i; 486153dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 486253dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 486353dd7562SDmitry Karpeev PetscInt col; 486453dd7562SDmitry Karpeev col = Baij->j[count]; 486553dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 486653dd7562SDmitry Karpeev v = Baij->a[count]; 486753dd7562SDmitry Karpeev ierr = MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES);CHKERRQ(ierr); 486853dd7562SDmitry Karpeev ++count; 486953dd7562SDmitry Karpeev } 487053dd7562SDmitry Karpeev } 487153dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 487253dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 487353dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 487453dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 487553dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 487653dd7562SDmitry Karpeev PetscFunctionReturn(0); 487753dd7562SDmitry Karpeev } 487853dd7562SDmitry Karpeev 48794099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 48804099cc6bSBarry Smith 48814099cc6bSBarry Smith /*@C 48824099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 48834099cc6bSBarry Smith 48844099cc6bSBarry Smith Collective on Mat 48854099cc6bSBarry Smith 48864099cc6bSBarry Smith Input Parameters: 48874099cc6bSBarry Smith + mat - the matrix object 48884099cc6bSBarry Smith - matype - matrix type 48894099cc6bSBarry Smith 48904099cc6bSBarry Smith Options Database Key: 48914099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 48924099cc6bSBarry Smith 48934099cc6bSBarry Smith 48944099cc6bSBarry Smith Level: intermediate 48954099cc6bSBarry Smith 48964099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat 48974099cc6bSBarry Smith @*/ 48984099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 48994099cc6bSBarry Smith { 4900fd9d3c67SJed Brown PetscErrorCode ierr,(*r)(Mat,MatType,MatReuse,Mat*); 49014099cc6bSBarry Smith PetscBool sametype; 49024099cc6bSBarry Smith 49034099cc6bSBarry Smith PetscFunctionBegin; 49044099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 49054099cc6bSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)mat,matype,&sametype);CHKERRQ(ierr); 49064099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 49074099cc6bSBarry Smith 49084099cc6bSBarry Smith ierr = PetscFunctionListFind(MatSeqAIJList,matype,&r);CHKERRQ(ierr); 49094099cc6bSBarry Smith if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 49104099cc6bSBarry Smith ierr = (*r)(mat,matype,MAT_INPLACE_MATRIX,&mat);CHKERRQ(ierr); 49114099cc6bSBarry 
Smith PetscFunctionReturn(0); 49124099cc6bSBarry Smith } 49134099cc6bSBarry Smith 49144099cc6bSBarry Smith 49154099cc6bSBarry Smith /*@C 49164099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 49174099cc6bSBarry Smith 49184099cc6bSBarry Smith Not Collective 49194099cc6bSBarry Smith 49204099cc6bSBarry Smith Input Parameters: 49214099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 49224099cc6bSBarry Smith - function - routine to convert to subtype 49234099cc6bSBarry Smith 49244099cc6bSBarry Smith Notes: 49254099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 49264099cc6bSBarry Smith 49274099cc6bSBarry Smith 49284099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 49294099cc6bSBarry Smith $ -mat_seqaij_type my_mat 49304099cc6bSBarry Smith 49314099cc6bSBarry Smith Level: advanced 49324099cc6bSBarry Smith 49334099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll() 49344099cc6bSBarry Smith 49354099cc6bSBarry Smith 49364099cc6bSBarry Smith Level: advanced 49374099cc6bSBarry Smith @*/ 4938388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 49394099cc6bSBarry Smith { 49404099cc6bSBarry Smith PetscErrorCode ierr; 49414099cc6bSBarry Smith 49424099cc6bSBarry Smith PetscFunctionBegin; 49439cc31a68SJed Brown ierr = MatInitializePackage();CHKERRQ(ierr); 49444099cc6bSBarry Smith ierr = PetscFunctionListAdd(&MatSeqAIJList,sname,function);CHKERRQ(ierr); 49454099cc6bSBarry Smith PetscFunctionReturn(0); 49464099cc6bSBarry Smith } 49474099cc6bSBarry Smith 49484099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 49494099cc6bSBarry Smith 49504099cc6bSBarry Smith /*@C 49514099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 49524099cc6bSBarry Smith 
49534099cc6bSBarry Smith Not Collective 49544099cc6bSBarry Smith 49554099cc6bSBarry Smith Level: advanced 49564099cc6bSBarry Smith 49574099cc6bSBarry Smith Developers Note: CUSP and CUSPARSE do not yet support the MatConvert_SeqAIJ..() paradigm and thus cannot be registered here 49584099cc6bSBarry Smith 49594099cc6bSBarry Smith .seealso: MatRegisterAll(), MatSeqAIJRegister() 49604099cc6bSBarry Smith @*/ 49614099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 49624099cc6bSBarry Smith { 49634099cc6bSBarry Smith PetscErrorCode ierr; 49644099cc6bSBarry Smith 49654099cc6bSBarry Smith PetscFunctionBegin; 49664099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 49674099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 49684099cc6bSBarry Smith 49694099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 49704099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 49714dfdc2d9SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 49729779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49736b62b571SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4974485f9817SRichard Tran Mills #endif 49754099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 49764099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL);CHKERRQ(ierr); 49774099cc6bSBarry Smith #endif 49784099cc6bSBarry Smith PetscFunctionReturn(0); 49794099cc6bSBarry Smith } 498053dd7562SDmitry Karpeev 498153dd7562SDmitry Karpeev /* 498281824310SBarry Smith Special version for direct calls from Fortran 498381824310SBarry Smith */ 4984af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 498581824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 498681824310SBarry Smith #define matsetvaluesseqaij_ 
MATSETVALUESSEQAIJ 498781824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 498881824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 498981824310SBarry Smith #endif 499081824310SBarry Smith 499181824310SBarry Smith /* Change these macros so can be used in void function */ 499281824310SBarry Smith #undef CHKERRQ 4993ce94432eSBarry Smith #define CHKERRQ(ierr) CHKERRABORT(PetscObjectComm((PetscObject)A),ierr) 499481824310SBarry Smith #undef SETERRQ2 4995e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 49964994cf47SJed Brown #undef SETERRQ3 49974994cf47SJed Brown #define SETERRQ3(comm,ierr,b,c,d,e) CHKERRABORT(comm,ierr) 499881824310SBarry Smith 49998cc058d9SJed Brown PETSC_EXTERN void PETSC_STDCALL matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 500081824310SBarry Smith { 500181824310SBarry Smith Mat A = *AA; 500281824310SBarry Smith PetscInt m = *mm, n = *nn; 500381824310SBarry Smith InsertMode is = *isis; 500481824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 500581824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 500681824310SBarry Smith PetscInt *imax,*ai,*ailen; 500781824310SBarry Smith PetscErrorCode ierr; 500881824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 500954f21887SBarry Smith MatScalar *ap,value,*aa; 5010ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5011ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 501281824310SBarry Smith 501381824310SBarry Smith PetscFunctionBegin; 50144994cf47SJed Brown MatCheckPreallocated(A,1); 501581824310SBarry Smith imax = a->imax; 501681824310SBarry Smith ai = a->i; 501781824310SBarry Smith ailen = a->ilen; 501881824310SBarry Smith aj = a->j; 501981824310SBarry Smith aa = a->a; 502081824310SBarry Smith 502181824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 
502281824310SBarry Smith row = im[k]; 502381824310SBarry Smith if (row < 0) continue; 502481824310SBarry Smith #if defined(PETSC_USE_DEBUG) 5025ce94432eSBarry Smith if (row >= A->rmap->n) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 502681824310SBarry Smith #endif 502781824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 502881824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 502981824310SBarry Smith low = 0; 503081824310SBarry Smith high = nrow; 503181824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 503281824310SBarry Smith if (in[l] < 0) continue; 503381824310SBarry Smith #if defined(PETSC_USE_DEBUG) 5034ce94432eSBarry Smith if (in[l] >= A->cmap->n) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 503581824310SBarry Smith #endif 503681824310SBarry Smith col = in[l]; 50372205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 50382205254eSKarl Rupp else value = v[k + l*m]; 50392205254eSKarl Rupp 504081824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 504181824310SBarry Smith 50422205254eSKarl Rupp if (col <= lastcol) low = 0; 50432205254eSKarl Rupp else high = nrow; 504481824310SBarry Smith lastcol = col; 504581824310SBarry Smith while (high-low > 5) { 504681824310SBarry Smith t = (low+high)/2; 504781824310SBarry Smith if (rp[t] > col) high = t; 504881824310SBarry Smith else low = t; 504981824310SBarry Smith } 505081824310SBarry Smith for (i=low; i<high; i++) { 505181824310SBarry Smith if (rp[i] > col) break; 505281824310SBarry Smith if (rp[i] == col) { 505381824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 505481824310SBarry Smith else ap[i] = value; 505581824310SBarry Smith goto noinsert; 505681824310SBarry Smith } 505781824310SBarry Smith } 505881824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 505981824310SBarry Smith if (nonew == 1) goto noinsert; 5060ce94432eSBarry Smith if 
(nonew == -1) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 5061fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 506281824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 506381824310SBarry Smith /* shift up all the later entries in this row */ 506481824310SBarry Smith for (ii=N; ii>=i; ii--) { 506581824310SBarry Smith rp[ii+1] = rp[ii]; 506681824310SBarry Smith ap[ii+1] = ap[ii]; 506781824310SBarry Smith } 506881824310SBarry Smith rp[i] = col; 506981824310SBarry Smith ap[i] = value; 5070e56f5c9eSBarry Smith A->nonzerostate++; 507181824310SBarry Smith noinsert:; 507281824310SBarry Smith low = i + 1; 507381824310SBarry Smith } 507481824310SBarry Smith ailen[row] = nrow; 507581824310SBarry Smith } 507681824310SBarry Smith PetscFunctionReturnVoid(); 507781824310SBarry Smith } 5078