1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 114099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 124099cc6bSBarry Smith { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A,type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24857cbf51SRichard Tran Mills PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A,PetscInt type,PetscReal *reductions) 250716a85fSBarry Smith { 260716a85fSBarry Smith PetscInt i,m,n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&m,&n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions,n)); 320716a85fSBarry Smith if (type == NORM_2) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 34a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else if (type == NORM_1) { 370716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 38a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 390716a85fSBarry Smith } 400716a85fSBarry Smith } else if (type == NORM_INFINITY) { 410716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 42a873a8cdSSam Reynolds reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),reductions[aij->j[i]]); 430716a85fSBarry Smith } 44857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 45a873a8cdSSam Reynolds for (i=0; i<aij->i[m]; i++) { 46857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 47a873a8cdSSam Reynolds } 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49857cbf51SRichard Tran Mills for (i=0; i<aij->i[m]; i++) { 50857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 51857cbf51SRichard Tran Mills } 52857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown reduction type"); 530716a85fSBarry Smith 540716a85fSBarry Smith if (type == NORM_2) { 55a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 56857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 57a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] /= m; 580716a85fSBarry Smith } 590716a85fSBarry Smith PetscFunctionReturn(0); 600716a85fSBarry Smith } 610716a85fSBarry Smith 623a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 633a062f41SBarry Smith { 643a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 653a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 663a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 673a062f41SBarry Smith PetscInt *rows; 683a062f41SBarry Smith 693a062f41SBarry Smith PetscFunctionBegin; 703a062f41SBarry Smith for (i=0; i<m; i++) { 713a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 723a062f41SBarry Smith cnt++; 733a062f41SBarry Smith } 743a062f41SBarry Smith } 759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 763a062f41SBarry Smith cnt = 0; 773a062f41SBarry Smith for (i=0; i<m; i++) { 783a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 793a062f41SBarry Smith rows[cnt] = i; 803a062f41SBarry Smith cnt++; 813a062f41SBarry Smith } 823a062f41SBarry Smith } 839566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is)); 843a062f41SBarry Smith PetscFunctionReturn(0); 853a062f41SBarry Smith } 863a062f41SBarry Smith 87f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 886ce1633cSBarry Smith { 896ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 90fff043a9SJunchao Zhang const MatScalar *aa; 916ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 92b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 936ce1633cSBarry Smith PetscInt *rows; 946ce1633cSBarry Smith 956ce1633cSBarry Smith PetscFunctionBegin; 969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 979566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 986ce1633cSBarry Smith diag = a->diag; 996ce1633cSBarry Smith for (i=0; i<m; i++) { 100b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1016ce1633cSBarry Smith cnt++; 1026ce1633cSBarry Smith } 1036ce1633cSBarry Smith } 1049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 1056ce1633cSBarry Smith cnt = 0; 1066ce1633cSBarry Smith for (i=0; i<m; i++) { 107b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1086ce1633cSBarry Smith rows[cnt++] = i; 1096ce1633cSBarry Smith } 1106ce1633cSBarry Smith } 111f1f41ecbSJed Brown *nrows = cnt; 112f1f41ecbSJed Brown *zrows = rows; 1139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 114f1f41ecbSJed Brown PetscFunctionReturn(0); 115f1f41ecbSJed Brown } 116f1f41ecbSJed Brown 117f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 118f1f41ecbSJed Brown { 119f1f41ecbSJed Brown PetscInt nrows,*rows; 120f1f41ecbSJed Brown 121f1f41ecbSJed Brown PetscFunctionBegin; 1220298fd71SBarry Smith *zrows = NULL; 1239566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows)); 1249566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows)); 1256ce1633cSBarry Smith PetscFunctionReturn(0); 1266ce1633cSBarry Smith } 1276ce1633cSBarry Smith 128b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 129b3a44c85SBarry Smith { 130b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 131b3a44c85SBarry Smith const MatScalar *aa; 132b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 133b3a44c85SBarry Smith const PetscInt *ii; 134b3a44c85SBarry Smith PetscInt n,i,j,*rows; 135b3a44c85SBarry Smith 136b3a44c85SBarry Smith PetscFunctionBegin; 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 138f4259b30SLisandro Dalcin *keptrows = NULL; 139b3a44c85SBarry Smith ii = a->i; 140b3a44c85SBarry Smith for (i=0; i<m; i++) { 141b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 142b3a44c85SBarry Smith if (!n) { 143b3a44c85SBarry Smith cnt++; 144b3a44c85SBarry Smith goto ok1; 145b3a44c85SBarry Smith } 1462e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 147b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 148b3a44c85SBarry Smith } 149b3a44c85SBarry Smith cnt++; 150b3a44c85SBarry Smith ok1:; 151b3a44c85SBarry Smith } 1522e5835c6SStefano Zampini if (!cnt) { 1539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1542e5835c6SStefano Zampini PetscFunctionReturn(0); 1552e5835c6SStefano Zampini } 1569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n-cnt,&rows)); 157b3a44c85SBarry Smith cnt = 0; 158b3a44c85SBarry Smith for (i=0; i<m; i++) { 159b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 160b3a44c85SBarry Smith if (!n) continue; 1612e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 162b3a44c85SBarry Smith if (aa[j] != 0.0) { 163b3a44c85SBarry Smith rows[cnt++] = i; 164b3a44c85SBarry Smith break; 165b3a44c85SBarry Smith } 166b3a44c85SBarry Smith } 167b3a44c85SBarry Smith } 1689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1699566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows)); 170b3a44c85SBarry Smith PetscFunctionReturn(0); 171b3a44c85SBarry Smith } 172b3a44c85SBarry Smith 1737087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 17479299369SBarry Smith { 17579299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17699e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17799e65526SBarry Smith const PetscInt *diag; 1782e5835c6SStefano Zampini MatScalar *aa; 17999e65526SBarry Smith const PetscScalar *v; 180ace3abfcSBarry Smith PetscBool missing; 18179299369SBarry Smith 18279299369SBarry Smith PetscFunctionBegin; 18309f38230SBarry Smith if (Y->assembled) { 1849566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y,&missing,NULL)); 18509f38230SBarry Smith if (!missing) { 18679299369SBarry Smith diag = aij->diag; 1879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D,&v)); 1889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&aa)); 18979299369SBarry Smith if (is == INSERT_VALUES) { 19079299369SBarry Smith for (i=0; i<m; i++) { 19179299369SBarry Smith aa[diag[i]] = v[i]; 19279299369SBarry Smith } 19379299369SBarry Smith } else { 19479299369SBarry Smith for (i=0; i<m; i++) { 19579299369SBarry Smith aa[diag[i]] += v[i]; 19679299369SBarry Smith } 19779299369SBarry Smith } 1989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&aa)); 1999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D,&v)); 20079299369SBarry Smith PetscFunctionReturn(0); 20179299369SBarry Smith } 2029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 20309f38230SBarry Smith } 2049566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y,D,is)); 20509f38230SBarry Smith PetscFunctionReturn(0); 20609f38230SBarry Smith } 20779299369SBarry Smith 2081a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 20917ab2063SBarry Smith { 210416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21197f1f81fSBarry Smith PetscInt i,ishift; 21217ab2063SBarry Smith 2133a40ed3dSBarry Smith PetscFunctionBegin; 214d0f46423SBarry Smith *m = A->rmap->n; 2153a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 216bfeeae90SHong Zhang ishift = 0; 21753e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2189566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja)); 219bfeeae90SHong Zhang } else if (oshift == 1) { 2201a83f524SJed Brown PetscInt *tia; 221d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2223b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&tia)); 2241a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2251a83f524SJed Brown *ia = tia; 226ecc77c7aSBarry Smith if (ja) { 2271a83f524SJed Brown PetscInt *tja; 2289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&tja)); 2291a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2301a83f524SJed Brown *ja = tja; 231ecc77c7aSBarry Smith } 2326945ee14SBarry Smith } else { 233ecc77c7aSBarry Smith *ia = a->i; 234ecc77c7aSBarry Smith if (ja) *ja = a->j; 235a2ce50c7SBarry Smith } 2363a40ed3dSBarry Smith PetscFunctionReturn(0); 237a2744918SBarry Smith } 238a2744918SBarry Smith 2391a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2406945ee14SBarry Smith { 2413a40ed3dSBarry Smith PetscFunctionBegin; 2423a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 243bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 2449566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2459566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 246bcd2baecSBarry Smith } 2473a40ed3dSBarry Smith PetscFunctionReturn(0); 24817ab2063SBarry Smith } 24917ab2063SBarry Smith 2501a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2513b2fbd54SBarry Smith { 2523b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 253d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25497f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2553b2fbd54SBarry Smith 2563a40ed3dSBarry Smith PetscFunctionBegin; 257899cda47SBarry Smith *nn = n; 2583a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2593b2fbd54SBarry Smith if (symmetric) { 2609566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja)); 2613b2fbd54SBarry Smith } else { 2629566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 2639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 2649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 2653b2fbd54SBarry Smith jj = a->j; 2663b2fbd54SBarry Smith for (i=0; i<nz; i++) { 267bfeeae90SHong Zhang collengths[jj[i]]++; 2683b2fbd54SBarry Smith } 2693b2fbd54SBarry Smith cia[0] = oshift; 2703b2fbd54SBarry Smith for (i=0; i<n; i++) { 2713b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2723b2fbd54SBarry Smith } 2739566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 2743b2fbd54SBarry Smith jj = a->j; 275a93ec695SBarry Smith for (row=0; row<m; row++) { 276a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 277a93ec695SBarry Smith for (i=0; i<mr; i++) { 278bfeeae90SHong Zhang col = *jj++; 2792205254eSKarl Rupp 2803b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2813b2fbd54SBarry Smith } 2823b2fbd54SBarry Smith } 2839566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2843b2fbd54SBarry Smith *ia = cia; *ja = cja; 2853b2fbd54SBarry Smith } 2863a40ed3dSBarry Smith PetscFunctionReturn(0); 2873b2fbd54SBarry Smith } 2883b2fbd54SBarry Smith 2891a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2903b2fbd54SBarry Smith { 2913a40ed3dSBarry Smith PetscFunctionBegin; 2923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2933b2fbd54SBarry Smith 2949566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2963a40ed3dSBarry Smith PetscFunctionReturn(0); 2973b2fbd54SBarry Smith } 2983b2fbd54SBarry Smith 2997cee066cSHong Zhang /* 3007cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 302040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3037cee066cSHong Zhang */ 3047cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3057cee066cSHong Zhang { 3067cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3077cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 308071fcb05SBarry Smith PetscInt nz = a->i[m],row,mr,col,tmp; 3097cee066cSHong Zhang PetscInt *cspidx; 310071fcb05SBarry Smith const PetscInt *jj; 3117cee066cSHong Zhang 3127cee066cSHong Zhang PetscFunctionBegin; 3137cee066cSHong Zhang *nn = n; 3147cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 315625f6d37SHong Zhang 3169566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 3179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 3189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cspidx)); 3207cee066cSHong Zhang jj = a->j; 3217cee066cSHong Zhang for (i=0; i<nz; i++) { 3227cee066cSHong Zhang collengths[jj[i]]++; 3237cee066cSHong Zhang } 3247cee066cSHong Zhang cia[0] = oshift; 3257cee066cSHong Zhang for (i=0; i<n; i++) { 3267cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3277cee066cSHong Zhang } 3289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 3297cee066cSHong Zhang jj = a->j; 3307cee066cSHong Zhang for (row=0; row<m; row++) { 3317cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3327cee066cSHong Zhang for (i=0; i<mr; i++) { 3337cee066cSHong Zhang col = *jj++; 334071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 335071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 336071fcb05SBarry Smith cja[tmp] = row + oshift; 3377cee066cSHong Zhang } 3387cee066cSHong Zhang } 3399566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 340071fcb05SBarry Smith *ia = cia; 341071fcb05SBarry Smith *ja = cja; 3427cee066cSHong Zhang *spidx = cspidx; 3437cee066cSHong Zhang PetscFunctionReturn(0); 3447cee066cSHong Zhang } 3457cee066cSHong Zhang 3467cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3477cee066cSHong Zhang { 3487cee066cSHong Zhang PetscFunctionBegin; 3499566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done)); 3509566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3517cee066cSHong Zhang PetscFunctionReturn(0); 3527cee066cSHong Zhang } 3537cee066cSHong Zhang 35487d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 35587d4246cSBarry Smith { 35687d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35787d4246cSBarry Smith PetscInt *ai = a->i; 358fff043a9SJunchao Zhang PetscScalar *aa; 35987d4246cSBarry Smith 36087d4246cSBarry Smith PetscFunctionBegin; 3619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 3629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa+ai[row],v,ai[row+1]-ai[row])); 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 36487d4246cSBarry Smith PetscFunctionReturn(0); 36587d4246cSBarry Smith } 36687d4246cSBarry Smith 367bd04181cSBarry Smith /* 368bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 369bd04181cSBarry Smith 370bd04181cSBarry Smith - a single row of values is set with each call 371bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 372bd04181cSBarry Smith - the values are always added to the matrix, not set 373bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 374bd04181cSBarry Smith 3751f763a69SBarry Smith This does NOT assume the global column indices are sorted 376bd04181cSBarry Smith 3771f763a69SBarry Smith */ 378bd04181cSBarry Smith 379af0996ceSBarry Smith #include <petsc/private/isimpl.h> 380189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 381189e4007SBarry Smith { 382189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3831f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3841f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 3851f763a69SBarry Smith PetscInt lastcol = -1; 386fff043a9SJunchao Zhang MatScalar *ap,value,*aa; 387189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 388189e4007SBarry Smith 389fff043a9SJunchao Zhang PetscFunctionBegin; 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 391f38dd0b8SBarry Smith row = ridx[im[0]]; 3921f763a69SBarry Smith rp = aj + ai[row]; 3931f763a69SBarry Smith ap = aa + ai[row]; 3941f763a69SBarry Smith nrow = ailen[row]; 395189e4007SBarry Smith low = 0; 396189e4007SBarry Smith high = nrow; 397189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 398189e4007SBarry Smith col = cidx[in[l]]; 399f38dd0b8SBarry Smith value = v[l]; 400189e4007SBarry Smith 401189e4007SBarry Smith if (col <= lastcol) low = 0; 402189e4007SBarry Smith else high = nrow; 403189e4007SBarry Smith lastcol = col; 404189e4007SBarry Smith while (high-low > 5) { 405189e4007SBarry Smith t = (low+high)/2; 406189e4007SBarry Smith if (rp[t] > col) high = t; 407189e4007SBarry Smith else low = t; 408189e4007SBarry Smith } 409189e4007SBarry Smith for (i=low; i<high; i++) { 410189e4007SBarry Smith if (rp[i] == col) { 4111f763a69SBarry Smith ap[i] += value; 412189e4007SBarry Smith low = i + 1; 4131f763a69SBarry Smith break; 414189e4007SBarry Smith } 415189e4007SBarry Smith } 416189e4007SBarry Smith } 4179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 418f38dd0b8SBarry Smith return 0; 419189e4007SBarry Smith } 420189e4007SBarry Smith 42197f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 42217ab2063SBarry Smith { 423416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 424e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 42597f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 426e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 427ce496241SStefano Zampini MatScalar *ap=NULL,value=0.0,*aa; 428ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 429ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 43017ab2063SBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 4329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 43317ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 434416022c9SBarry Smith row = im[k]; 4355ef9f2a5SBarry Smith if (row < 0) continue; 4366bdcaf15SBarry Smith PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 437720833daSHong Zhang rp = aj + ai[row]; 438876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 43917ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 440416022c9SBarry Smith low = 0; 441c71e6ed7SBarry Smith high = nrow; 44217ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4435ef9f2a5SBarry Smith if (in[l] < 0) continue; 4446bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 445bfeeae90SHong Zhang col = in[l]; 446071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m]; 447071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 44836db0b34SBarry Smith 4492205254eSKarl Rupp if (col <= lastcol) low = 0; 4502205254eSKarl Rupp else high = nrow; 451e2ee6c50SBarry Smith lastcol = col; 452416022c9SBarry Smith while (high-low > 5) { 453416022c9SBarry Smith t = (low+high)/2; 454416022c9SBarry Smith if (rp[t] > col) high = t; 455416022c9SBarry Smith else low = t; 45617ab2063SBarry Smith } 457416022c9SBarry Smith for (i=low; i<high; i++) { 45817ab2063SBarry Smith if (rp[i] > col) break; 45917ab2063SBarry Smith if (rp[i] == col) { 460876c6284SHong Zhang if (!A->structure_only) { 4610c0d7e18SFande Kong if (is == ADD_VALUES) { 4620c0d7e18SFande Kong ap[i] += value; 4630c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4640c0d7e18SFande Kong } 46517ab2063SBarry Smith else ap[i] = value; 466720833daSHong Zhang } 467e44c0bd4SBarry Smith low = i + 1; 46817ab2063SBarry Smith goto noinsert; 46917ab2063SBarry Smith } 47017ab2063SBarry Smith } 471dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 472c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 47308401ef6SPierre Jolivet PetscCheck(nonew != -1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix",row,col); 474720833daSHong Zhang if (A->structure_only) { 475876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 476720833daSHong Zhang } else { 477fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 478720833daSHong Zhang } 479c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 480416022c9SBarry Smith /* shift up all the later entries in this row */ 4819566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp+i+1,rp+i,N-i+1)); 48217ab2063SBarry Smith rp[i] = col; 483580bdb30SBarry Smith if (!A->structure_only) { 4849566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap+i+1,ap+i,N-i+1)); 485580bdb30SBarry Smith ap[i] = value; 486580bdb30SBarry Smith } 487416022c9SBarry Smith low = i + 1; 488e56f5c9eSBarry Smith A->nonzerostate++; 489e44c0bd4SBarry Smith noinsert:; 49017ab2063SBarry Smith } 49117ab2063SBarry Smith ailen[row] = nrow; 49217ab2063SBarry Smith } 4939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 4943a40ed3dSBarry Smith PetscFunctionReturn(0); 49517ab2063SBarry Smith } 49617ab2063SBarry Smith 49719b08ed1SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 49819b08ed1SBarry Smith { 49919b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 50019b08ed1SBarry Smith PetscInt *rp,k,row; 50119b08ed1SBarry Smith PetscInt *ai = a->i; 50219b08ed1SBarry Smith PetscInt *aj = a->j; 503fff043a9SJunchao Zhang MatScalar *aa,*ap; 50419b08ed1SBarry Smith 50519b08ed1SBarry Smith PetscFunctionBegin; 50628b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot call on assembled matrix."); 50708401ef6SPierre Jolivet PetscCheck(m*n+a->nz <= a->maxnz,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()",a->maxnz); 508fff043a9SJunchao Zhang 5099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 51019b08ed1SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 51119b08ed1SBarry Smith row = im[k]; 51219b08ed1SBarry Smith rp = aj + ai[row]; 51319b08ed1SBarry Smith ap = aa + ai[row]; 51419b08ed1SBarry Smith 5159566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 51619b08ed1SBarry Smith if (!A->structure_only) { 51719b08ed1SBarry Smith if (v) { 5189566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 51919b08ed1SBarry Smith v += n; 52019b08ed1SBarry Smith } else { 5219566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 52219b08ed1SBarry Smith } 52319b08ed1SBarry Smith } 52419b08ed1SBarry Smith a->ilen[row] = n; 52519b08ed1SBarry Smith a->imax[row] = n; 52619b08ed1SBarry Smith a->i[row+1] = a->i[row]+n; 52719b08ed1SBarry Smith a->nz += n; 52819b08ed1SBarry Smith } 5299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 53019b08ed1SBarry Smith PetscFunctionReturn(0); 53119b08ed1SBarry Smith } 53219b08ed1SBarry Smith 53319b08ed1SBarry Smith /*@ 53419b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith Input Parameters: 53719b08ed1SBarry Smith + A - the SeqAIJ matrix 53819b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith Level: advanced 54119b08ed1SBarry Smith 54219b08ed1SBarry Smith Notes: 54319b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 54419b08ed1SBarry Smith Simply call MatSetValues() after this call to provide the matrix entries in the usual manner. This matrix may be used 54519b08ed1SBarry Smith as always with multiple matrix assemblies. 54619b08ed1SBarry Smith 547db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 54819b08ed1SBarry Smith @*/ 54919b08ed1SBarry Smith 55019b08ed1SBarry Smith PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A,PetscInt nztotal) 55119b08ed1SBarry Smith { 55219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 55319b08ed1SBarry Smith 55419b08ed1SBarry Smith PetscFunctionBegin; 5559566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 55719b08ed1SBarry Smith a->maxnz = nztotal; 55819b08ed1SBarry Smith if (!a->imax) { 5599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->imax)); 5609566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith if (!a->ilen) { 5639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->ilen)); 5649566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56519b08ed1SBarry Smith } else { 5669566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen,A->rmap->n*sizeof(PetscInt))); 56719b08ed1SBarry Smith } 56819b08ed1SBarry Smith 56919b08ed1SBarry Smith /* allocate the matrix space */ 57019b08ed1SBarry Smith if (A->structure_only) { 5719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal,&a->j)); 5729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&a->i)); 5739566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*sizeof(PetscInt))); 57419b08ed1SBarry Smith } else { 5759566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal,&a->a,nztotal,&a->j,A->rmap->n+1,&a->i)); 5769566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*(sizeof(PetscScalar)+sizeof(PetscInt)))); 57719b08ed1SBarry Smith } 57819b08ed1SBarry Smith a->i[0] = 0; 57919b08ed1SBarry Smith if (A->structure_only) { 58019b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 58119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 58219b08ed1SBarry Smith } else { 58319b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 58419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 58519b08ed1SBarry Smith } 58619b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 58719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 58819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 58919b08ed1SBarry Smith PetscFunctionReturn(0); 59019b08ed1SBarry Smith } 59119b08ed1SBarry Smith 592071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 593071fcb05SBarry Smith { 594071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 595071fcb05SBarry Smith PetscInt *rp,k,row; 596071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 597071fcb05SBarry Smith PetscInt *aj = a->j; 598fff043a9SJunchao Zhang MatScalar *aa,*ap; 599071fcb05SBarry Smith 600071fcb05SBarry Smith PetscFunctionBegin; 6019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 602071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 603071fcb05SBarry Smith row = im[k]; 6046bdcaf15SBarry Smith PetscCheck(n <= a->imax[row],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Preallocation for row %" PetscInt_FMT " does not match number of columns provided",n); 605071fcb05SBarry Smith rp = aj + ai[row]; 606071fcb05SBarry Smith ap = aa + ai[row]; 607071fcb05SBarry Smith if (!A->was_assembled) { 6089566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 609071fcb05SBarry Smith } 610071fcb05SBarry Smith if (!A->structure_only) { 611071fcb05SBarry Smith if (v) { 6129566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 613071fcb05SBarry Smith v += n; 614071fcb05SBarry Smith } else { 6159566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 616071fcb05SBarry Smith } 617071fcb05SBarry Smith } 618071fcb05SBarry Smith ailen[row] = n; 619071fcb05SBarry Smith a->nz += n; 620071fcb05SBarry Smith } 6219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 622071fcb05SBarry Smith PetscFunctionReturn(0); 623071fcb05SBarry Smith } 624071fcb05SBarry Smith 625a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 6267eb43aa7SLois Curfman McInnes { 6277eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 62897f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 62997f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 630fff043a9SJunchao Zhang MatScalar *ap,*aa; 6317eb43aa7SLois Curfman McInnes 6323a40ed3dSBarry Smith PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 6347eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 6357eb43aa7SLois Curfman McInnes row = im[k]; 63654c59aa7SJacob Faibussowitsch if (row < 0) {v += n; continue;} /* negative row */ 63754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 638bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 6397eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6407eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 64154c59aa7SJacob Faibussowitsch if (in[l] < 0) {v++; continue;} /* negative column */ 64254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 643bfeeae90SHong Zhang col = in[l]; 6447eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 6457eb43aa7SLois Curfman McInnes while (high-low > 5) { 6467eb43aa7SLois Curfman McInnes t = (low+high)/2; 6477eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6487eb43aa7SLois Curfman McInnes else low = t; 6497eb43aa7SLois Curfman McInnes } 6507eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 6517eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6527eb43aa7SLois Curfman McInnes if (rp[i] == col) { 653b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6547eb43aa7SLois Curfman McInnes goto finished; 6557eb43aa7SLois Curfman McInnes } 6567eb43aa7SLois Curfman McInnes } 65797e567efSBarry Smith *v++ = 0.0; 6587eb43aa7SLois Curfman McInnes finished:; 6597eb43aa7SLois Curfman McInnes } 6607eb43aa7SLois Curfman McInnes } 6619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 6623a40ed3dSBarry Smith PetscFunctionReturn(0); 6637eb43aa7SLois Curfman McInnes } 6647eb43aa7SLois Curfman McInnes 6653ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 66617ab2063SBarry Smith { 6673ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 668c898d852SStefano Zampini const PetscScalar *av; 6693ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6703ea6fe3dSLisandro Dalcin PetscInt *rowlens; 67117ab2063SBarry Smith 6723a40ed3dSBarry Smith PetscFunctionBegin; 6739566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6742205254eSKarl Rupp 6753ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6763ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6773ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6783ea6fe3dSLisandro Dalcin nz = A->nz; 679416022c9SBarry Smith 6803ea6fe3dSLisandro Dalcin /* write matrix header */ 6813ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6823ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6839566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,header,4,PETSC_INT)); 684416022c9SBarry Smith 6853ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&rowlens)); 6873ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6889566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT)); 6899566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6903ea6fe3dSLisandro Dalcin /* store column indices */ 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT)); 692416022c9SBarry Smith /* store nonzero values */ 6939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat,&av)); 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,av,nz,PETSC_SCALAR)); 6959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat,&av)); 696b37d52dbSMark F. Adams 6973ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6989566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat,viewer)); 6993a40ed3dSBarry Smith PetscFunctionReturn(0); 70017ab2063SBarry Smith } 701416022c9SBarry Smith 7027dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 7037dc0baabSHong Zhang { 7047dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7057dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 7067dc0baabSHong Zhang 7077dc0baabSHong Zhang PetscFunctionBegin; 7089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7097dc0baabSHong Zhang for (i=0; i<m; i++) { 7109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 7117dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 7129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ") ",a->j[k])); 7137dc0baabSHong Zhang } 7149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 7157dc0baabSHong Zhang } 7169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 7177dc0baabSHong Zhang PetscFunctionReturn(0); 7187dc0baabSHong Zhang } 7197dc0baabSHong Zhang 72009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 721cd155464SBarry Smith 722dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 723416022c9SBarry Smith { 724416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 725c898d852SStefano Zampini const PetscScalar *av; 72660e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 727e060cb09SBarry Smith const char *name; 728f3ef73ceSBarry Smith PetscViewerFormat format; 72917ab2063SBarry Smith 7303a40ed3dSBarry Smith PetscFunctionBegin; 7317dc0baabSHong Zhang if (A->structure_only) { 7329566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A,viewer)); 7337dc0baabSHong Zhang PetscFunctionReturn(0); 7347dc0baabSHong Zhang } 73543e49210SHong Zhang 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 7372e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7382e5835c6SStefano Zampini 739c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 7419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 74271c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 74397f1f81fSBarry Smith PetscInt nofinalvalue = 0; 74460e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 745c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 746d00d2cf4SBarry Smith nofinalvalue = 1; 747d00d2cf4SBarry Smith } 7489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n",m,A->cmap->n)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %" PetscInt_FMT " \n",a->nz)); 751fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",4);\n",a->nz+nofinalvalue)); 753fbfe6fa7SJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",3);\n",a->nz+nofinalvalue)); 755fbfe6fa7SJed Brown #endif 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = [\n")); 75717ab2063SBarry Smith 75817ab2063SBarry Smith for (i=0; i<m; i++) { 75960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 760aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 76217ab2063SBarry Smith #else 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",i+1,a->j[j]+1,(double)a->a[j])); 76417ab2063SBarry Smith #endif 76517ab2063SBarry Smith } 76617ab2063SBarry Smith } 767d00d2cf4SBarry Smith if (nofinalvalue) { 768c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",m,A->cmap->n,0.,0.)); 770c337ccceSJed Brown #else 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",m,A->cmap->n,0.0)); 772c337ccceSJed Brown #endif 773d00d2cf4SBarry Smith } 7749566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A,&name)); 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name)); 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 777fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 77944cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 78160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 78536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 78736db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 7896831982aSBarry Smith } 79044cd7ae7SLois Curfman McInnes #else 7919566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 79244cd7ae7SLois Curfman McInnes #endif 79344cd7ae7SLois Curfman McInnes } 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 79544cd7ae7SLois Curfman McInnes } 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 797fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 79897f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&sptr)); 801496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 802496be53dSLois Curfman McInnes sptr[i] = nzd+1; 80360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 804496be53dSLois Curfman McInnes if (a->j[j] >= i) { 805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 807496be53dSLois Curfman McInnes #else 808496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 809496be53dSLois Curfman McInnes #endif 810496be53dSLois Curfman McInnes } 811496be53dSLois Curfman McInnes } 812496be53dSLois Curfman McInnes } 8132e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 8149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n\n",m,nzd)); 8152e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 8162205254eSKarl Rupp if (i+4<m) { 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5])); 8182205254eSKarl Rupp } else if (i+3<m) { 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4])); 8202205254eSKarl Rupp } else if (i+2<m) { 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3])); 8222205254eSKarl Rupp } else if (i+1<m) { 8239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2])); 8242205254eSKarl Rupp } else if (i<m) { 8259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1])); 8262205254eSKarl Rupp } else { 8279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT "\n",sptr[i])); 8282205254eSKarl Rupp } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 8319566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 832496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 83360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8349566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " ",a->j[j]+fshift)); 835496be53dSLois Curfman McInnes } 8369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 837496be53dSLois Curfman McInnes } 8389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 839496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 84060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 841496be53dSLois Curfman McInnes if (a->j[j] >= i) { 842aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 8449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 8456831982aSBarry Smith } 846496be53dSLois Curfman McInnes #else 8479566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j])); 848496be53dSLois Curfman McInnes #endif 849496be53dSLois Curfman McInnes } 850496be53dSLois Curfman McInnes } 8519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 852496be53dSLois Curfman McInnes } 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 854fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 85597f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 85687828ca2SBarry Smith PetscScalar value; 85768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 85968f1ed48SBarry Smith 86068f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 86168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 86268f1ed48SBarry Smith realonly = PETSC_FALSE; 86368f1ed48SBarry Smith break; 86468f1ed48SBarry Smith } 86568f1ed48SBarry Smith } 86668f1ed48SBarry Smith #endif 86702594712SBarry Smith 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 86902594712SBarry Smith for (i=0; i<m; i++) { 87002594712SBarry Smith jcnt = 0; 871d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 872e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 87302594712SBarry Smith value = a->a[cnt++]; 874e24b481bSBarry Smith jcnt++; 87502594712SBarry Smith } else { 87602594712SBarry Smith value = 0.0; 87702594712SBarry Smith } 878aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 87968f1ed48SBarry Smith if (realonly) { 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value))); 88168f1ed48SBarry Smith } else { 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value))); 88368f1ed48SBarry Smith } 88402594712SBarry Smith #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value)); 88602594712SBarry Smith #endif 88702594712SBarry Smith } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 88902594712SBarry Smith } 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 8913c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 892150b93efSMatthew G. Knepley PetscInt fshift=1; 8939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8943c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n")); 8963c215bfdSMatthew Knepley #else 8979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n")); 8983c215bfdSMatthew Knepley #endif 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 9003c215bfdSMatthew Knepley for (i=0; i<m; i++) { 90160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 9023c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 9043c215bfdSMatthew Knepley #else 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j])); 9063c215bfdSMatthew Knepley #endif 9073c215bfdSMatthew Knepley } 9083c215bfdSMatthew Knepley } 9099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 9103a40ed3dSBarry Smith } else { 9119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 912d5f3da31SBarry Smith if (A->factortype) { 91316cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 91516cd7e1dSShri Abhyankar /* L part */ 91660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 91716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 92016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 92216cd7e1dSShri Abhyankar } else { 9239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 92416cd7e1dSShri Abhyankar } 92516cd7e1dSShri Abhyankar #else 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 92716cd7e1dSShri Abhyankar #endif 92816cd7e1dSShri Abhyankar } 92916cd7e1dSShri Abhyankar /* diagonal */ 93016cd7e1dSShri Abhyankar j = a->diag[i]; 93116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 93216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]))); 93416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])))); 93616cd7e1dSShri Abhyankar } else { 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]))); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar #else 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)(1.0/a->a[j]))); 94116cd7e1dSShri Abhyankar #endif 94216cd7e1dSShri Abhyankar 94316cd7e1dSShri Abhyankar /* U part */ 94460e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 94516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 94616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 94816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 95016cd7e1dSShri Abhyankar } else { 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 95216cd7e1dSShri Abhyankar } 95316cd7e1dSShri Abhyankar #else 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 95516cd7e1dSShri Abhyankar #endif 95616cd7e1dSShri Abhyankar } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 95816cd7e1dSShri Abhyankar } 95916cd7e1dSShri Abhyankar } else { 96017ab2063SBarry Smith for (i=0; i<m; i++) { 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 96260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 963aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 96436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 96636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 9683a40ed3dSBarry Smith } else { 9699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 97017ab2063SBarry Smith } 97117ab2063SBarry Smith #else 9729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 97317ab2063SBarry Smith #endif 97417ab2063SBarry Smith } 9759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 97617ab2063SBarry Smith } 97716cd7e1dSShri Abhyankar } 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 97917ab2063SBarry Smith } 9809566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9813a40ed3dSBarry Smith PetscFunctionReturn(0); 982416022c9SBarry Smith } 983416022c9SBarry Smith 9849804daf3SBarry Smith #include <petscdraw.h> 985dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 986416022c9SBarry Smith { 987480ef9eaSBarry Smith Mat A = (Mat) Aa; 988416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 989383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 990383922c3SLisandro Dalcin int color; 991b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 992b0a32e0cSBarry Smith PetscViewer viewer; 993f3ef73ceSBarry Smith PetscViewerFormat format; 994fff043a9SJunchao Zhang const PetscScalar *aa; 995cddf8d76SBarry Smith 9963a40ed3dSBarry Smith PetscFunctionBegin; 9979566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer)); 9989566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 9999566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr)); 1000383922c3SLisandro Dalcin 1001416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 10029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1003fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1004d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10050513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 1006b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1007416022c9SBarry Smith for (i=0; i<m; i++) { 1008cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1009bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1010bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1011fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 10129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1013cddf8d76SBarry Smith } 1014cddf8d76SBarry Smith } 1015b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 1016cddf8d76SBarry Smith for (i=0; i<m; i++) { 1017cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1018bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1019bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1020fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10219566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1022cddf8d76SBarry Smith } 1023cddf8d76SBarry Smith } 1024b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1025cddf8d76SBarry Smith for (i=0; i<m; i++) { 1026cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1027bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1028bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1029fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10309566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1031416022c9SBarry Smith } 1032416022c9SBarry Smith } 1033d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10340513a670SBarry Smith } else { 10350513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10360513a670SBarry Smith /* first determine max of all nonzero values */ 1037b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1038383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1039b0a32e0cSBarry Smith PetscDraw popup; 10400513a670SBarry Smith 10410513a670SBarry Smith for (i=0; i<nz; i++) { 1042fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10430513a670SBarry Smith } 1044383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10459566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw,&popup)); 10469566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup,minv,maxv)); 1047383922c3SLisandro Dalcin 1048d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10490513a670SBarry Smith for (i=0; i<m; i++) { 1050383922c3SLisandro Dalcin y_l = m - i - 1.0; 1051383922c3SLisandro Dalcin y_r = y_l + 1.0; 1052bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1053383922c3SLisandro Dalcin x_l = a->j[j]; 1054383922c3SLisandro Dalcin x_r = x_l + 1.0; 1055fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]),minv,maxv); 10569566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 10570513a670SBarry Smith count++; 10580513a670SBarry Smith } 10590513a670SBarry Smith } 1060d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10610513a670SBarry Smith } 10629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1063480ef9eaSBarry Smith PetscFunctionReturn(0); 1064480ef9eaSBarry Smith } 1065cddf8d76SBarry Smith 10669804daf3SBarry Smith #include <petscdraw.h> 1067dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 1068480ef9eaSBarry Smith { 1069b0a32e0cSBarry Smith PetscDraw draw; 107036db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1071ace3abfcSBarry Smith PetscBool isnull; 1072480ef9eaSBarry Smith 1073480ef9eaSBarry Smith PetscFunctionBegin; 10749566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer,0,&draw)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw,&isnull)); 1076480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1077480ef9eaSBarry Smith 1078d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1079480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 10809566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw,xl,yl,xr,yr)); 10819566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer)); 10829566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A)); 10839566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL)); 10849566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 1086416022c9SBarry Smith } 1087416022c9SBarry Smith 1088dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1089416022c9SBarry Smith { 1090ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1091416022c9SBarry Smith 10923a40ed3dSBarry Smith PetscFunctionBegin; 10939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii)); 10949566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw)); 1096c45a1595SBarry Smith if (iascii) { 10979566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII(A,viewer)); 10980f5bd95cSBarry Smith } else if (isbinary) { 10999566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Binary(A,viewer)); 11000f5bd95cSBarry Smith } else if (isdraw) { 11019566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Draw(A,viewer)); 110211aeaf0aSBarry Smith } 11039566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A,viewer)); 11043a40ed3dSBarry Smith PetscFunctionReturn(0); 110517ab2063SBarry Smith } 110619bcc07fSBarry Smith 1107dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 110817ab2063SBarry Smith { 1109416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1110580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1111d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 111254f21887SBarry Smith MatScalar *aa = a->a,*ap; 11133447b6efSHong Zhang PetscReal ratio = 0.6; 111417ab2063SBarry Smith 11153a40ed3dSBarry Smith PetscFunctionBegin; 11163a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 11179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1118b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1119b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11209566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 1121b215bc84SStefano Zampini PetscFunctionReturn(0); 1122b215bc84SStefano Zampini } 112317ab2063SBarry Smith 112443ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 112517ab2063SBarry Smith for (i=1; i<m; i++) { 1126416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 112717ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 112894a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 112917ab2063SBarry Smith if (fshift) { 1130bfeeae90SHong Zhang ip = aj + ai[i]; 1131bfeeae90SHong Zhang ap = aa + ai[i]; 113217ab2063SBarry Smith N = ailen[i]; 11339566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip-fshift,ip,N)); 1134580bdb30SBarry Smith if (!A->structure_only) { 11359566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap-fshift,ap,N)); 113617ab2063SBarry Smith } 113717ab2063SBarry Smith } 113817ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 113917ab2063SBarry Smith } 114017ab2063SBarry Smith if (m) { 114117ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 114217ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 114317ab2063SBarry Smith } 11447b083b7cSBarry Smith 114517ab2063SBarry Smith /* reset ilen and imax for each row */ 11467b083b7cSBarry Smith a->nonzerorowcnt = 0; 1147396832f4SHong Zhang if (A->structure_only) { 11489566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11499566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1150396832f4SHong Zhang } else { /* !A->structure_only */ 115117ab2063SBarry Smith for (i=0; i<m; i++) { 115217ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 11537b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 115417ab2063SBarry Smith } 1155396832f4SHong Zhang } 1156bfeeae90SHong Zhang a->nz = ai[m]; 1157aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1,PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 115817ab2063SBarry Smith 11599566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11609566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n",m,A->cmap->n,fshift,a->nz)); 11619566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n",a->reallocs)); 11629566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Maximum nonzeros in any row is %" PetscInt_FMT "\n",rmax)); 11632205254eSKarl Rupp 11648e58a170SBarry Smith A->info.mallocs += a->reallocs; 1165dd5f02e7SSatish Balay a->reallocs = 0; 11666712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 116736db0b34SBarry Smith a->rmax = rmax; 11684e220ebcSLois Curfman McInnes 1169396832f4SHong Zhang if (!A->structure_only) { 11709566063dSJacob Faibussowitsch PetscCall(MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio)); 1171396832f4SHong Zhang } 11729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 11733a40ed3dSBarry Smith PetscFunctionReturn(0); 117417ab2063SBarry Smith } 117517ab2063SBarry Smith 117699cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 117799cafbc1SBarry Smith { 117899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 117999cafbc1SBarry Smith PetscInt i,nz = a->nz; 11802e5835c6SStefano Zampini MatScalar *aa; 118199cafbc1SBarry Smith 118299cafbc1SBarry Smith PetscFunctionBegin; 11839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 118499cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 11859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 118799cafbc1SBarry Smith PetscFunctionReturn(0); 118899cafbc1SBarry Smith } 118999cafbc1SBarry Smith 119099cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 119199cafbc1SBarry Smith { 119299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 119399cafbc1SBarry Smith PetscInt i,nz = a->nz; 11942e5835c6SStefano Zampini MatScalar *aa; 119599cafbc1SBarry Smith 119699cafbc1SBarry Smith PetscFunctionBegin; 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 119899cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 120199cafbc1SBarry Smith PetscFunctionReturn(0); 120299cafbc1SBarry Smith } 120399cafbc1SBarry Smith 1204dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 120517ab2063SBarry Smith { 1206fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1207fff043a9SJunchao Zhang MatScalar *aa; 12083a40ed3dSBarry Smith 12093a40ed3dSBarry Smith PetscFunctionBegin; 12109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A,&aa)); 12119566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa,a->i[A->rmap->n])); 12129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A,&aa)); 12139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12143a40ed3dSBarry Smith PetscFunctionReturn(0); 121517ab2063SBarry Smith } 1216416022c9SBarry Smith 1217cbc6b225SStefano Zampini PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1218cbc6b225SStefano Zampini { 1219cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1220cbc6b225SStefano Zampini 1221cbc6b225SStefano Zampini PetscFunctionBegin; 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1224cbc6b225SStefano Zampini PetscFunctionReturn(0); 1225cbc6b225SStefano Zampini } 1226cbc6b225SStefano Zampini 1227dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 122817ab2063SBarry Smith { 1229416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1230d5d45c9bSBarry Smith 12313a40ed3dSBarry Smith PetscFunctionBegin; 1232aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1233c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A,"Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT,A->rmap->n,A->cmap->n,a->nz); 123417ab2063SBarry Smith #endif 12359566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i)); 12369566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12389566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12399566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12409566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12419566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12429566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12439566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12449566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag,a->mdiag,a->ssor_work)); 12459566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12469566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12479566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12489566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i,a->compressedrow.rindex)); 12499566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12509566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1251901853e0SKris Buschelman 12526718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12536718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12546718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12556718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12566718818eSStefano Zampini due to different matrix sizes */ 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL)); 12586718818eSStefano Zampini 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A,NULL)); 12602e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEnginePut_C",NULL)); 12612e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEngineGet_C",NULL)); 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL)); 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL)); 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL)); 12682e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijsell_C",NULL)); 12692e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12702e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijmkl_C",NULL)); 12712e956fe4SStefano Zampini #endif 12724222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",NULL)); 12764222ddf1SHong Zhang #endif 12773d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijkokkos_C",NULL)); 12793d0639e7SStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL)); 1281af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL)); 1283af8000cdSHong Zhang #endif 1284d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_scalapack_C",NULL)); 1286d24d4204SJose E. Roman #endif 128763c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL)); 129063c07aadSStefano Zampini #endif 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsHermitianTranspose_C",NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL)); 13029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL)); 13039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJKron_C",NULL)); 13049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL)); 13059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL)); 13062e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverType_C",NULL)); 13072e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijsell_seqaij_C",NULL)); 13092e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijperm_seqaij_C",NULL)); 13102e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijviennacl_C",NULL)); 13112e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqdense_C",NULL)); 13122e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqaij_C",NULL)); 13133a40ed3dSBarry Smith PetscFunctionReturn(0); 131417ab2063SBarry Smith } 131517ab2063SBarry Smith 1316ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 131717ab2063SBarry Smith { 1318416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 13193a40ed3dSBarry Smith 13203a40ed3dSBarry Smith PetscFunctionBegin; 1321a65d3064SKris Buschelman switch (op) { 1322a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 13234e0d8c25SBarry Smith a->roworiented = flg; 1324a65d3064SKris Buschelman break; 1325a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1326a9817697SBarry Smith a->keepnonzeropattern = flg; 1327a65d3064SKris Buschelman break; 1328512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1329512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1330a65d3064SKris Buschelman break; 1331a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13324e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1333a65d3064SKris Buschelman break; 1334a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 13354e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1336a65d3064SKris Buschelman break; 133728b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 133828b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 133928b2fa4aSMatthew Knepley break; 1340a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 13414e0d8c25SBarry Smith a->ignorezeroentries = flg; 13420df259c2SBarry Smith break; 13433d472b54SHong Zhang case MAT_SPD: 1344b1646e73SJed Brown case MAT_SYMMETRIC: 1345b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1346b1646e73SJed Brown case MAT_HERMITIAN: 1347b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1348957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 13495021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 13505021d80fSJed Brown break; 13518c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1352a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1353a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 13549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Option %s ignored\n",MatOptions[op])); 1355a65d3064SKris Buschelman break; 1356b87ac2d8SJed Brown case MAT_USE_INODES: 13579566063dSJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A,MAT_USE_INODES,flg)); 1358b87ac2d8SJed Brown break; 1359c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1360c10200c1SHong Zhang A->submat_singleis = flg; 1361c10200c1SHong Zhang break; 1362071fcb05SBarry Smith case MAT_SORTED_FULL: 1363071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1364071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1365071fcb05SBarry Smith break; 13661a2c6b5cSJunchao Zhang case MAT_FORM_EXPLICIT_TRANSPOSE: 13671a2c6b5cSJunchao Zhang A->form_explicit_transpose = flg; 13681a2c6b5cSJunchao Zhang break; 1369a65d3064SKris Buschelman default: 137098921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1371a65d3064SKris Buschelman } 13723a40ed3dSBarry Smith PetscFunctionReturn(0); 137317ab2063SBarry Smith } 137417ab2063SBarry Smith 1375dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 137617ab2063SBarry Smith { 1377416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1378fdc842d1SBarry Smith PetscInt i,j,n,*ai=a->i,*aj=a->j; 1379c898d852SStefano Zampini PetscScalar *x; 1380c898d852SStefano Zampini const PetscScalar *aa; 138117ab2063SBarry Smith 13823a40ed3dSBarry Smith PetscFunctionBegin; 13839566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 138408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1386d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1387d3e70bfaSHong Zhang PetscInt *diag=a->diag; 13889566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 13892c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 13909566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 13919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 139235e7444dSHong Zhang PetscFunctionReturn(0); 139335e7444dSHong Zhang } 139435e7444dSHong Zhang 13959566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 139635e7444dSHong Zhang for (i=0; i<n; i++) { 1397fdc842d1SBarry Smith x[i] = 0.0; 139835e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 139935e7444dSHong Zhang if (aj[j] == i) { 140035e7444dSHong Zhang x[i] = aa[j]; 140117ab2063SBarry Smith break; 140217ab2063SBarry Smith } 140317ab2063SBarry Smith } 140417ab2063SBarry Smith } 14059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 14069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14073a40ed3dSBarry Smith PetscFunctionReturn(0); 140817ab2063SBarry Smith } 140917ab2063SBarry Smith 1410c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1411dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 141217ab2063SBarry Smith { 1413416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14145f22a7b3SSebastian Grimberg const MatScalar *aa; 1415d9ca1df4SBarry Smith PetscScalar *y; 1416d9ca1df4SBarry Smith const PetscScalar *x; 1417d0f46423SBarry Smith PetscInt m = A->rmap->n; 14185c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14195f22a7b3SSebastian Grimberg const MatScalar *v; 1420a77337e4SBarry Smith PetscScalar alpha; 1421d9ca1df4SBarry Smith PetscInt n,i,j; 1422d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 14233447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1424ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14255c897100SBarry Smith #endif 142617ab2063SBarry Smith 14273a40ed3dSBarry Smith PetscFunctionBegin; 14289566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz,yy)); 14299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14309566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 14319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 14325c897100SBarry Smith 14335c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1434fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,aa,y); 14355c897100SBarry Smith #else 14363447b6efSHong Zhang if (usecprow) { 14373447b6efSHong Zhang m = cprow.nrows; 14383447b6efSHong Zhang ii = cprow.i; 14397b2bb3b9SHong Zhang ridx = cprow.rindex; 14403447b6efSHong Zhang } else { 14413447b6efSHong Zhang ii = a->i; 14423447b6efSHong Zhang } 144317ab2063SBarry Smith for (i=0; i<m; i++) { 14443447b6efSHong Zhang idx = a->j + ii[i]; 1445fff043a9SJunchao Zhang v = aa + ii[i]; 14463447b6efSHong Zhang n = ii[i+1] - ii[i]; 14473447b6efSHong Zhang if (usecprow) { 14487b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14493447b6efSHong Zhang } else { 145017ab2063SBarry Smith alpha = x[i]; 14513447b6efSHong Zhang } 145204fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 145317ab2063SBarry Smith } 14545c897100SBarry Smith #endif 14559566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 14569566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 14579566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 14589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14593a40ed3dSBarry Smith PetscFunctionReturn(0); 146017ab2063SBarry Smith } 146117ab2063SBarry Smith 1462dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 14635c897100SBarry Smith { 14645c897100SBarry Smith PetscFunctionBegin; 14659566063dSJacob Faibussowitsch PetscCall(VecSet(yy,0.0)); 14669566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy)); 14675c897100SBarry Smith PetscFunctionReturn(0); 14685c897100SBarry Smith } 14695c897100SBarry Smith 1470c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 147178b84d54SShri Abhyankar 1472dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 147317ab2063SBarry Smith { 1474416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1475d9fead3dSBarry Smith PetscScalar *y; 147654f21887SBarry Smith const PetscScalar *x; 1477fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1478003131ecSBarry Smith PetscInt m=A->rmap->n; 14790298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 14807b083b7cSBarry Smith PetscInt n,i; 1481362ced78SSatish Balay PetscScalar sum; 1482ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 148317ab2063SBarry Smith 1484b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 148597952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1486fee21e36SBarry Smith #endif 1487fee21e36SBarry Smith 14883a40ed3dSBarry Smith PetscFunctionBegin; 1489b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14909566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A,xx,yy)); 1491b215bc84SStefano Zampini PetscFunctionReturn(0); 1492b215bc84SStefano Zampini } 14939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 14949566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14959566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1496416022c9SBarry Smith ii = a->i; 14974eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14989566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y,m)); 149997952fefSHong Zhang m = a->compressedrow.nrows; 150097952fefSHong Zhang ii = a->compressedrow.i; 150197952fefSHong Zhang ridx = a->compressedrow.rindex; 150297952fefSHong Zhang for (i=0; i<m; i++) { 150397952fefSHong Zhang n = ii[i+1] - ii[i]; 150497952fefSHong Zhang aj = a->j + ii[i]; 1505fff043a9SJunchao Zhang aa = a_a + ii[i]; 150697952fefSHong Zhang sum = 0.0; 1507003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1508003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150997952fefSHong Zhang y[*ridx++] = sum; 151097952fefSHong Zhang } 151197952fefSHong Zhang } else { /* do not use compressed row format */ 1512b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15133d3eaba7SBarry Smith aj = a->j; 1514fff043a9SJunchao Zhang aa = a_a; 1515b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1516b05257ddSBarry Smith #else 151717ab2063SBarry Smith for (i=0; i<m; i++) { 1518003131ecSBarry Smith n = ii[i+1] - ii[i]; 1519003131ecSBarry Smith aj = a->j + ii[i]; 1520fff043a9SJunchao Zhang aa = a_a + ii[i]; 152117ab2063SBarry Smith sum = 0.0; 1522003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 152317ab2063SBarry Smith y[i] = sum; 152417ab2063SBarry Smith } 15258d195f9aSBarry Smith #endif 1526b05257ddSBarry Smith } 15279566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - a->nonzerorowcnt)); 15289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15299566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 15313a40ed3dSBarry Smith PetscFunctionReturn(0); 153217ab2063SBarry Smith } 153317ab2063SBarry Smith 1534b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1535b434eb95SMatthew G. Knepley { 1536b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1537b434eb95SMatthew G. Knepley PetscScalar *y; 1538b434eb95SMatthew G. Knepley const PetscScalar *x; 1539fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1540b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1541b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1542b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1543b434eb95SMatthew G. Knepley PetscScalar sum; 1544b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1545b434eb95SMatthew G. Knepley 1546b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1547b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1548b434eb95SMatthew G. Knepley #endif 1549b434eb95SMatthew G. Knepley 1550b434eb95SMatthew G. Knepley PetscFunctionBegin; 15519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15529566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15539566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1554b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1555b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1556b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1557b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1558b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1559b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1560b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1561fff043a9SJunchao Zhang aa = a_a + ii[i]; 1562b434eb95SMatthew G. Knepley sum = 0.0; 1563b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1564b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1565b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1566b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1567b434eb95SMatthew G. Knepley } 1568b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15693d3eaba7SBarry Smith ii = a->i; 1570b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1571b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1572b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1573fff043a9SJunchao Zhang aa = a_a + ii[i]; 1574b434eb95SMatthew G. Knepley sum = 0.0; 1575b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1576b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1577b434eb95SMatthew G. Knepley y[i] = sum; 1578b434eb95SMatthew G. Knepley } 1579b434eb95SMatthew G. Knepley } 15809566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - nonzerorow)); 15819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15829566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1584b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1585b434eb95SMatthew G. Knepley } 1586b434eb95SMatthew G. Knepley 1587b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1588b434eb95SMatthew G. Knepley { 1589b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1590b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1591b434eb95SMatthew G. Knepley const PetscScalar *x; 1592fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1593b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1594b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1595b434eb95SMatthew G. Knepley PetscScalar sum; 1596b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1597b434eb95SMatthew G. Knepley 1598b434eb95SMatthew G. Knepley PetscFunctionBegin; 15999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16009566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16019566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 1602b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1603b434eb95SMatthew G. Knepley if (zz != yy) { 16049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 1605b434eb95SMatthew G. Knepley } 1606b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1607b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1608b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1609b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1610b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1611b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1612fff043a9SJunchao Zhang aa = a_a + ii[i]; 1613b434eb95SMatthew G. Knepley sum = y[*ridx]; 1614b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1615b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1616b434eb95SMatthew G. Knepley } 1617b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16183d3eaba7SBarry Smith ii = a->i; 1619b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1620b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1621b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1622fff043a9SJunchao Zhang aa = a_a + ii[i]; 1623b434eb95SMatthew G. Knepley sum = y[i]; 1624b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1625b434eb95SMatthew G. Knepley z[i] = sum; 1626b434eb95SMatthew G. Knepley } 1627b434eb95SMatthew G. Knepley } 16289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16299566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16309566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1632b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1633b434eb95SMatthew G. Knepley } 1634b434eb95SMatthew G. Knepley 1635c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1636dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 163717ab2063SBarry Smith { 1638416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1639f15663dcSBarry Smith PetscScalar *y,*z; 1640f15663dcSBarry Smith const PetscScalar *x; 1641fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1642d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1643d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1644362ced78SSatish Balay PetscScalar sum; 1645ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 16469ea0dfa2SSatish Balay 16473a40ed3dSBarry Smith PetscFunctionBegin; 1648b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16499566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A,xx,yy,zz)); 1650b215bc84SStefano Zampini PetscFunctionReturn(0); 1651b215bc84SStefano Zampini } 16529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16539566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16549566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 16554eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 16564eb6d288SHong Zhang if (zz != yy) { 16579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 16584eb6d288SHong Zhang } 165997952fefSHong Zhang m = a->compressedrow.nrows; 166097952fefSHong Zhang ii = a->compressedrow.i; 166197952fefSHong Zhang ridx = a->compressedrow.rindex; 166297952fefSHong Zhang for (i=0; i<m; i++) { 166397952fefSHong Zhang n = ii[i+1] - ii[i]; 166497952fefSHong Zhang aj = a->j + ii[i]; 1665fff043a9SJunchao Zhang aa = a_a + ii[i]; 166697952fefSHong Zhang sum = y[*ridx]; 1667f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 166897952fefSHong Zhang z[*ridx++] = sum; 166997952fefSHong Zhang } 167097952fefSHong Zhang } else { /* do not use compressed row format */ 16713d3eaba7SBarry Smith ii = a->i; 1672f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16733d3eaba7SBarry Smith aj = a->j; 1674fff043a9SJunchao Zhang aa = a_a; 1675f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1676f15663dcSBarry Smith #else 167717ab2063SBarry Smith for (i=0; i<m; i++) { 1678f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1679f15663dcSBarry Smith aj = a->j + ii[i]; 1680fff043a9SJunchao Zhang aa = a_a + ii[i]; 168117ab2063SBarry Smith sum = y[i]; 1682f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 168317ab2063SBarry Smith z[i] = sum; 168417ab2063SBarry Smith } 168502ab625aSSatish Balay #endif 1686f15663dcSBarry Smith } 16879566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16889566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 16913a40ed3dSBarry Smith PetscFunctionReturn(0); 169217ab2063SBarry Smith } 169317ab2063SBarry Smith 169417ab2063SBarry Smith /* 169517ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 169617ab2063SBarry Smith */ 1697dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 169817ab2063SBarry Smith { 1699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1700d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 1701c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 170217ab2063SBarry Smith 17033a40ed3dSBarry Smith PetscFunctionBegin; 170409f38230SBarry Smith if (!a->diag) { 17059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&a->diag)); 17069566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt))); 1707c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 170809f38230SBarry Smith } 1709d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1710c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1711c0c07093SJunchao Zhang if (alreadySet) { 1712c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1713c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i+1] && a->j[pos] == i) continue; 1714c0c07093SJunchao Zhang } 1715c0c07093SJunchao Zhang 171609f38230SBarry Smith a->diag[i] = a->i[i+1]; 1717bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1718bfeeae90SHong Zhang if (a->j[j] == i) { 171909f38230SBarry Smith a->diag[i] = j; 172017ab2063SBarry Smith break; 172117ab2063SBarry Smith } 172217ab2063SBarry Smith } 172317ab2063SBarry Smith } 17243a40ed3dSBarry Smith PetscFunctionReturn(0); 172517ab2063SBarry Smith } 172617ab2063SBarry Smith 172761ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 172861ecd0c6SBarry Smith { 172961ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 173061ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 173161ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 173261ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 173361ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 173461ecd0c6SBarry Smith 173561ecd0c6SBarry Smith PetscFunctionBegin; 173661ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A,1,NULL)); 17389566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 173961ecd0c6SBarry Smith PetscFunctionReturn(0); 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith 174261ecd0c6SBarry Smith if (a->diagonaldense) { 174361ecd0c6SBarry Smith cnt = 0; 174461ecd0c6SBarry Smith } else { 17459566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&mdiag)); 174661ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 1747349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i+1]) { /* 'out of range' rows never have diagonals */ 174861ecd0c6SBarry Smith cnt++; 174961ecd0c6SBarry Smith mdiag[i] = 1; 175061ecd0c6SBarry Smith } 175161ecd0c6SBarry Smith } 175261ecd0c6SBarry Smith } 175361ecd0c6SBarry Smith if (!cnt) { 17549566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 175561ecd0c6SBarry Smith } else { 1756b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1757b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 175861ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 175961ecd0c6SBarry Smith 176061ecd0c6SBarry Smith a->a = NULL; 176161ecd0c6SBarry Smith a->j = NULL; 176261ecd0c6SBarry Smith a->i = NULL; 176361ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1764349d3b71SJunchao Zhang for (i=0; i<PetscMin(A->rmap->n,A->cmap->n); i++) { 176561ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 176661ecd0c6SBarry Smith } 17679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax)); 176861ecd0c6SBarry Smith 176961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 177061ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 17719566063dSJacob Faibussowitsch PetscCall(MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES)); 1772447d62f5SStefano Zampini if (i < A->cmap->n) { 17739566063dSJacob Faibussowitsch PetscCall(MatSetValue(A,i,i,v,ADD_VALUES)); 177461ecd0c6SBarry Smith } 1775447d62f5SStefano Zampini } 17769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY)); 17779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY)); 177861ecd0c6SBarry Smith if (singlemalloc) { 17799566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda,oldj,oldi)); 178061ecd0c6SBarry Smith } else { 17819566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17829566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17839566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 178461ecd0c6SBarry Smith } 178561ecd0c6SBarry Smith } 17869566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 178761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 178861ecd0c6SBarry Smith PetscFunctionReturn(0); 178961ecd0c6SBarry Smith } 179061ecd0c6SBarry Smith 1791be5855fcSBarry Smith /* 1792be5855fcSBarry Smith Checks for missing diagonals 1793be5855fcSBarry Smith */ 1794ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1795be5855fcSBarry Smith { 1796be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17977734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1798be5855fcSBarry Smith 1799be5855fcSBarry Smith PetscFunctionBegin; 180009f38230SBarry Smith *missing = PETSC_FALSE; 18017734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 180209f38230SBarry Smith *missing = PETSC_TRUE; 180309f38230SBarry Smith if (d) *d = 0; 18049566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n")); 180509f38230SBarry Smith } else { 180601445905SHong Zhang PetscInt n; 180701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1808f1e2ffcdSBarry Smith diag = a->diag; 180901445905SHong Zhang for (i=0; i<n; i++) { 18107734d3b5SMatthew G. Knepley if (diag[i] >= ii[i+1]) { 181109f38230SBarry Smith *missing = PETSC_TRUE; 181209f38230SBarry Smith if (d) *d = i; 18139566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix is missing diagonal number %" PetscInt_FMT "\n",i)); 1814358d2f5dSShri Abhyankar break; 181509f38230SBarry Smith } 1816be5855fcSBarry Smith } 1817be5855fcSBarry Smith } 1818be5855fcSBarry Smith PetscFunctionReturn(0); 1819be5855fcSBarry Smith } 1820be5855fcSBarry Smith 18210da83c2eSBarry Smith #include <petscblaslapack.h> 18220da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith /* 18250da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18260da83c2eSBarry Smith */ 18270da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 18280da83c2eSBarry Smith { 18290da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 18300da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 18310da83c2eSBarry Smith const PetscReal shift = 0.0; 18320da83c2eSBarry Smith PetscInt ipvt[5]; 18330da83c2eSBarry Smith PetscScalar work[25],*v_work; 18340da83c2eSBarry Smith 18350da83c2eSBarry Smith PetscFunctionBegin; 18360da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18370da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 183808401ef6SPierre Jolivet PetscCheck(ncnt == n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT,ncnt,n); 18390da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18400da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 18410da83c2eSBarry Smith } 18429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax,&indx)); 18430da83c2eSBarry Smith if (bsizemax > 7) { 18449566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots)); 18450da83c2eSBarry Smith } 18460da83c2eSBarry Smith ncnt = 0; 18470da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18480da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 18499566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag)); 18500da83c2eSBarry Smith switch (bsizes[i]) { 18510da83c2eSBarry Smith case 1: 18520da83c2eSBarry Smith *diag = 1.0/(*diag); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 2: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 3: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 4: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith case 5: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18730da83c2eSBarry Smith break; 18740da83c2eSBarry Smith case 6: 18759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 18760da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18779566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18780da83c2eSBarry Smith break; 18790da83c2eSBarry Smith case 7: 18809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 18810da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18830da83c2eSBarry Smith break; 18840da83c2eSBarry Smith default: 18859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 18860da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bsizes[i])); 18880da83c2eSBarry Smith } 18890da83c2eSBarry Smith ncnt += bsizes[i]; 18900da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 18910da83c2eSBarry Smith } 18920da83c2eSBarry Smith if (bsizemax > 7) { 18939566063dSJacob Faibussowitsch PetscCall(PetscFree2(v_work,v_pivots)); 18940da83c2eSBarry Smith } 18959566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18960da83c2eSBarry Smith PetscFunctionReturn(0); 18970da83c2eSBarry Smith } 18980da83c2eSBarry Smith 1899422a814eSBarry Smith /* 1900422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1901422a814eSBarry Smith */ 19027087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 190371f1c65dSBarry Smith { 190471f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 1905d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 19062e5835c6SStefano Zampini const MatScalar *v; 190754f21887SBarry Smith PetscScalar *idiag,*mdiag; 190871f1c65dSBarry Smith 190971f1c65dSBarry Smith PetscFunctionBegin; 191071f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 19119566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 191271f1c65dSBarry Smith diag = a->diag; 191371f1c65dSBarry Smith if (!a->idiag) { 19149566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work)); 19159566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,3*m*sizeof(PetscScalar))); 191671f1c65dSBarry Smith } 19172e5835c6SStefano Zampini 191871f1c65dSBarry Smith mdiag = a->mdiag; 191971f1c65dSBarry Smith idiag = a->idiag; 19209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 1921422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 192271f1c65dSBarry Smith for (i=0; i<m; i++) { 192371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1924899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1925899639b0SHong Zhang if (PetscRealPart(fshift)) { 19269566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero diagonal on row %" PetscInt_FMT "\n",i)); 19277b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19287b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19297b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 193098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %" PetscInt_FMT,i); 1931899639b0SHong Zhang } 193271f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 193371f1c65dSBarry Smith } 19349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 193571f1c65dSBarry Smith } else { 193671f1c65dSBarry Smith for (i=0; i<m; i++) { 193771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 193871f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 193971f1c65dSBarry Smith } 19409566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*m)); 194171f1c65dSBarry Smith } 194271f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 194471f1c65dSBarry Smith PetscFunctionReturn(0); 194571f1c65dSBarry Smith } 194671f1c65dSBarry Smith 1947c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 194841f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 194917ab2063SBarry Smith { 1950416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1951e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 19522e5835c6SStefano Zampini const MatScalar *v,*idiag=NULL,*mdiag,*aa; 195354f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 19543d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 195597f1f81fSBarry Smith const PetscInt *idx,*diag; 195617ab2063SBarry Smith 19573a40ed3dSBarry Smith PetscFunctionBegin; 1958b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19599566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A,bb,omega,flag,fshift,its,lits,xx)); 1960b215bc84SStefano Zampini PetscFunctionReturn(0); 1961b215bc84SStefano Zampini } 1962b965ef7fSBarry Smith its = its*lits; 196391723122SBarry Smith 196471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19659566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A,omega,fshift)); 196671f1c65dSBarry Smith a->fshift = fshift; 196771f1c65dSBarry Smith a->omega = omega; 1968ed480e8bSBarry Smith 196971f1c65dSBarry Smith diag = a->diag; 197071f1c65dSBarry Smith t = a->ssor_work; 1971ed480e8bSBarry Smith idiag = a->idiag; 197271f1c65dSBarry Smith mdiag = a->mdiag; 1973ed480e8bSBarry Smith 19749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 19759566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx,&x)); 19769566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb,&b)); 1977ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 197817ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 197917ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1980ed480e8bSBarry Smith bs = b; 198117ab2063SBarry Smith for (i=0; i<m; i++) { 198271f1c65dSBarry Smith d = fshift + mdiag[i]; 1983416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1984ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19852e5835c6SStefano Zampini v = aa + diag[i] + 1; 198617ab2063SBarry Smith sum = b[i]*d/omega; 1987003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 198817ab2063SBarry Smith x[i] = sum; 198917ab2063SBarry Smith } 19909566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 19919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 19929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 19939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19943a40ed3dSBarry Smith PetscFunctionReturn(0); 199517ab2063SBarry Smith } 1996c783ea89SBarry Smith 199708401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER,PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 19982205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 19994c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 2000887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 200117ab2063SBarry Smith 200217ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 200317ab2063SBarry Smith 2004887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 200517ab2063SBarry Smith */ 200617ab2063SBarry Smith scale = (2.0/omega) - 1.0; 200717ab2063SBarry Smith 200817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 200917ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2010416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2011ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20122e5835c6SStefano Zampini v = aa + diag[i] + 1; 201317ab2063SBarry Smith sum = b[i]; 2014e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2015ed480e8bSBarry Smith x[i] = sum*idiag[i]; 201617ab2063SBarry Smith } 201717ab2063SBarry Smith 201817ab2063SBarry Smith /* t = b - (2*E - D)x */ 20192e5835c6SStefano Zampini v = aa; 20202205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 202117ab2063SBarry Smith 202217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2023ed480e8bSBarry Smith ts = t; 2024416022c9SBarry Smith diag = a->diag; 202517ab2063SBarry Smith for (i=0; i<m; i++) { 2026416022c9SBarry Smith n = diag[i] - a->i[i]; 2027ed480e8bSBarry Smith idx = a->j + a->i[i]; 20282e5835c6SStefano Zampini v = aa + a->i[i]; 202917ab2063SBarry Smith sum = t[i]; 2030003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 2031ed480e8bSBarry Smith t[i] = sum*idiag[i]; 2032733d66baSBarry Smith /* x = x + t */ 2033733d66baSBarry Smith x[i] += t[i]; 203417ab2063SBarry Smith } 203517ab2063SBarry Smith 20369566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0*m-1 + 2.0*a->nz)); 20379566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 20389566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 20393a40ed3dSBarry Smith PetscFunctionReturn(0); 204017ab2063SBarry Smith } 204117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 204217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204317ab2063SBarry Smith for (i=0; i<m; i++) { 2044416022c9SBarry Smith n = diag[i] - a->i[i]; 2045ed480e8bSBarry Smith idx = a->j + a->i[i]; 20462e5835c6SStefano Zampini v = aa + a->i[i]; 204717ab2063SBarry Smith sum = b[i]; 2048e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20495c99c7daSBarry Smith t[i] = sum; 2050ed480e8bSBarry Smith x[i] = sum*idiag[i]; 205117ab2063SBarry Smith } 20525c99c7daSBarry Smith xb = t; 20539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20543a40ed3dSBarry Smith } else xb = b; 205517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205617ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2057416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2058ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20592e5835c6SStefano Zampini v = aa + diag[i] + 1; 206017ab2063SBarry Smith sum = xb[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20625c99c7daSBarry Smith if (xb == b) { 2063ed480e8bSBarry Smith x[i] = sum*idiag[i]; 20645c99c7daSBarry Smith } else { 2065b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 206617ab2063SBarry Smith } 20675c99c7daSBarry Smith } 20689566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 206917ab2063SBarry Smith } 207017ab2063SBarry Smith its--; 207117ab2063SBarry Smith } 207217ab2063SBarry Smith while (its--) { 207317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 207417ab2063SBarry Smith for (i=0; i<m; i++) { 2075b19a5dc2SMark Adams /* lower */ 2076b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2077ed480e8bSBarry Smith idx = a->j + a->i[i]; 20782e5835c6SStefano Zampini v = aa + a->i[i]; 207917ab2063SBarry Smith sum = b[i]; 2080e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2081b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2082b19a5dc2SMark Adams /* upper */ 2083b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2084b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20852e5835c6SStefano Zampini v = aa + diag[i] + 1; 2086b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2087b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 208817ab2063SBarry Smith } 2089b19a5dc2SMark Adams xb = t; 20909566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2091b19a5dc2SMark Adams } else xb = b; 209217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 209317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2094b19a5dc2SMark Adams sum = xb[i]; 2095b19a5dc2SMark Adams if (xb == b) { 2096b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2097416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 2098ed480e8bSBarry Smith idx = a->j + a->i[i]; 20992e5835c6SStefano Zampini v = aa + a->i[i]; 2100e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2101ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 2102b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2103b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2104b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 21052e5835c6SStefano Zampini v = aa + diag[i] + 1; 2106b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2107b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 210817ab2063SBarry Smith } 2109b19a5dc2SMark Adams } 2110b19a5dc2SMark Adams if (xb == b) { 21119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2112b19a5dc2SMark Adams } else { 21139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2114b19a5dc2SMark Adams } 211517ab2063SBarry Smith } 211617ab2063SBarry Smith } 21179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 21189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 21199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 2120365a8a9eSBarry Smith PetscFunctionReturn(0); 212117ab2063SBarry Smith } 212217ab2063SBarry Smith 2123dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 212417ab2063SBarry Smith { 2125416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21264e220ebcSLois Curfman McInnes 21273a40ed3dSBarry Smith PetscFunctionBegin; 21284e220ebcSLois Curfman McInnes info->block_size = 1.0; 21293966268fSBarry Smith info->nz_allocated = a->maxnz; 21303966268fSBarry Smith info->nz_used = a->nz; 21313966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21323966268fSBarry Smith info->assemblies = A->num_ass; 21333966268fSBarry Smith info->mallocs = A->info.mallocs; 21347adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2135d5f3da31SBarry Smith if (A->factortype) { 21364e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21374e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21384e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21394e220ebcSLois Curfman McInnes } else { 21404e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21414e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21424e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21434e220ebcSLois Curfman McInnes } 21443a40ed3dSBarry Smith PetscFunctionReturn(0); 214517ab2063SBarry Smith } 214617ab2063SBarry Smith 21472b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 214817ab2063SBarry Smith { 2149416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2150c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 215197b48c8fSBarry Smith const PetscScalar *xx; 21522e5835c6SStefano Zampini PetscScalar *bb,*aa; 2153c7da8527SEric Chamberland PetscInt d = 0; 215417ab2063SBarry Smith 21553a40ed3dSBarry Smith PetscFunctionBegin; 215697b48c8fSBarry Smith if (x && b) { 21579566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 21589566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 215997b48c8fSBarry Smith for (i=0; i<N; i++) { 2160aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2161447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216297b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 216397b48c8fSBarry Smith } 21649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 21659566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 216697b48c8fSBarry Smith } 216797b48c8fSBarry Smith 21689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 2169a9817697SBarry Smith if (a->keepnonzeropattern) { 2170f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2171aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21729566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 2173f1e2ffcdSBarry Smith } 2174f4df32b1SMatthew Knepley if (diag != 0.0) { 2175c7da8527SEric Chamberland for (i=0; i<N; i++) { 2176c7da8527SEric Chamberland d = rows[i]; 2177447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 217808401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d+1],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT,d); 2179c7da8527SEric Chamberland } 2180f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2181447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21822e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2183f1e2ffcdSBarry Smith } 2184f1e2ffcdSBarry Smith } 2185f1e2ffcdSBarry Smith } else { 2186f4df32b1SMatthew Knepley if (diag != 0.0) { 218717ab2063SBarry Smith for (i=0; i<N; i++) { 2188aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21897ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2190447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2191447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2192447d62f5SStefano Zampini } else { 2193416022c9SBarry Smith a->ilen[rows[i]] = 1; 21942e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2195bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2196447d62f5SStefano Zampini } 2197447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21989566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 219917ab2063SBarry Smith } 220017ab2063SBarry Smith } 22013a40ed3dSBarry Smith } else { 220217ab2063SBarry Smith for (i=0; i<N; i++) { 2203aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2204416022c9SBarry Smith a->ilen[rows[i]] = 0; 220517ab2063SBarry Smith } 220617ab2063SBarry Smith } 2207e56f5c9eSBarry Smith A->nonzerostate++; 2208f1e2ffcdSBarry Smith } 22099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 22109566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22113a40ed3dSBarry Smith PetscFunctionReturn(0); 221217ab2063SBarry Smith } 221317ab2063SBarry Smith 22146e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 22156e169961SBarry Smith { 22166e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22176e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 22182b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 22196e169961SBarry Smith const PetscScalar *xx; 22202e5835c6SStefano Zampini PetscScalar *bb,*aa; 22216e169961SBarry Smith 22226e169961SBarry Smith PetscFunctionBegin; 22232e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 22249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 22256e169961SBarry Smith if (x && b) { 22269566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 22279566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 22282b40b63fSBarry Smith vecs = PETSC_TRUE; 22296e169961SBarry Smith } 22309566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&zeroed)); 22316e169961SBarry Smith for (i=0; i<N; i++) { 2232aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 22339566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 22342205254eSKarl Rupp 22356e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22366e169961SBarry Smith } 22376e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 22386e169961SBarry Smith if (!zeroed[i]) { 22396e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 22404cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22412e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j]*xx[a->j[j]]; 22422e5835c6SStefano Zampini aa[j] = 0.0; 22436e169961SBarry Smith } 22446e169961SBarry Smith } 22454cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 22466e169961SBarry Smith } 22476e169961SBarry Smith if (x && b) { 22489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 22499566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 22506e169961SBarry Smith } 22519566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22526e169961SBarry Smith if (diag != 0.0) { 22539566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A,&missing,&d)); 22541d5a398dSstefano_zampini if (missing) { 22551d5a398dSstefano_zampini for (i=0; i<N; i++) { 22564cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2257aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")",d,rows[i]); 22589566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 22591d5a398dSstefano_zampini } 22601d5a398dSstefano_zampini } else { 22616e169961SBarry Smith for (i=0; i<N; i++) { 22622e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 22636e169961SBarry Smith } 22646e169961SBarry Smith } 22651d5a398dSstefano_zampini } 22669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 22679566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22686e169961SBarry Smith PetscFunctionReturn(0); 22696e169961SBarry Smith } 22706e169961SBarry Smith 2271a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 227217ab2063SBarry Smith { 2273fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2274fff043a9SJunchao Zhang const PetscScalar *aa; 2275fff043a9SJunchao Zhang PetscInt *itmp; 227617ab2063SBarry Smith 22773a40ed3dSBarry Smith PetscFunctionBegin; 22789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 2279416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 22802e5835c6SStefano Zampini if (v) *v = (PetscScalar*)(aa + a->i[row]); 228117ab2063SBarry Smith if (idx) { 2282bfeeae90SHong Zhang itmp = a->j + a->i[row]; 228326fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2284f4259b30SLisandro Dalcin else *idx = NULL; 228517ab2063SBarry Smith } 22869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 22873a40ed3dSBarry Smith PetscFunctionReturn(0); 228817ab2063SBarry Smith } 228917ab2063SBarry Smith 2290a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 229117ab2063SBarry Smith { 22923a40ed3dSBarry Smith PetscFunctionBegin; 2293cb4a9cd9SHong Zhang if (nz) *nz = 0; 22942e5835c6SStefano Zampini if (idx) *idx = NULL; 22952e5835c6SStefano Zampini if (v) *v = NULL; 22963a40ed3dSBarry Smith PetscFunctionReturn(0); 229717ab2063SBarry Smith } 229817ab2063SBarry Smith 2299dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 230017ab2063SBarry Smith { 2301416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23022e5835c6SStefano Zampini const MatScalar *v; 230336db0b34SBarry Smith PetscReal sum = 0.0; 230497f1f81fSBarry Smith PetscInt i,j; 230517ab2063SBarry Smith 23063a40ed3dSBarry Smith PetscFunctionBegin; 23079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 230817ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2309570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2310570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 231173cf7048SBarry Smith PetscStackCallBLAS("BLASnrm2",*nrm = BLASnrm2_(&nz,v,&one)); 2312570b7f6dSBarry Smith #else 2313416022c9SBarry Smith for (i=0; i<a->nz; i++) { 231436db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 231517ab2063SBarry Smith } 23168f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2317570b7f6dSBarry Smith #endif 23189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 23193a40ed3dSBarry Smith } else if (type == NORM_1) { 232036db0b34SBarry Smith PetscReal *tmp; 232197f1f81fSBarry Smith PetscInt *jj = a->j; 23229566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n+1,&tmp)); 2323064f8208SBarry Smith *nrm = 0.0; 2324416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2325bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 232617ab2063SBarry Smith } 2327d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2328064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 232917ab2063SBarry Smith } 23309566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23319566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 23323a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2333064f8208SBarry Smith *nrm = 0.0; 2334d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 23352e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 233617ab2063SBarry Smith sum = 0.0; 2337416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 23382e5835c6SStefano Zampini sum += PetscAbsScalar(*v2); v2++; 233917ab2063SBarry Smith } 2340064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 234117ab2063SBarry Smith } 23429566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 2343f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 23449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 23453a40ed3dSBarry Smith PetscFunctionReturn(0); 234617ab2063SBarry Smith } 234717ab2063SBarry Smith 23484e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? */ 23494e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 23504e938277SHong Zhang { 23514e938277SHong Zhang PetscInt i,j,anzj; 23524e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 23534e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 23544e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 23554e938277SHong Zhang 23564e938277SHong Zhang PetscFunctionBegin; 23574e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 23589566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(an+1,&ati)); 23599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ai[am],&atj)); 23609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(an,&atfill)); 23614e938277SHong Zhang 23624e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 23634e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 236426fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 23654e938277SHong Zhang /* Form ati for csr format of A^T. */ 236626fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 23674e938277SHong Zhang 23684e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 23699566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(atfill,ati,an)); 23704e938277SHong Zhang 23714e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 23724e938277SHong Zhang for (i=0;i<am;i++) { 23734e938277SHong Zhang anzj = ai[i+1] - ai[i]; 23744e938277SHong Zhang for (j=0;j<anzj;j++) { 23754e938277SHong Zhang atj[atfill[*aj]] = i; 23764e938277SHong Zhang atfill[*aj++] += 1; 23774e938277SHong Zhang } 23784e938277SHong Zhang } 23794e938277SHong Zhang 23804e938277SHong Zhang /* Clean up temporary space and complete requests. */ 23819566063dSJacob Faibussowitsch PetscCall(PetscFree(atfill)); 23829566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B)); 23839566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs))); 23849566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 2385a2f3521dSMark F. Adams 23864e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 23874e938277SHong Zhang b->free_a = PETSC_FALSE; 23884e938277SHong Zhang b->free_ij = PETSC_TRUE; 23894e938277SHong Zhang b->nonew = 0; 23904e938277SHong Zhang PetscFunctionReturn(0); 23914e938277SHong Zhang } 23924e938277SHong Zhang 23937087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2394cd0d46ebSvictorle { 23953d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 239654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 23972e5835c6SStefano Zampini const MatScalar *va,*vb; 239897f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2399cd0d46ebSvictorle 2400cd0d46ebSvictorle PetscFunctionBegin; 24019566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24029566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24035485867bSBarry Smith if (ma!=nb || na!=mb) { 24045485867bSBarry Smith *f = PETSC_FALSE; 24055485867bSBarry Smith PetscFunctionReturn(0); 24065485867bSBarry Smith } 24079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&va)); 24089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&vb)); 2409cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2410cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 24119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 2413cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2414cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2415cd0d46ebSvictorle 2416cd0d46ebSvictorle *f = PETSC_TRUE; 2417cd0d46ebSvictorle for (i=0; i<ma; i++) { 2418cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 241997f1f81fSBarry Smith PetscInt idc,idr; 24205485867bSBarry Smith PetscScalar vc,vr; 2421cd0d46ebSvictorle /* column/row index/value */ 24225485867bSBarry Smith idc = adx[aptr[i]]; 24235485867bSBarry Smith idr = bdx[bptr[idc]]; 24245485867bSBarry Smith vc = va[aptr[i]]; 24255485867bSBarry Smith vr = vb[bptr[idc]]; 24265485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 24275485867bSBarry Smith *f = PETSC_FALSE; 24285485867bSBarry Smith goto done; 2429cd0d46ebSvictorle } else { 24305485867bSBarry Smith aptr[i]++; 24315485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2432cd0d46ebSvictorle } 2433cd0d46ebSvictorle } 2434cd0d46ebSvictorle } 2435cd0d46ebSvictorle done: 24369566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24379566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&va)); 24399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&vb)); 2440cd0d46ebSvictorle PetscFunctionReturn(0); 2441cd0d46ebSvictorle } 2442cd0d46ebSvictorle 24437087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 24441cbb95d3SBarry Smith { 24453d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 244654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 244754f21887SBarry Smith MatScalar *va,*vb; 24481cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 24491cbb95d3SBarry Smith 24501cbb95d3SBarry Smith PetscFunctionBegin; 24519566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24529566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24531cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 24541cbb95d3SBarry Smith *f = PETSC_FALSE; 24551cbb95d3SBarry Smith PetscFunctionReturn(0); 24561cbb95d3SBarry Smith } 24571cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 24581cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 24591cbb95d3SBarry Smith va = aij->a; vb = bij->a; 24609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 24621cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 24631cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 24641cbb95d3SBarry Smith 24651cbb95d3SBarry Smith *f = PETSC_TRUE; 24661cbb95d3SBarry Smith for (i=0; i<ma; i++) { 24671cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 24681cbb95d3SBarry Smith PetscInt idc,idr; 24691cbb95d3SBarry Smith PetscScalar vc,vr; 24701cbb95d3SBarry Smith /* column/row index/value */ 24711cbb95d3SBarry Smith idc = adx[aptr[i]]; 24721cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24731cbb95d3SBarry Smith vc = va[aptr[i]]; 24741cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24751cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 24761cbb95d3SBarry Smith *f = PETSC_FALSE; 24771cbb95d3SBarry Smith goto done; 24781cbb95d3SBarry Smith } else { 24791cbb95d3SBarry Smith aptr[i]++; 24801cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 24811cbb95d3SBarry Smith } 24821cbb95d3SBarry Smith } 24831cbb95d3SBarry Smith } 24841cbb95d3SBarry Smith done: 24859566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24869566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24871cbb95d3SBarry Smith PetscFunctionReturn(0); 24881cbb95d3SBarry Smith } 24891cbb95d3SBarry Smith 2490ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24919e29f15eSvictorle { 24929e29f15eSvictorle PetscFunctionBegin; 24939566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A,A,tol,f)); 24949e29f15eSvictorle PetscFunctionReturn(0); 24959e29f15eSvictorle } 24969e29f15eSvictorle 2497ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24981cbb95d3SBarry Smith { 24991cbb95d3SBarry Smith PetscFunctionBegin; 25009566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A,A,tol,f)); 25011cbb95d3SBarry Smith PetscFunctionReturn(0); 25021cbb95d3SBarry Smith } 25031cbb95d3SBarry Smith 2504dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 250517ab2063SBarry Smith { 2506416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2507fff8e43fSBarry Smith const PetscScalar *l,*r; 2508fff8e43fSBarry Smith PetscScalar x; 250954f21887SBarry Smith MatScalar *v; 2510fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2511fff8e43fSBarry Smith const PetscInt *jj; 251217ab2063SBarry Smith 25133a40ed3dSBarry Smith PetscFunctionBegin; 251417ab2063SBarry Smith if (ll) { 25153ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 25163ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 25179566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll,&m)); 251808401ef6SPierre Jolivet PetscCheck(m == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 25199566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll,&l)); 25209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 252117ab2063SBarry Smith for (i=0; i<m; i++) { 252217ab2063SBarry Smith x = l[i]; 2523416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 25242205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 252517ab2063SBarry Smith } 25269566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll,&l)); 25279566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 25289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 252917ab2063SBarry Smith } 253017ab2063SBarry Smith if (rr) { 25319566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr,&n)); 253208401ef6SPierre Jolivet PetscCheck(n == A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 25339566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr,&r)); 25349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 25352e5835c6SStefano Zampini jj = a->j; 25362205254eSKarl Rupp for (i=0; i<nz; i++) (*v++) *= r[*jj++]; 25379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 25389566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr,&r)); 25399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 254017ab2063SBarry Smith } 25419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 25423a40ed3dSBarry Smith PetscFunctionReturn(0); 254317ab2063SBarry Smith } 254417ab2063SBarry Smith 25457dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 254617ab2063SBarry Smith { 2547db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 2548d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 254997f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 25505d0c19d7SBarry Smith const PetscInt *irow,*icol; 25512e5835c6SStefano Zampini const PetscScalar *aa; 25525d0c19d7SBarry Smith PetscInt nrows,ncols; 255397f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 255454f21887SBarry Smith MatScalar *a_new,*mat_a; 2555416022c9SBarry Smith Mat C; 2556cdc6f3adSToby Isaac PetscBool stride; 255717ab2063SBarry Smith 25583a40ed3dSBarry Smith PetscFunctionBegin; 25599566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow,&irow)); 25609566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow,&nrows)); 25619566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol,&ncols)); 256217ab2063SBarry Smith 25639566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride)); 2564ff718158SBarry Smith if (stride) { 25659566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol,&first,&step)); 2566ff718158SBarry Smith } else { 2567ff718158SBarry Smith first = 0; 2568ff718158SBarry Smith step = 0; 2569ff718158SBarry Smith } 2570fee21e36SBarry Smith if (stride && step == 1) { 257102834360SBarry Smith /* special case of contiguous rows */ 25729566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows,&lens,nrows,&starts)); 257302834360SBarry Smith /* loop over new rows determining lens and starting points */ 257402834360SBarry Smith for (i=0; i<nrows; i++) { 2575bfeeae90SHong Zhang kstart = ai[irow[i]]; 2576a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2577a91a9bebSLisandro Dalcin starts[i] = kstart; 257802834360SBarry Smith for (k=kstart; k<kend; k++) { 2579bfeeae90SHong Zhang if (aj[k] >= first) { 258002834360SBarry Smith starts[i] = k; 258102834360SBarry Smith break; 258202834360SBarry Smith } 258302834360SBarry Smith } 2584a2744918SBarry Smith sum = 0; 258502834360SBarry Smith while (k < kend) { 2586bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2587a2744918SBarry Smith sum++; 258802834360SBarry Smith } 2589a2744918SBarry Smith lens[i] = sum; 259002834360SBarry Smith } 259102834360SBarry Smith /* create submatrix */ 2592cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 259397f1f81fSBarry Smith PetscInt n_cols,n_rows; 25949566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B,&n_rows,&n_cols)); 2595aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 25969566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 259708480c60SBarry Smith C = *B; 25983a40ed3dSBarry Smith } else { 25993bef6203SJed Brown PetscInt rbs,cbs; 26009566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26029566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26039566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26049566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26059566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 260708480c60SBarry Smith } 2608db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2609db02288aSLois Curfman McInnes 261002834360SBarry Smith /* loop over rows inserting into submatrix */ 2611db02288aSLois Curfman McInnes a_new = c->a; 2612db02288aSLois Curfman McInnes j_new = c->j; 2613db02288aSLois Curfman McInnes i_new = c->i; 26149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 261502834360SBarry Smith for (i=0; i<nrows; i++) { 2616a2744918SBarry Smith ii = starts[i]; 2617a2744918SBarry Smith lensi = lens[i]; 2618a2744918SBarry Smith for (k=0; k<lensi; k++) { 2619a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 262002834360SBarry Smith } 26219566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new,aa + starts[i],lensi)); 2622a2744918SBarry Smith a_new += lensi; 2623a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2624a2744918SBarry Smith c->ilen[i] = lensi; 262502834360SBarry Smith } 26269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 26279566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens,starts)); 26283a40ed3dSBarry Smith } else { 26299566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol,&icol)); 26309566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols,&smap)); 26319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1+nrows,&lens)); 26324dcab191SBarry Smith for (i=0; i<ncols; i++) { 26336bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT,i,icol[i],oldcols); 26344dcab191SBarry Smith smap[icol[i]] = i+1; 26354dcab191SBarry Smith } 26364dcab191SBarry Smith 263702834360SBarry Smith /* determine lens of each row */ 263802834360SBarry Smith for (i=0; i<nrows; i++) { 2639bfeeae90SHong Zhang kstart = ai[irow[i]]; 264002834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 264102834360SBarry Smith lens[i] = 0; 264202834360SBarry Smith for (k=kstart; k<kend; k++) { 2643bfeeae90SHong Zhang if (smap[aj[k]]) { 264402834360SBarry Smith lens[i]++; 264502834360SBarry Smith } 264602834360SBarry Smith } 264702834360SBarry Smith } 264817ab2063SBarry Smith /* Create and fill new matrix */ 2649a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2650ace3abfcSBarry Smith PetscBool equal; 26510f5bd95cSBarry Smith 265299141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2653aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 26549566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal)); 265528b400f6SJacob Faibussowitsch PetscCheck(equal,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 26569566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen,(*B)->rmap->n)); 265708480c60SBarry Smith C = *B; 26583a40ed3dSBarry Smith } else { 26593bef6203SJed Brown PetscInt rbs,cbs; 26609566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26619566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26629566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26639566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26649566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26659566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 266708480c60SBarry Smith } 26689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 266999141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 267017ab2063SBarry Smith for (i=0; i<nrows; i++) { 267199141d43SSatish Balay row = irow[i]; 2672bfeeae90SHong Zhang kstart = ai[row]; 267399141d43SSatish Balay kend = kstart + a->ilen[row]; 2674bfeeae90SHong Zhang mat_i = c->i[i]; 267599141d43SSatish Balay mat_j = c->j + mat_i; 267699141d43SSatish Balay mat_a = c->a + mat_i; 267799141d43SSatish Balay mat_ilen = c->ilen + i; 267817ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2679bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2680ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26812e5835c6SStefano Zampini *mat_a++ = aa[k]; 268299141d43SSatish Balay (*mat_ilen)++; 268399141d43SSatish Balay 268417ab2063SBarry Smith } 268517ab2063SBarry Smith } 268617ab2063SBarry Smith } 26879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 268802834360SBarry Smith /* Free work space */ 26899566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol,&icol)); 26909566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26919566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2692cdc6f3adSToby Isaac /* sort */ 2693cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2694cdc6f3adSToby Isaac PetscInt ilen; 2695cdc6f3adSToby Isaac 2696cdc6f3adSToby Isaac mat_i = c->i[i]; 2697cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2698cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2699cdc6f3adSToby Isaac ilen = c->ilen[i]; 27009566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen,mat_j,mat_a)); 2701cdc6f3adSToby Isaac } 270202834360SBarry Smith } 27038c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 27049566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C,A->boundtocpu)); 2705305c6ccfSStefano Zampini #endif 27069566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY)); 27079566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY)); 270817ab2063SBarry Smith 27099566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow,&irow)); 2710416022c9SBarry Smith *B = C; 27113a40ed3dSBarry Smith PetscFunctionReturn(0); 271217ab2063SBarry Smith } 271317ab2063SBarry Smith 2714fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 271582d44351SHong Zhang { 271682d44351SHong Zhang Mat B; 271782d44351SHong Zhang 271882d44351SHong Zhang PetscFunctionBegin; 2719c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 27209566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm,&B)); 27219566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n)); 27229566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B,mat,mat)); 27239566063dSJacob Faibussowitsch PetscCall(MatSetType(B,MATSEQAIJ)); 27249566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE)); 272582d44351SHong Zhang *subMat = B; 2726c2d650bdSHong Zhang } else { 27279566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN)); 2728c2d650bdSHong Zhang } 272982d44351SHong Zhang PetscFunctionReturn(0); 273082d44351SHong Zhang } 273182d44351SHong Zhang 27329a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2733a871dcd8SBarry Smith { 273463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 273563b91edcSBarry Smith Mat outA; 2736ace3abfcSBarry Smith PetscBool row_identity,col_identity; 273763b91edcSBarry Smith 27383a40ed3dSBarry Smith PetscFunctionBegin; 273908401ef6SPierre Jolivet PetscCheck(info->levels == 0,PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 27401df811f5SHong Zhang 27419566063dSJacob Faibussowitsch PetscCall(ISIdentity(row,&row_identity)); 27429566063dSJacob Faibussowitsch PetscCall(ISIdentity(col,&col_identity)); 2743a871dcd8SBarry Smith 274463b91edcSBarry Smith outA = inA; 2745d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 27479566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype)); 27482205254eSKarl Rupp 27499566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 27509566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 27512205254eSKarl Rupp 2752c3122656SLisandro Dalcin a->row = row; 27532205254eSKarl Rupp 27549566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 27559566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 27562205254eSKarl Rupp 2757c3122656SLisandro Dalcin a->col = col; 275863b91edcSBarry Smith 275936db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 27609566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27619566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col,PETSC_DECIDE,&a->icol)); 27629566063dSJacob Faibussowitsch PetscCall(PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol)); 2763f0ec6fceSSatish Balay 276494a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n+1,&a->solve_work)); 27669566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar))); 276794a9d846SBarry Smith } 276863b91edcSBarry Smith 27699566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2770137fb511SHong Zhang if (row_identity && col_identity) { 27719566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info)); 2772137fb511SHong Zhang } else { 27739566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info)); 2774137fb511SHong Zhang } 27753a40ed3dSBarry Smith PetscFunctionReturn(0); 2776a871dcd8SBarry Smith } 2777a871dcd8SBarry Smith 2778f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2779f0b747eeSBarry Smith { 2780f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2781dfa0f9e5SStefano Zampini PetscScalar *v; 2782c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 27833a40ed3dSBarry Smith 27843a40ed3dSBarry Smith PetscFunctionBegin; 27859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA,&v)); 27869566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz,&bnz)); 2787dfa0f9e5SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&alpha,v,&one)); 27889566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA,&v)); 27909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27913a40ed3dSBarry Smith PetscFunctionReturn(0); 2792f0b747eeSBarry Smith } 2793f0b747eeSBarry Smith 2794f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 279516b64355SHong Zhang { 279616b64355SHong Zhang PetscInt i; 279716b64355SHong Zhang 279816b64355SHong Zhang PetscFunctionBegin; 279916b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 28009566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr)); 280116b64355SHong Zhang 280216b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 28039566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->sbuf2[i])); 280416b64355SHong Zhang } 28059566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1)); 280616b64355SHong Zhang 280716b64355SHong Zhang if (submatj->rbuf1) { 28089566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 28099566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 281016b64355SHong Zhang } 281116b64355SHong Zhang 281216b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 28139566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf3[i])); 281416b64355SHong Zhang } 28159566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3)); 28169566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 281716b64355SHong Zhang } 281816b64355SHong Zhang 281916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28209566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->rmap)); 28219566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 28229566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 282316b64355SHong Zhang #else 28249566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 282516b64355SHong Zhang #endif 282616b64355SHong Zhang 282716b64355SHong Zhang if (!submatj->allcolumns) { 282816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28299566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->cmap)); 283016b64355SHong Zhang #else 28319566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 283216b64355SHong Zhang #endif 283316b64355SHong Zhang } 28349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 283516b64355SHong Zhang 28369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 283716b64355SHong Zhang PetscFunctionReturn(0); 283816b64355SHong Zhang } 283916b64355SHong Zhang 28400fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 284116b64355SHong Zhang { 284216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 28435c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 284416b64355SHong Zhang 284516b64355SHong Zhang PetscFunctionBegin; 28469566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28479566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 284816b64355SHong Zhang PetscFunctionReturn(0); 284916b64355SHong Zhang } 285016b64355SHong Zhang 285189a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 28522d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 28532d033e1fSHong Zhang { 28542d033e1fSHong Zhang PetscInt i; 28550fb991dcSHong Zhang Mat C; 28560fb991dcSHong Zhang Mat_SeqAIJ *c; 28570fb991dcSHong Zhang Mat_SubSppt *submatj; 28582d033e1fSHong Zhang 28592d033e1fSHong Zhang PetscFunctionBegin; 28602d033e1fSHong Zhang for (i=0; i<n; i++) { 28610fb991dcSHong Zhang C = (*mat)[i]; 28620fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 28630fb991dcSHong Zhang submatj = c->submatis1; 28642d033e1fSHong Zhang if (submatj) { 2865682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 2866*26cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 28679566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28689566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28699566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28709566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28719566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28729566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2873682e4c99SStefano Zampini } 28742d033e1fSHong Zhang } else { 28759566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28762d033e1fSHong Zhang } 28772d033e1fSHong Zhang } 287886e85357SHong Zhang 287963a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28809566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n,mat)); 288163a75b2aSHong Zhang 28829566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28832d033e1fSHong Zhang PetscFunctionReturn(0); 28842d033e1fSHong Zhang } 28852d033e1fSHong Zhang 28867dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2887cddf8d76SBarry Smith { 288897f1f81fSBarry Smith PetscInt i; 2889cddf8d76SBarry Smith 28903a40ed3dSBarry Smith PetscFunctionBegin; 2891cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 28929566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n+1,B)); 2893cddf8d76SBarry Smith } 2894cddf8d76SBarry Smith 2895cddf8d76SBarry Smith for (i=0; i<n; i++) { 28969566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i])); 2897cddf8d76SBarry Smith } 28983a40ed3dSBarry Smith PetscFunctionReturn(0); 2899cddf8d76SBarry Smith } 2900cddf8d76SBarry Smith 290197f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 29024dcbc457SBarry Smith { 2903e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29045d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 29055d0c19d7SBarry Smith const PetscInt *idx; 290697f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2907f1af5d2fSBarry Smith PetscBT table; 2908bbd702dbSSatish Balay 29093a40ed3dSBarry Smith PetscFunctionBegin; 2910d0f46423SBarry Smith m = A->rmap->n; 2911e4d965acSSatish Balay ai = a->i; 2912bfeeae90SHong Zhang aj = a->j; 29138a047759SSatish Balay 291408401ef6SPierre Jolivet PetscCheck(ov >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 291506763907SSatish Balay 29169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&nidx)); 29179566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m,&table)); 291806763907SSatish Balay 2919e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2920b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2921e4d965acSSatish Balay isz = 0; 29229566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m,table)); 2923e4d965acSSatish Balay 2924e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 29259566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i],&idx)); 29269566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i],&n)); 2927e4d965acSSatish Balay 2928dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2929e4d965acSSatish Balay for (j=0; j<n; ++j) { 29302205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 29314dcbc457SBarry Smith } 29329566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i],&idx)); 29339566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2934e4d965acSSatish Balay 293504a348a9SBarry Smith k = 0; 293604a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 293704a348a9SBarry Smith n = isz; 293806763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2939e4d965acSSatish Balay row = nidx[k]; 2940e4d965acSSatish Balay start = ai[row]; 2941e4d965acSSatish Balay end = ai[row+1]; 294204a348a9SBarry Smith for (l = start; l<end; l++) { 2943efb16452SHong Zhang val = aj[l]; 29442205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2945e4d965acSSatish Balay } 2946e4d965acSSatish Balay } 2947e4d965acSSatish Balay } 29489566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i))); 2949e4d965acSSatish Balay } 29509566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29519566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29523a40ed3dSBarry Smith PetscFunctionReturn(0); 29534dcbc457SBarry Smith } 295417ab2063SBarry Smith 29550513a670SBarry Smith /* -------------------------------------------------------------- */ 2956dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 29570513a670SBarry Smith { 29580513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29593b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 29605d0c19d7SBarry Smith const PetscInt *row,*col; 29615d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 296256cd22aeSBarry Smith IS icolp,irowp; 29630298fd71SBarry Smith PetscInt *cwork = NULL; 29640298fd71SBarry Smith PetscScalar *vwork = NULL; 29650513a670SBarry Smith 29663a40ed3dSBarry Smith PetscFunctionBegin; 29679566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp,PETSC_DECIDE,&irowp)); 29689566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp,&row)); 29699566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp,PETSC_DECIDE,&icolp)); 29709566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp,&col)); 29710513a670SBarry Smith 29720513a670SBarry Smith /* determine lengths of permuted rows */ 29739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&lens)); 29742205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 29759566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 29769566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,m,n,m,n)); 29779566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 29789566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 29799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens)); 29809566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29810513a670SBarry Smith 29829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n,&cnew)); 29830513a670SBarry Smith for (i=0; i<m; i++) { 29849566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29852205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 29869566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES)); 29879566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29880513a670SBarry Smith } 29899566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29902205254eSKarl Rupp 29913c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29922205254eSKarl Rupp 29938c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29949566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B,A->boundtocpu)); 29959fe5e383SStefano Zampini #endif 29969566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 29979566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 29989566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp,&row)); 29999566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp,&col)); 30009566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 30019566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 30026768869dSprj- if (rowp == colp) { 30039566063dSJacob Faibussowitsch PetscCall(MatPropagateSymmetryOptions(A,*B)); 30046768869dSprj- } 30053a40ed3dSBarry Smith PetscFunctionReturn(0); 30060513a670SBarry Smith } 30070513a670SBarry Smith 3008dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 3009cb5b572fSBarry Smith { 3010cb5b572fSBarry Smith PetscFunctionBegin; 301133f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 301233f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 3013be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3014be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 30152e5835c6SStefano Zampini const PetscScalar *aa; 3016be6bf707SBarry Smith 30179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 301808401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n],PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT,a->i[A->rmap->n],b->i[B->rmap->n]); 30199566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a,aa,a->i[A->rmap->n])); 30209566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 30219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 3022cb5b572fSBarry Smith } else { 30239566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A,B,str)); 3024cb5b572fSBarry Smith } 3025cb5b572fSBarry Smith PetscFunctionReturn(0); 3026cb5b572fSBarry Smith } 3027cb5b572fSBarry Smith 30284994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 3029273d9f13SBarry Smith { 3030273d9f13SBarry Smith PetscFunctionBegin; 30319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,NULL)); 3032273d9f13SBarry Smith PetscFunctionReturn(0); 3033273d9f13SBarry Smith } 3034273d9f13SBarry Smith 3035f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 30366c0721eeSBarry Smith { 30376c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 30386e111a19SKarl Rupp 30396c0721eeSBarry Smith PetscFunctionBegin; 30406c0721eeSBarry Smith *array = a->a; 30416c0721eeSBarry Smith PetscFunctionReturn(0); 30426c0721eeSBarry Smith } 30436c0721eeSBarry Smith 3044f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 30456c0721eeSBarry Smith { 30466c0721eeSBarry Smith PetscFunctionBegin; 3047f38c1e66SStefano Zampini *array = NULL; 30486c0721eeSBarry Smith PetscFunctionReturn(0); 30496c0721eeSBarry Smith } 3050273d9f13SBarry Smith 30518229c054SShri Abhyankar /* 30528229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 30538229c054SShri Abhyankar have different nonzero structure. 30548229c054SShri Abhyankar */ 3055b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 3056ec7775f6SShri Abhyankar { 3057b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 3058ec7775f6SShri Abhyankar 3059ec7775f6SShri Abhyankar PetscFunctionBegin; 3060ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3061ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 3062b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 3063b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 3064b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 30658af7cee1SJed Brown nnz[i] = 0; 30668af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 3067b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3068b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 30698af7cee1SJed Brown nnz[i]++; 30708af7cee1SJed Brown } 30718af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 3072ec7775f6SShri Abhyankar } 3073ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3074ec7775f6SShri Abhyankar } 3075ec7775f6SShri Abhyankar 3076b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 3077b264fe52SHong Zhang { 3078b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3079b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 3080b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 3081b264fe52SHong Zhang 3082b264fe52SHong Zhang PetscFunctionBegin; 3083b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30849566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz)); 3085b264fe52SHong Zhang PetscFunctionReturn(0); 3086b264fe52SHong Zhang } 3087b264fe52SHong Zhang 3088f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 3089ac90fabeSBarry Smith { 3090ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 3091ac90fabeSBarry Smith 3092ac90fabeSBarry Smith PetscFunctionBegin; 3093134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3094134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3095134adf20SPierre Jolivet if (e) { 30969566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i,y->i,Y->rmap->n+1,&e)); 309781fa06acSBarry Smith if (e) { 30989566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j,y->j,y->nz,&e)); 3099134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 310081fa06acSBarry Smith } 310181fa06acSBarry Smith } 310254c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"MatStructure is not SAME_NONZERO_PATTERN"); 310381fa06acSBarry Smith } 3104ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 31052e5835c6SStefano Zampini const PetscScalar *xa; 31062e5835c6SStefano Zampini PetscScalar *ya,alpha = a; 310781fa06acSBarry Smith PetscBLASInt one = 1,bnz; 310881fa06acSBarry Smith 31099566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz,&bnz)); 31109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&ya)); 31119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X,&xa)); 31122e5835c6SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,xa,&one,ya,&one)); 31139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X,&xa)); 31149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&ya)); 31159566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*bnz)); 31169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 31179566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3118ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 31199566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y,a,X,str)); 3120ac90fabeSBarry Smith } else { 31218229c054SShri Abhyankar Mat B; 31228229c054SShri Abhyankar PetscInt *nnz; 31239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N,&nnz)); 31249566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y),&B)); 31259566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name)); 31269566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B,Y->rmap,Y->cmap)); 31279566063dSJacob Faibussowitsch PetscCall(MatSetType(B,((PetscObject)Y)->type_name)); 31289566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz)); 31299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B,0,nnz)); 31309566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 31319566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y,&B)); 31329566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3133ac90fabeSBarry Smith } 3134ac90fabeSBarry Smith PetscFunctionReturn(0); 3135ac90fabeSBarry Smith } 3136ac90fabeSBarry Smith 31372726fb6dSPierre Jolivet PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3138354c94deSBarry Smith { 3139354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3140354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3141354c94deSBarry Smith PetscInt i,nz; 3142354c94deSBarry Smith PetscScalar *a; 3143354c94deSBarry Smith 3144354c94deSBarry Smith PetscFunctionBegin; 3145354c94deSBarry Smith nz = aij->nz; 31469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat,&a)); 31472205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 31489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat,&a)); 3149354c94deSBarry Smith #else 3150354c94deSBarry Smith PetscFunctionBegin; 3151354c94deSBarry Smith #endif 3152354c94deSBarry Smith PetscFunctionReturn(0); 3153354c94deSBarry Smith } 3154354c94deSBarry Smith 3155985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3156e34fafa9SBarry Smith { 3157e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3158d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3159e34fafa9SBarry Smith PetscReal atmp; 3160985db425SBarry Smith PetscScalar *x; 3161ce496241SStefano Zampini const MatScalar *aa,*av; 3162e34fafa9SBarry Smith 3163e34fafa9SBarry Smith PetscFunctionBegin; 316428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3166ce496241SStefano Zampini aa = av; 3167e34fafa9SBarry Smith ai = a->i; 3168e34fafa9SBarry Smith aj = a->j; 3169e34fafa9SBarry Smith 31709566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31719566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31729566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 317308401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3174e34fafa9SBarry Smith for (i=0; i<m; i++) { 3175e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 3176e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3177985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3178985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3179985db425SBarry Smith aa++; aj++; 3180985db425SBarry Smith } 3181985db425SBarry Smith } 31829566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 31839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3184985db425SBarry Smith PetscFunctionReturn(0); 3185985db425SBarry Smith } 3186985db425SBarry Smith 3187985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3188985db425SBarry Smith { 3189985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3190d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3191985db425SBarry Smith PetscScalar *x; 3192ce496241SStefano Zampini const MatScalar *aa,*av; 3193985db425SBarry Smith 3194985db425SBarry Smith PetscFunctionBegin; 319528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3197ce496241SStefano Zampini aa = av; 3198985db425SBarry Smith ai = a->i; 3199985db425SBarry Smith aj = a->j; 3200985db425SBarry Smith 32019566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32029566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32039566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 320408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3205985db425SBarry Smith for (i=0; i<m; i++) { 3206985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3207d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3208985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3209985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3210985db425SBarry Smith x[i] = 0.0; 3211985db425SBarry Smith if (idx) { 3212985db425SBarry Smith for (j=0; j<ncols; j++) { /* find first implicit 0.0 in the row */ 3213985db425SBarry Smith if (aj[j] > j) { 3214985db425SBarry Smith idx[i] = j; 3215985db425SBarry Smith break; 3216985db425SBarry Smith } 3217985db425SBarry Smith } 32181a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 32191a254869SHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3220985db425SBarry Smith } 3221985db425SBarry Smith } 3222985db425SBarry Smith for (j=0; j<ncols; j++) { 3223985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3224985db425SBarry Smith aa++; aj++; 3225985db425SBarry Smith } 3226985db425SBarry Smith } 32279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3229985db425SBarry Smith PetscFunctionReturn(0); 3230985db425SBarry Smith } 3231985db425SBarry Smith 3232c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3233c87e5d42SMatthew Knepley { 3234c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3235c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3236ce496241SStefano Zampini PetscScalar *x; 3237ce496241SStefano Zampini const MatScalar *aa,*av; 3238c87e5d42SMatthew Knepley 3239c87e5d42SMatthew Knepley PetscFunctionBegin; 32409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3241ce496241SStefano Zampini aa = av; 3242c87e5d42SMatthew Knepley ai = a->i; 3243c87e5d42SMatthew Knepley aj = a->j; 3244c87e5d42SMatthew Knepley 32459566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32469566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32479566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 324808401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3249c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3250c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3251f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 3252f07e67edSHong Zhang x[i] = *aa; if (idx) idx[i] = 0; 3253f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3254f07e67edSHong Zhang x[i] = 0.0; 3255f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3256289a08f5SMatthew Knepley for (j=0; j<ncols; j++) { 3257f07e67edSHong Zhang if (aj[j] > j) { 3258f07e67edSHong Zhang idx[i] = j; 32592205254eSKarl Rupp break; 32602205254eSKarl Rupp } 3261289a08f5SMatthew Knepley } 3262f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3263f07e67edSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3264f07e67edSHong Zhang } 3265289a08f5SMatthew Knepley } 3266c87e5d42SMatthew Knepley for (j=0; j<ncols; j++) { 3267f07e67edSHong Zhang if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3268c87e5d42SMatthew Knepley aa++; aj++; 3269c87e5d42SMatthew Knepley } 3270c87e5d42SMatthew Knepley } 32719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3273c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3274c87e5d42SMatthew Knepley } 3275c87e5d42SMatthew Knepley 3276985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3277985db425SBarry Smith { 3278985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3279d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3280d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3281985db425SBarry Smith PetscScalar *x; 3282ce496241SStefano Zampini const MatScalar *aa,*av; 3283985db425SBarry Smith 3284985db425SBarry Smith PetscFunctionBegin; 328528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 32869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3287ce496241SStefano Zampini aa = av; 3288985db425SBarry Smith ai = a->i; 3289985db425SBarry Smith aj = a->j; 3290985db425SBarry Smith 32919566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32929566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32939566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 329408401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3295985db425SBarry Smith for (i=0; i<m; i++) { 3296985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3297d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3298985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3299985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3300985db425SBarry Smith x[i] = 0.0; 3301985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3302985db425SBarry Smith for (j=0; j<ncols; j++) { 3303985db425SBarry Smith if (aj[j] > j) { 3304985db425SBarry Smith idx[i] = j; 3305985db425SBarry Smith break; 3306985db425SBarry Smith } 3307985db425SBarry Smith } 3308fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3309fa213d2fSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3310985db425SBarry Smith } 3311985db425SBarry Smith } 3312985db425SBarry Smith for (j=0; j<ncols; j++) { 3313985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3314985db425SBarry Smith aa++; aj++; 3315e34fafa9SBarry Smith } 3316e34fafa9SBarry Smith } 33179566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 33189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3319e34fafa9SBarry Smith PetscFunctionReturn(0); 3320e34fafa9SBarry Smith } 3321bbead8a2SBarry Smith 3322713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3323bbead8a2SBarry Smith { 3324bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 332533d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3326bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 33270da83c2eSBarry Smith const PetscReal shift = 0.0; 33281a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3329bbead8a2SBarry Smith 3330bbead8a2SBarry Smith PetscFunctionBegin; 3331a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33324a0d0026SBarry Smith if (a->ibdiagvalid) { 33334a0d0026SBarry Smith if (values) *values = a->ibdiag; 33344a0d0026SBarry Smith PetscFunctionReturn(0); 33354a0d0026SBarry Smith } 33369566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 3337bbead8a2SBarry Smith if (!a->ibdiag) { 33389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2*mbs,&a->ibdiag)); 33399566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar))); 3340bbead8a2SBarry Smith } 3341bbead8a2SBarry Smith diag = a->ibdiag; 3342bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3343bbead8a2SBarry Smith /* factor and invert each block */ 3344bbead8a2SBarry Smith switch (bs) { 3345bbead8a2SBarry Smith case 1: 3346bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 33479566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,1,&i,1,&i,diag+i)); 3348ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3349ec1892c8SHong Zhang if (allowzeropivot) { 33507b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33517b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33527b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON)); 335498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3355ec1892c8SHong Zhang } 3356bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3357bbead8a2SBarry Smith } 3358bbead8a2SBarry Smith break; 3359bbead8a2SBarry Smith case 2: 3360bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3361bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 33629566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,2,ij,2,ij,diag)); 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 33647b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3366bbead8a2SBarry Smith diag += 4; 3367bbead8a2SBarry Smith } 3368bbead8a2SBarry Smith break; 3369bbead8a2SBarry Smith case 3: 3370bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3371bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 33729566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,3,ij,3,ij,diag)); 33739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 33747b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3376bbead8a2SBarry Smith diag += 9; 3377bbead8a2SBarry Smith } 3378bbead8a2SBarry Smith break; 3379bbead8a2SBarry Smith case 4: 3380bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3381bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 33829566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,4,ij,4,ij,diag)); 33839566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 33847b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3386bbead8a2SBarry Smith diag += 16; 3387bbead8a2SBarry Smith } 3388bbead8a2SBarry Smith break; 3389bbead8a2SBarry Smith case 5: 3390bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3391bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 33929566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,5,ij,5,ij,diag)); 33939566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 33947b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33959566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3396bbead8a2SBarry Smith diag += 25; 3397bbead8a2SBarry Smith } 3398bbead8a2SBarry Smith break; 3399bbead8a2SBarry Smith case 6: 3400bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3401bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 34029566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,6,ij,6,ij,diag)); 34039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 34047b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3406bbead8a2SBarry Smith diag += 36; 3407bbead8a2SBarry Smith } 3408bbead8a2SBarry Smith break; 3409bbead8a2SBarry Smith case 7: 3410bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3411bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 34129566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,7,ij,7,ij,diag)); 34139566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 34147b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34159566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3416bbead8a2SBarry Smith diag += 49; 3417bbead8a2SBarry Smith } 3418bbead8a2SBarry Smith break; 3419bbead8a2SBarry Smith default: 34209566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ)); 3421bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3422bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3423bbead8a2SBarry Smith IJ[j] = bs*i + j; 3424bbead8a2SBarry Smith } 34259566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bs,IJ,bs,IJ,diag)); 34269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 34277b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34289566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bs)); 3429bbead8a2SBarry Smith diag += bs2; 3430bbead8a2SBarry Smith } 34319566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work,v_pivots,IJ)); 3432bbead8a2SBarry Smith } 3433bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3434bbead8a2SBarry Smith PetscFunctionReturn(0); 3435bbead8a2SBarry Smith } 3436bbead8a2SBarry Smith 343773a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 343873a71a0fSBarry Smith { 343973a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3440fff043a9SJunchao Zhang PetscScalar a,*aa; 344173a71a0fSBarry Smith PetscInt m,n,i,j,col; 344273a71a0fSBarry Smith 344373a71a0fSBarry Smith PetscFunctionBegin; 344473a71a0fSBarry Smith if (!x->assembled) { 34459566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 344673a71a0fSBarry Smith for (i=0; i<m; i++) { 344773a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 34489566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 344973a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 34509566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 345173a71a0fSBarry Smith } 345273a71a0fSBarry Smith } 3453e2ce353bSJunchao Zhang } else { 34549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x,&aa)); 34559566063dSJacob Faibussowitsch for (i=0; i<aij->nz; i++) PetscCall(PetscRandomGetValue(rctx,aa+i)); 34569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x,&aa)); 3457e2ce353bSJunchao Zhang } 34589566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34599566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 346073a71a0fSBarry Smith PetscFunctionReturn(0); 346173a71a0fSBarry Smith } 346273a71a0fSBarry Smith 3463679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3464679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3465679944adSJunchao Zhang { 3466679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3467679944adSJunchao Zhang PetscScalar a; 3468679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3469679944adSJunchao Zhang 3470679944adSJunchao Zhang PetscFunctionBegin; 3471679944adSJunchao Zhang nskip = high - low; 34729566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 3473679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3474679944adSJunchao Zhang for (i=0; i<m; i++) { 3475679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 34769566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 3477679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3478679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34799566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 3480679944adSJunchao Zhang } 3481e2ce353bSJunchao Zhang } 34829566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34839566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 3484679944adSJunchao Zhang PetscFunctionReturn(0); 3485679944adSJunchao Zhang } 3486679944adSJunchao Zhang 3487682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34880a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3489cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3490cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3491cb5b572fSBarry Smith MatMult_SeqAIJ, 349297304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34937c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34947c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 3497f4259b30SLisandro Dalcin NULL, 3498f4259b30SLisandro Dalcin /* 10*/ NULL, 3499cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3500f4259b30SLisandro Dalcin NULL, 350141f059aeSBarry Smith MatSOR_SeqAIJ, 350291e9d3e2SHong Zhang MatTranspose_SeqAIJ, 350397304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3504cb5b572fSBarry Smith MatEqual_SeqAIJ, 3505cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3506cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3507cb5b572fSBarry Smith MatNorm_SeqAIJ, 3508f4259b30SLisandro Dalcin /* 20*/ NULL, 3509cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3510cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3511cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3512d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 3516f4259b30SLisandro Dalcin NULL, 35174994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520f4259b30SLisandro Dalcin NULL, 3521f4259b30SLisandro Dalcin NULL, 3522d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3523f4259b30SLisandro Dalcin NULL, 3524f4259b30SLisandro Dalcin NULL, 3525cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3526f4259b30SLisandro Dalcin NULL, 3527d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35287dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3529cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3530cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3531cb5b572fSBarry Smith MatCopy_SeqAIJ, 3532d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3533cb5b572fSBarry Smith MatScale_SeqAIJ, 35347d68702bSBarry Smith MatShift_SeqAIJ, 353579299369SBarry Smith MatDiagonalSet_SeqAIJ, 35366e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 353773a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35383b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35393b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35403b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3541a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 354293dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545cda55fadSBarry Smith MatPermute_SeqAIJ, 3546f4259b30SLisandro Dalcin NULL, 3547f4259b30SLisandro Dalcin /* 59*/ NULL, 3548b9b97703SBarry Smith MatDestroy_SeqAIJ, 3549b9b97703SBarry Smith MatView_SeqAIJ, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin /* 64*/ NULL, 3553321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 3557d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3558c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin /* 74*/ NULL, 35633acb8795SBarry Smith MatFDColoringApply_AIJ, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin NULL, 35676ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3568f4259b30SLisandro Dalcin NULL, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 3571bc011b1eSHong Zhang MatLoad_SeqAIJ, 3572d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35731cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro Dalcin NULL, 3577f4259b30SLisandro Dalcin /* 89*/ NULL, 3578f4259b30SLisandro Dalcin NULL, 357926be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3580f4259b30SLisandro Dalcin NULL, 3581f4259b30SLisandro Dalcin NULL, 35828fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3583f4259b30SLisandro Dalcin NULL, 3584f4259b30SLisandro Dalcin NULL, 35856fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3586f4259b30SLisandro Dalcin NULL, 35874222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 359087d4246cSBarry Smith MatConjugate_SeqAIJ, 3591f4259b30SLisandro Dalcin NULL, 3592d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 359399cafbc1SBarry Smith MatRealPart_SeqAIJ, 3594f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin NULL, 3597cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3598f4259b30SLisandro Dalcin NULL, 35992af78befSBarry Smith MatGetRowMin_SeqAIJ, 3600f4259b30SLisandro Dalcin NULL, 3601599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3602f4259b30SLisandro Dalcin /*114*/ NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin NULL, 3607f4259b30SLisandro Dalcin /*119*/ NULL, 3608f4259b30SLisandro Dalcin NULL, 3609f4259b30SLisandro Dalcin NULL, 3610f4259b30SLisandro Dalcin NULL, 3611b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36120716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3613a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 361437868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36150da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3616f4259b30SLisandro Dalcin NULL, 3617f4259b30SLisandro Dalcin /*129*/ NULL, 3618f4259b30SLisandro Dalcin NULL, 3619f4259b30SLisandro Dalcin NULL, 362075648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3621b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3622b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36232b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3624f4259b30SLisandro Dalcin NULL, 3625f4259b30SLisandro Dalcin NULL, 36263964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3627f4259b30SLisandro Dalcin /*139*/NULL, 3628f4259b30SLisandro Dalcin NULL, 3629f4259b30SLisandro Dalcin NULL, 36303a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36319c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36324222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36334222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 3634f4259b30SLisandro Dalcin NULL, 3635f4259b30SLisandro Dalcin NULL 36369e29f15eSvictorle }; 363717ab2063SBarry Smith 36387087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3639bef8e0ddSBarry Smith { 3640bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 364197f1f81fSBarry Smith PetscInt i,nz,n; 3642bef8e0ddSBarry Smith 3643bef8e0ddSBarry Smith PetscFunctionBegin; 3644bef8e0ddSBarry Smith nz = aij->maxnz; 3645d0f46423SBarry Smith n = mat->rmap->n; 3646bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3647bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3648bef8e0ddSBarry Smith } 3649bef8e0ddSBarry Smith aij->nz = nz; 3650bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3651bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3652bef8e0ddSBarry Smith } 3653bef8e0ddSBarry Smith PetscFunctionReturn(0); 3654bef8e0ddSBarry Smith } 3655bef8e0ddSBarry Smith 3656a3bb6f32SFande Kong /* 3657ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3658ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3659ddea5d60SJunchao Zhang */ 3660a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3661a3bb6f32SFande Kong { 3662a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3663a3bb6f32SFande Kong PetscTable gid1_lid1; 3664a3bb6f32SFande Kong PetscTablePosition tpos; 366525b670f0SStefano Zampini PetscInt gid,lid,i,ec,nz = aij->nz; 366625b670f0SStefano Zampini PetscInt *garray,*jj = aij->j; 3667a3bb6f32SFande Kong 3668a3bb6f32SFande Kong PetscFunctionBegin; 3669a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3670a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3671a3bb6f32SFande Kong /* use a table */ 36729566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1)); 3673a3bb6f32SFande Kong ec = 0; 367425b670f0SStefano Zampini for (i=0; i<nz; i++) { 367525b670f0SStefano Zampini PetscInt data,gid1 = jj[i] + 1; 36769566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&data)); 3677a3bb6f32SFande Kong if (!data) { 3678a3bb6f32SFande Kong /* one based table */ 36799566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES)); 3680a3bb6f32SFande Kong } 3681a3bb6f32SFande Kong } 3682a3bb6f32SFande Kong /* form array of columns we need */ 36839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec,&garray)); 36849566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1,&tpos)); 3685a3bb6f32SFande Kong while (tpos) { 36869566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid)); 3687a3bb6f32SFande Kong gid--; 3688a3bb6f32SFande Kong lid--; 3689a3bb6f32SFande Kong garray[lid] = gid; 3690a3bb6f32SFande Kong } 36919566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec,garray)); /* sort, and rebuild */ 36929566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 3693a3bb6f32SFande Kong for (i=0; i<ec; i++) { 36949566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES)); 3695a3bb6f32SFande Kong } 3696a3bb6f32SFande Kong /* compact out the extra columns in B */ 369725b670f0SStefano Zampini for (i=0; i<nz; i++) { 369825b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36999566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&lid)); 3700a3bb6f32SFande Kong lid--; 370125b670f0SStefano Zampini jj[i] = lid; 3702a3bb6f32SFande Kong } 37039566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 37049566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 37059566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap)); 37069566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping)); 37079566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH)); 3708a3bb6f32SFande Kong PetscFunctionReturn(0); 3709a3bb6f32SFande Kong } 3710a3bb6f32SFande Kong 3711bef8e0ddSBarry Smith /*@ 3712bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3713bef8e0ddSBarry Smith in the matrix. 3714bef8e0ddSBarry Smith 3715bef8e0ddSBarry Smith Input Parameters: 3716bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3717bef8e0ddSBarry Smith - indices - the column indices 3718bef8e0ddSBarry Smith 371915091d37SBarry Smith Level: advanced 372015091d37SBarry Smith 3721bef8e0ddSBarry Smith Notes: 3722bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3723bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3724bef8e0ddSBarry Smith of the MatSetValues() operation. 3725bef8e0ddSBarry Smith 3726bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3727d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3728bef8e0ddSBarry Smith 3729bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3730bef8e0ddSBarry Smith 3731b9617806SBarry Smith The indices should start with zero, not one. 3732b9617806SBarry Smith 3733bef8e0ddSBarry Smith @*/ 37347087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3735bef8e0ddSBarry Smith { 3736bef8e0ddSBarry Smith PetscFunctionBegin; 37370700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3738dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices,2); 3739cac4c232SBarry Smith PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices)); 3740bef8e0ddSBarry Smith PetscFunctionReturn(0); 3741bef8e0ddSBarry Smith } 3742bef8e0ddSBarry Smith 3743be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3744be6bf707SBarry Smith 37457087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3746be6bf707SBarry Smith { 3747be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3748d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3749be6bf707SBarry Smith 3750be6bf707SBarry Smith PetscFunctionBegin; 375128b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3752be6bf707SBarry Smith 3753be6bf707SBarry Smith /* allocate space for values if not already there */ 3754be6bf707SBarry Smith if (!aij->saved_values) { 37559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&aij->saved_values)); 37569566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar))); 3757be6bf707SBarry Smith } 3758be6bf707SBarry Smith 3759be6bf707SBarry Smith /* copy values over */ 37609566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values,aij->a,nz)); 3761be6bf707SBarry Smith PetscFunctionReturn(0); 3762be6bf707SBarry Smith } 3763be6bf707SBarry Smith 3764be6bf707SBarry Smith /*@ 3765be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3766be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3767be6bf707SBarry Smith nonlinear portion. 3768be6bf707SBarry Smith 3769be6bf707SBarry Smith Collect on Mat 3770be6bf707SBarry Smith 3771be6bf707SBarry Smith Input Parameters: 37720e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3773be6bf707SBarry Smith 377415091d37SBarry Smith Level: advanced 377515091d37SBarry Smith 3776be6bf707SBarry Smith Common Usage, with SNESSolve(): 3777be6bf707SBarry Smith $ Create Jacobian matrix 3778be6bf707SBarry Smith $ Set linear terms into matrix 3779be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3780be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3781be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3782512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3783be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3784be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3785be6bf707SBarry Smith $ In your Jacobian routine 3786be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3787be6bf707SBarry Smith $ Set nonlinear terms in matrix 3788be6bf707SBarry Smith 3789be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3790be6bf707SBarry Smith $ // build linear portion of Jacobian 3791512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3792be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3793be6bf707SBarry Smith $ loop over nonlinear iterations 3794be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3795be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3796be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3797be6bf707SBarry Smith $ Solve linear system with Jacobian 3798be6bf707SBarry Smith $ endloop 3799be6bf707SBarry Smith 3800be6bf707SBarry Smith Notes: 3801be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3802512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3803be6bf707SBarry Smith calling this routine. 3804be6bf707SBarry Smith 38050c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 38060c468ba9SBarry Smith and does not allocated additional space. 38070c468ba9SBarry Smith 3808db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3809be6bf707SBarry Smith 3810be6bf707SBarry Smith @*/ 38117087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3812be6bf707SBarry Smith { 3813be6bf707SBarry Smith PetscFunctionBegin; 38140700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 381528b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 381628b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3817cac4c232SBarry Smith PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat)); 3818be6bf707SBarry Smith PetscFunctionReturn(0); 3819be6bf707SBarry Smith } 3820be6bf707SBarry Smith 38217087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3822be6bf707SBarry Smith { 3823be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3824d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3825be6bf707SBarry Smith 3826be6bf707SBarry Smith PetscFunctionBegin; 382728b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 382828b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3829be6bf707SBarry Smith /* copy values over */ 38309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a,aij->saved_values,nz)); 3831be6bf707SBarry Smith PetscFunctionReturn(0); 3832be6bf707SBarry Smith } 3833be6bf707SBarry Smith 3834be6bf707SBarry Smith /*@ 3835be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3836be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3837be6bf707SBarry Smith nonlinear portion. 3838be6bf707SBarry Smith 3839be6bf707SBarry Smith Collect on Mat 3840be6bf707SBarry Smith 3841be6bf707SBarry Smith Input Parameters: 3842386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3843be6bf707SBarry Smith 384415091d37SBarry Smith Level: advanced 384515091d37SBarry Smith 3846db781477SPatrick Sanan .seealso: `MatStoreValues()` 3847be6bf707SBarry Smith 3848be6bf707SBarry Smith @*/ 38497087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3850be6bf707SBarry Smith { 3851be6bf707SBarry Smith PetscFunctionBegin; 38520700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 385328b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 385428b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3855cac4c232SBarry Smith PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat)); 3856be6bf707SBarry Smith PetscFunctionReturn(0); 3857be6bf707SBarry Smith } 3858be6bf707SBarry Smith 3859be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 386017ab2063SBarry Smith /*@C 3861682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 38620d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38636e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 386451c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38652bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 386617ab2063SBarry Smith 3867d083f849SBarry Smith Collective 3868db81eaa0SLois Curfman McInnes 386917ab2063SBarry Smith Input Parameters: 3870db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 387117ab2063SBarry Smith . m - number of rows 387217ab2063SBarry Smith . n - number of columns 387317ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 387451c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38750298fd71SBarry Smith (possibly different for each row) or NULL 387617ab2063SBarry Smith 387717ab2063SBarry Smith Output Parameter: 3878416022c9SBarry Smith . A - the matrix 387917ab2063SBarry Smith 3880175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3881f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3882175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3883175b88e8SBarry Smith 3884b259b22eSLois Curfman McInnes Notes: 388549a6f317SBarry Smith If nnz is given then nz is ignored 388649a6f317SBarry Smith 388717ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 388817ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 38890002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 389044cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 389117ab2063SBarry Smith 389217ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38930298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 38943d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38956da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 389617ab2063SBarry Smith 3897682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38984fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3899682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 39006c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 39016c7ebb05SLois Curfman McInnes 39026c7ebb05SLois Curfman McInnes Options Database Keys: 3903698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 39049db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 390517ab2063SBarry Smith 3906027ccd11SLois Curfman McInnes Level: intermediate 3907027ccd11SLois Curfman McInnes 3908db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 390936db0b34SBarry Smith 391017ab2063SBarry Smith @*/ 39117087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 391217ab2063SBarry Smith { 39133a40ed3dSBarry Smith PetscFunctionBegin; 39149566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,A)); 39159566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A,m,n,m,n)); 39169566063dSJacob Faibussowitsch PetscCall(MatSetType(*A,MATSEQAIJ)); 39179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz)); 3918273d9f13SBarry Smith PetscFunctionReturn(0); 3919273d9f13SBarry Smith } 3920273d9f13SBarry Smith 3921273d9f13SBarry Smith /*@C 3922273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3923273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3924273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3925273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3926273d9f13SBarry Smith 3927d083f849SBarry Smith Collective 3928273d9f13SBarry Smith 3929273d9f13SBarry Smith Input Parameters: 39301c4f3114SJed Brown + B - The matrix 3931273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3932273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39330298fd71SBarry Smith (possibly different for each row) or NULL 3934273d9f13SBarry Smith 3935273d9f13SBarry Smith Notes: 393649a6f317SBarry Smith If nnz is given then nz is ignored 393749a6f317SBarry Smith 3938273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3939273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3940273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3941273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3942273d9f13SBarry Smith 3943273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 39440298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3945273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3946273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3947273d9f13SBarry Smith 3948aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3949aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3950aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3951aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3952aa95bbe8SBarry Smith 3953a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3954a96a251dSBarry Smith entries or columns indices 3955a96a251dSBarry Smith 3956273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3957273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3958273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3959273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3960273d9f13SBarry Smith 3961273d9f13SBarry Smith Options Database Keys: 3962698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 396347b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3964273d9f13SBarry Smith 3965273d9f13SBarry Smith Level: intermediate 3966273d9f13SBarry Smith 3967db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3968db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3969273d9f13SBarry Smith 3970273d9f13SBarry Smith @*/ 39717087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3972273d9f13SBarry Smith { 3973a23d5eceSKris Buschelman PetscFunctionBegin; 39746ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 39756ba663aaSJed Brown PetscValidType(B,1); 3976cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz)); 3977a23d5eceSKris Buschelman PetscFunctionReturn(0); 3978a23d5eceSKris Buschelman } 3979a23d5eceSKris Buschelman 39807087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3981a23d5eceSKris Buschelman { 3982273d9f13SBarry Smith Mat_SeqAIJ *b; 39832576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 398497f1f81fSBarry Smith PetscInt i; 3985273d9f13SBarry Smith 3986273d9f13SBarry Smith PetscFunctionBegin; 39872576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3988a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3989c461c341SBarry Smith skipallocation = PETSC_TRUE; 3990c461c341SBarry Smith nz = 0; 3991c461c341SBarry Smith } 39929566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39939566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3994899cda47SBarry Smith 3995435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 399608401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %" PetscInt_FMT,nz); 3997cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3998d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 399908401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT,i,nnz[i]); 400008401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT,i,nnz[i],B->cmap->n); 4001b73539f3SBarry Smith } 4002b73539f3SBarry Smith } 4003b73539f3SBarry Smith 4004273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 40052205254eSKarl Rupp 4006273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 4007273d9f13SBarry Smith 4008ab93d7beSBarry Smith if (!skipallocation) { 40092ee49352SLisandro Dalcin if (!b->imax) { 40109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->imax)); 40119566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4012071fcb05SBarry Smith } 4013071fcb05SBarry Smith if (!b->ilen) { 4014071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. */ 40159566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n,&b->ilen)); 40169566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4017071fcb05SBarry Smith } else { 40189566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt))); 40192ee49352SLisandro Dalcin } 4020846b4da1SFande Kong if (!b->ipre) { 40219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->ipre)); 40229566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4023846b4da1SFande Kong } 4024273d9f13SBarry Smith if (!nnz) { 4025435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4026c62bd62aSJed Brown else if (nz < 0) nz = 1; 40275d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 4028d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 4029d0f46423SBarry Smith nz = nz*B->rmap->n; 4030273d9f13SBarry Smith } else { 4031c73702f5SBarry Smith PetscInt64 nz64 = 0; 4032c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 40339566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64,&nz)); 4034273d9f13SBarry Smith } 4035ab93d7beSBarry Smith 4036273d9f13SBarry Smith /* allocate the matrix space */ 403753dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? */ 40389566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i)); 4039396832f4SHong Zhang if (B->structure_only) { 40409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&b->j)); 40419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n+1,&b->i)); 40429566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt))); 4043396832f4SHong Zhang } else { 40449566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i)); 40459566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)))); 4046396832f4SHong Zhang } 4047bfeeae90SHong Zhang b->i[0] = 0; 4048d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 40495da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 40505da197adSKris Buschelman } 4051396832f4SHong Zhang if (B->structure_only) { 4052396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4053396832f4SHong Zhang b->free_a = PETSC_FALSE; 4054396832f4SHong Zhang } else { 4055273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4056e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4057396832f4SHong Zhang } 4058e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4059c461c341SBarry Smith } else { 4060e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4061e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4062c461c341SBarry Smith } 4063273d9f13SBarry Smith 4064846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4065846b4da1SFande Kong /* reserve user-requested sparsity */ 40669566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre,b->imax,B->rmap->n)); 4067846b4da1SFande Kong } 4068846b4da1SFande Kong 4069273d9f13SBarry Smith b->nz = 0; 4070273d9f13SBarry Smith b->maxnz = nz; 4071273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40722205254eSKarl Rupp if (realalloc) { 40739566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE)); 40742205254eSKarl Rupp } 4075cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4076cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40775519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40785519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40795519a089SJose E. Roman */ 40805519a089SJose E. Roman B->nonzerostate++; 4081273d9f13SBarry Smith PetscFunctionReturn(0); 4082273d9f13SBarry Smith } 4083273d9f13SBarry Smith 4084846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4085846b4da1SFande Kong { 4086846b4da1SFande Kong Mat_SeqAIJ *a; 4087a5bbaf83SFande Kong PetscInt i; 4088846b4da1SFande Kong 4089846b4da1SFande Kong PetscFunctionBegin; 4090846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 409114d0e64fSAlex Lindsay 409214d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 409314d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 409414d0e64fSAlex Lindsay 4095846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 40962c814fdeSFande Kong /* if no saved info, we error out */ 409728b400f6SJacob Faibussowitsch PetscCheck(a->ipre,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info "); 40982c814fdeSFande Kong 4099aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation "); 41002c814fdeSFande Kong 41019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax,a->ipre,A->rmap->n)); 41029566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen,A->rmap->n)); 4103846b4da1SFande Kong a->i[0] = 0; 4104846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4105846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4106846b4da1SFande Kong } 4107846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4108846b4da1SFande Kong a->nz = 0; 4109846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4110846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4111846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4112846b4da1SFande Kong A->assembled = PETSC_FALSE; 4113846b4da1SFande Kong PetscFunctionReturn(0); 4114846b4da1SFande Kong } 4115846b4da1SFande Kong 411658d36128SBarry Smith /*@ 4117a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4118a1661176SMatthew Knepley 4119a1661176SMatthew Knepley Input Parameters: 4120a1661176SMatthew Knepley + B - the matrix 4121a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4122a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4123a1661176SMatthew Knepley - v - optional values in the matrix 4124a1661176SMatthew Knepley 4125a1661176SMatthew Knepley Level: developer 4126a1661176SMatthew Knepley 41276a9b8d82SBarry Smith Notes: 412858d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 412958d36128SBarry Smith 41306a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41316a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41326a9b8d82SBarry Smith 41336a9b8d82SBarry Smith Developer Notes: 41346a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 41356a9b8d82SBarry Smith then just copies the v values directly with PetscMemcpy(). 41366a9b8d82SBarry Smith 41376a9b8d82SBarry Smith This routine could also take a PetscCopyMode argument to allow sharing the values instead of always copying them. 41386a9b8d82SBarry Smith 4139db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4140a1661176SMatthew Knepley @*/ 4141a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4142a1661176SMatthew Knepley { 4143a1661176SMatthew Knepley PetscFunctionBegin; 41440700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 41456ba663aaSJed Brown PetscValidType(B,1); 4146cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v)); 4147a1661176SMatthew Knepley PetscFunctionReturn(0); 4148a1661176SMatthew Knepley } 4149a1661176SMatthew Knepley 41507087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4151a1661176SMatthew Knepley { 4152a1661176SMatthew Knepley PetscInt i; 4153a1661176SMatthew Knepley PetscInt m,n; 4154a1661176SMatthew Knepley PetscInt nz; 41556a9b8d82SBarry Smith PetscInt *nnz; 4156a1661176SMatthew Knepley 4157a1661176SMatthew Knepley PetscFunctionBegin; 4158aed4548fSBarry Smith PetscCheck(Ii[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4159779a8d59SSatish Balay 41609566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41619566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4162779a8d59SSatish Balay 41639566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1, &nnz)); 4165a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4166b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 416708401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4168a1661176SMatthew Knepley nnz[i] = nz; 4169a1661176SMatthew Knepley } 41709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41719566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4172a1661176SMatthew Knepley 4173a1661176SMatthew Knepley for (i = 0; i < m; i++) { 41749566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4175a1661176SMatthew Knepley } 4176a1661176SMatthew Knepley 41779566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 41789566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 4179a1661176SMatthew Knepley 41809566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE)); 4181a1661176SMatthew Knepley PetscFunctionReturn(0); 4182a1661176SMatthew Knepley } 4183a1661176SMatthew Knepley 4184ad7e164aSPierre Jolivet /*@ 4185ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4186ad7e164aSPierre Jolivet 4187ad7e164aSPierre Jolivet Input Parameters: 4188ad7e164aSPierre Jolivet + A - left-hand side matrix 4189ad7e164aSPierre Jolivet . B - right-hand side matrix 4190ad7e164aSPierre Jolivet - reuse - either MAT_INITIAL_MATRIX or MAT_REUSE_MATRIX 4191ad7e164aSPierre Jolivet 4192ad7e164aSPierre Jolivet Output Parameter: 4193ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4194ad7e164aSPierre Jolivet 4195ad7e164aSPierre Jolivet Level: intermediate 4196ad7e164aSPierre Jolivet 4197ad7e164aSPierre Jolivet Notes: 4198ad7e164aSPierre Jolivet MAT_REUSE_MATRIX can only be used when the nonzero structure of the product matrix has not changed from that last call to MatSeqAIJKron(). 4199ad7e164aSPierre Jolivet 4200db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4201ad7e164aSPierre Jolivet @*/ 4202ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron(Mat A,Mat B,MatReuse reuse,Mat *C) 4203ad7e164aSPierre Jolivet { 4204ad7e164aSPierre Jolivet PetscFunctionBegin; 4205ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A,MAT_CLASSID,1); 4206ad7e164aSPierre Jolivet PetscValidType(A,1); 4207ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B,MAT_CLASSID,2); 4208ad7e164aSPierre Jolivet PetscValidType(B,2); 4209ad7e164aSPierre Jolivet PetscValidPointer(C,4); 4210ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4211ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C,MAT_CLASSID,4); 4212ad7e164aSPierre Jolivet PetscValidType(*C,4); 4213ad7e164aSPierre Jolivet } 4214cac4c232SBarry Smith PetscTryMethod(A,"MatSeqAIJKron_C",(Mat,Mat,MatReuse,Mat*),(A,B,reuse,C)); 4215ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4216ad7e164aSPierre Jolivet } 4217ad7e164aSPierre Jolivet 4218ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A,Mat B,MatReuse reuse,Mat *C) 4219ad7e164aSPierre Jolivet { 4220ad7e164aSPierre Jolivet Mat newmat; 4221ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4222ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 4223ad7e164aSPierre Jolivet PetscScalar *v; 4224fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 4225ad7e164aSPierre Jolivet PetscInt *i,*j,m,n,p,q,nnz = 0,am = A->rmap->n,bm = B->rmap->n,an = A->cmap->n, bn = B->cmap->n; 4226ad7e164aSPierre Jolivet PetscBool flg; 4227ad7e164aSPierre Jolivet 4228ad7e164aSPierre Jolivet PetscFunctionBegin; 422928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 423028b400f6SJacob Faibussowitsch PetscCheck(A->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 423128b400f6SJacob Faibussowitsch PetscCheck(!B->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 423228b400f6SJacob Faibussowitsch PetscCheck(B->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 42339566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&flg)); 423428b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatType %s",((PetscObject)B)->type_name); 4235aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatReuse %d",(int)reuse); 4236ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42379566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am*bm+1,&i,a->i[am]*b->i[bm],&j)); 42389566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF,&newmat)); 42399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat,am*bm,an*bn,am*bm,an*bn)); 42409566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat,MATAIJ)); 4241ad7e164aSPierre Jolivet i[0] = 0; 4242ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4243ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4244ad7e164aSPierre Jolivet i[m*bm + p + 1] = i[m*bm + p] + (a->i[m+1] - a->i[m]) * (b->i[p+1] - b->i[p]); 4245ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4246ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4247ad7e164aSPierre Jolivet j[nnz++] = a->j[n]*bn + b->j[q]; 4248ad7e164aSPierre Jolivet } 4249ad7e164aSPierre Jolivet } 4250ad7e164aSPierre Jolivet } 4251ad7e164aSPierre Jolivet } 42529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat,i,j,NULL)); 4253ad7e164aSPierre Jolivet *C = newmat; 42549566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4255ad7e164aSPierre Jolivet nnz = 0; 4256ad7e164aSPierre Jolivet } 42579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C,&v)); 42589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 42599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 4260ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4261ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4262ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4263ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4264fff043a9SJunchao Zhang v[nnz++] = aa[n] * ba[q]; 4265ad7e164aSPierre Jolivet } 4266ad7e164aSPierre Jolivet } 4267ad7e164aSPierre Jolivet } 4268ad7e164aSPierre Jolivet } 42699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C,&v)); 42709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 42719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 4272ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4273ad7e164aSPierre Jolivet } 4274ad7e164aSPierre Jolivet 4275c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4276af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4277170fe5c8SBarry Smith 4278170fe5c8SBarry Smith /* 4279170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4280170fe5c8SBarry Smith 4281170fe5c8SBarry Smith n p p 42822da392ccSBarry Smith [ ] [ ] [ ] 42832da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42842da392ccSBarry Smith [ ] [ ] [ ] 4285170fe5c8SBarry Smith 4286170fe5c8SBarry Smith */ 4287170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4288170fe5c8SBarry Smith { 4289170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4290170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4291170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 429286214ceeSStefano Zampini PetscInt i,j,n,m,q,p; 4293170fe5c8SBarry Smith const PetscInt *ii,*idx; 4294170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4295170fe5c8SBarry Smith PetscScalar *c,*c_q; 429686214ceeSStefano Zampini PetscInt clda = sub_c->lda; 429786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4298170fe5c8SBarry Smith 4299170fe5c8SBarry Smith PetscFunctionBegin; 4300d0f46423SBarry Smith m = A->rmap->n; 4301d0f46423SBarry Smith n = A->cmap->n; 4302d0f46423SBarry Smith p = B->cmap->n; 4303170fe5c8SBarry Smith a = sub_a->v; 4304170fe5c8SBarry Smith b = sub_b->a; 4305170fe5c8SBarry Smith c = sub_c->v; 430686214ceeSStefano Zampini if (clda == m) { 43079566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c,m*p)); 430886214ceeSStefano Zampini } else { 430986214ceeSStefano Zampini for (j=0;j<p;j++) 431086214ceeSStefano Zampini for (i=0;i<m;i++) 431186214ceeSStefano Zampini c[j*clda + i] = 0.0; 431286214ceeSStefano Zampini } 4313170fe5c8SBarry Smith ii = sub_b->i; 4314170fe5c8SBarry Smith idx = sub_b->j; 4315170fe5c8SBarry Smith for (i=0; i<n; i++) { 4316170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4317170fe5c8SBarry Smith while (q-->0) { 431886214ceeSStefano Zampini c_q = c + clda*(*idx); 431986214ceeSStefano Zampini a_q = a + alda*i; 4320854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4321170fe5c8SBarry Smith idx++; 4322170fe5c8SBarry Smith b++; 4323170fe5c8SBarry Smith } 4324170fe5c8SBarry Smith } 4325170fe5c8SBarry Smith PetscFunctionReturn(0); 4326170fe5c8SBarry Smith } 4327170fe5c8SBarry Smith 43284222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4329170fe5c8SBarry Smith { 4330d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 433186214ceeSStefano Zampini PetscBool cisdense; 4332170fe5c8SBarry Smith 4333170fe5c8SBarry Smith PetscFunctionBegin; 433408401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT,A->cmap->n,B->rmap->n); 43359566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,m,n,m,n)); 43369566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C,A,B)); 43379566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"")); 433886214ceeSStefano Zampini if (!cisdense) { 43399566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATDENSE)); 434086214ceeSStefano Zampini } 43419566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4342d73949e8SHong Zhang 43434222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4344170fe5c8SBarry Smith PetscFunctionReturn(0); 4345170fe5c8SBarry Smith } 4346170fe5c8SBarry Smith 4347170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 43480bad9183SKris Buschelman /*MC 4349fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43500bad9183SKris Buschelman based on compressed sparse row format. 43510bad9183SKris Buschelman 43520bad9183SKris Buschelman Options Database Keys: 43530bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43540bad9183SKris Buschelman 43550bad9183SKris Buschelman Level: beginner 43560bad9183SKris Buschelman 43570cd7f59aSBarry Smith Notes: 43580cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 43590cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43600cd7f59aSBarry Smith in the matrix 43610cd7f59aSBarry Smith 43620cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. In this no 43630cd7f59aSBarry Smith space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored 43640cd7f59aSBarry Smith 43650cd7f59aSBarry Smith Developer Notes: 43660cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 43670cd7f59aSBarry Smith 4368db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43690bad9183SKris Buschelman M*/ 43700bad9183SKris Buschelman 4371ccd284c7SBarry Smith /*MC 4372ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4373ccd284c7SBarry Smith 4374ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJ when constructed with a single process communicator, 4375ccd284c7SBarry Smith and MATMPIAIJ otherwise. As a result, for single process communicators, 4376ed73aabaSBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4377ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4378ccd284c7SBarry Smith the above preallocation routines for simplicity. 4379ccd284c7SBarry Smith 4380ccd284c7SBarry Smith Options Database Keys: 4381ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions() 4382ccd284c7SBarry Smith 438395452b02SPatrick Sanan Developer Notes: 4384ca9cdca7SRichard Tran Mills Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when 4385ccd284c7SBarry Smith enough exist. 4386ccd284c7SBarry Smith 4387ccd284c7SBarry Smith Level: beginner 4388ccd284c7SBarry Smith 4389db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4390ccd284c7SBarry Smith M*/ 4391ccd284c7SBarry Smith 4392ccd284c7SBarry Smith /*MC 4393ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4394ccd284c7SBarry Smith 4395ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4396ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4397ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4398ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4399ccd284c7SBarry Smith the above preallocation routines for simplicity. 4400ccd284c7SBarry Smith 4401ccd284c7SBarry Smith Options Database Keys: 4402ccd284c7SBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4403ccd284c7SBarry Smith 4404ccd284c7SBarry Smith Level: beginner 4405ccd284c7SBarry Smith 4406c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4407ccd284c7SBarry Smith M*/ 4408ccd284c7SBarry Smith 44097906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 44107906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 44117906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 44127906f579SHong Zhang #endif 4413d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4414d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*); 4415d24d4204SJose E. Roman #endif 44167906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 44177906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 44187906f579SHong Zhang #endif 44197906f579SHong Zhang 4420d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4421c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 44224222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 44237906f579SHong Zhang 44248c778c55SBarry Smith /*@C 44258f1ea47aSStefano Zampini MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored 44268c778c55SBarry Smith 44278c778c55SBarry Smith Not Collective 44288c778c55SBarry Smith 44298c778c55SBarry Smith Input Parameter: 4430579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 44318c778c55SBarry Smith 44328c778c55SBarry Smith Output Parameter: 44338c778c55SBarry Smith . array - pointer to the data 44348c778c55SBarry Smith 44358c778c55SBarry Smith Level: intermediate 44368c778c55SBarry Smith 4437db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44388c778c55SBarry Smith @*/ 44398c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 44408c778c55SBarry Smith { 4441d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44428c778c55SBarry Smith 44438c778c55SBarry Smith PetscFunctionBegin; 4444d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44459566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A,array)); 4446d67d9f35SJunchao Zhang } else { 4447d67d9f35SJunchao Zhang *array = aij->a; 4448d67d9f35SJunchao Zhang } 4449d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4450d67d9f35SJunchao Zhang } 4451d67d9f35SJunchao Zhang 4452d67d9f35SJunchao Zhang /*@C 4453d67d9f35SJunchao Zhang MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray() 4454d67d9f35SJunchao Zhang 4455d67d9f35SJunchao Zhang Not Collective 4456d67d9f35SJunchao Zhang 4457d67d9f35SJunchao Zhang Input Parameters: 4458d67d9f35SJunchao Zhang + mat - a MATSEQAIJ matrix 4459d67d9f35SJunchao Zhang - array - pointer to the data 4460d67d9f35SJunchao Zhang 4461d67d9f35SJunchao Zhang Level: intermediate 4462d67d9f35SJunchao Zhang 4463db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4464d67d9f35SJunchao Zhang @*/ 4465d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 4466d67d9f35SJunchao Zhang { 4467d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4468d67d9f35SJunchao Zhang 4469d67d9f35SJunchao Zhang PetscFunctionBegin; 4470d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44719566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A,array)); 4472d67d9f35SJunchao Zhang } else { 4473d67d9f35SJunchao Zhang *array = NULL; 4474d67d9f35SJunchao Zhang } 44759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44769566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44778c778c55SBarry Smith PetscFunctionReturn(0); 44788c778c55SBarry Smith } 44798c778c55SBarry Smith 448021e72a00SBarry Smith /*@C 44818f1ea47aSStefano Zampini MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored 44828f1ea47aSStefano Zampini 44838f1ea47aSStefano Zampini Not Collective 44848f1ea47aSStefano Zampini 44858f1ea47aSStefano Zampini Input Parameter: 44868f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44878f1ea47aSStefano Zampini 44888f1ea47aSStefano Zampini Output Parameter: 44898f1ea47aSStefano Zampini . array - pointer to the data 44908f1ea47aSStefano Zampini 44918f1ea47aSStefano Zampini Level: intermediate 44928f1ea47aSStefano Zampini 4493db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44948f1ea47aSStefano Zampini @*/ 44958f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 44968f1ea47aSStefano Zampini { 4497d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44988f1ea47aSStefano Zampini 44998f1ea47aSStefano Zampini PetscFunctionBegin; 4500d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 45019566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A,array)); 4502d67d9f35SJunchao Zhang } else { 4503d67d9f35SJunchao Zhang *array = aij->a; 4504d67d9f35SJunchao Zhang } 45058f1ea47aSStefano Zampini PetscFunctionReturn(0); 45068f1ea47aSStefano Zampini } 45078f1ea47aSStefano Zampini 45088f1ea47aSStefano Zampini /*@C 45098f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 45108f1ea47aSStefano Zampini 45118f1ea47aSStefano Zampini Not Collective 45128f1ea47aSStefano Zampini 45138f1ea47aSStefano Zampini Input Parameter: 45148f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 45158f1ea47aSStefano Zampini 45168f1ea47aSStefano Zampini Output Parameter: 45178f1ea47aSStefano Zampini . array - pointer to the data 45188f1ea47aSStefano Zampini 45198f1ea47aSStefano Zampini Level: intermediate 45208f1ea47aSStefano Zampini 4521db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45228f1ea47aSStefano Zampini @*/ 45238f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 45248f1ea47aSStefano Zampini { 4525d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 45268f1ea47aSStefano Zampini 45278f1ea47aSStefano Zampini PetscFunctionBegin; 4528d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45299566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A,array)); 4530d67d9f35SJunchao Zhang } else { 4531d67d9f35SJunchao Zhang *array = NULL; 4532d67d9f35SJunchao Zhang } 4533d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4534d67d9f35SJunchao Zhang } 4535d67d9f35SJunchao Zhang 4536d67d9f35SJunchao Zhang /*@C 4537d67d9f35SJunchao Zhang MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a MATSEQAIJ matrix is stored 4538d67d9f35SJunchao Zhang 4539d67d9f35SJunchao Zhang Not Collective 4540d67d9f35SJunchao Zhang 4541d67d9f35SJunchao Zhang Input Parameter: 4542d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4543d67d9f35SJunchao Zhang 4544d67d9f35SJunchao Zhang Output Parameter: 4545d67d9f35SJunchao Zhang . array - pointer to the data 4546d67d9f35SJunchao Zhang 4547d67d9f35SJunchao Zhang Level: intermediate 4548d67d9f35SJunchao Zhang 4549db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4550d67d9f35SJunchao Zhang @*/ 4551d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJGetArrayWrite(Mat A,PetscScalar **array) 4552d67d9f35SJunchao Zhang { 4553d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4554d67d9f35SJunchao Zhang 4555d67d9f35SJunchao Zhang PetscFunctionBegin; 4556d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45579566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A,array)); 4558d67d9f35SJunchao Zhang } else { 4559d67d9f35SJunchao Zhang *array = aij->a; 4560d67d9f35SJunchao Zhang } 45619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45629566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4563d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4564d67d9f35SJunchao Zhang } 4565d67d9f35SJunchao Zhang 4566d67d9f35SJunchao Zhang /*@C 4567d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4568d67d9f35SJunchao Zhang 4569d67d9f35SJunchao Zhang Not Collective 4570d67d9f35SJunchao Zhang 4571d67d9f35SJunchao Zhang Input Parameter: 4572d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4573d67d9f35SJunchao Zhang 4574d67d9f35SJunchao Zhang Output Parameter: 4575d67d9f35SJunchao Zhang . array - pointer to the data 4576d67d9f35SJunchao Zhang 4577d67d9f35SJunchao Zhang Level: intermediate 4578d67d9f35SJunchao Zhang 4579db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4580d67d9f35SJunchao Zhang @*/ 4581d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A,PetscScalar **array) 4582d67d9f35SJunchao Zhang { 4583d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4584d67d9f35SJunchao Zhang 4585d67d9f35SJunchao Zhang PetscFunctionBegin; 4586d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45879566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A,array)); 4588d67d9f35SJunchao Zhang } else { 4589d67d9f35SJunchao Zhang *array = NULL; 4590d67d9f35SJunchao Zhang } 45918f1ea47aSStefano Zampini PetscFunctionReturn(0); 45928f1ea47aSStefano Zampini } 45938f1ea47aSStefano Zampini 45948f1ea47aSStefano Zampini /*@C 45957ee59b9bSJunchao Zhang MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the SEQAIJ matrix 45967ee59b9bSJunchao Zhang 45977ee59b9bSJunchao Zhang Not Collective 45987ee59b9bSJunchao Zhang 45997ee59b9bSJunchao Zhang Input Parameter: 46007ee59b9bSJunchao Zhang . mat - a matrix of type MATSEQAIJ or its subclasses 46017ee59b9bSJunchao Zhang 46027ee59b9bSJunchao Zhang Output Parameters: 46037ee59b9bSJunchao Zhang + i - row map array of the matrix 46047ee59b9bSJunchao Zhang . j - column index array of the matrix 46057ee59b9bSJunchao Zhang . a - data array of the matrix 46067ee59b9bSJunchao Zhang - memtype - memory type of the arrays 46077ee59b9bSJunchao Zhang 46087ee59b9bSJunchao Zhang Notes: 46097ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 46107ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 46117ee59b9bSJunchao Zhang 46127ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 46137ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 46147ee59b9bSJunchao Zhang 46157ee59b9bSJunchao Zhang Level: Developer 46167ee59b9bSJunchao Zhang 4617db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 46187ee59b9bSJunchao Zhang @*/ 46197ee59b9bSJunchao Zhang PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat,const PetscInt **i,const PetscInt **j,PetscScalar **a,PetscMemType *mtype) 46207ee59b9bSJunchao Zhang { 46217ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 46227ee59b9bSJunchao Zhang 46237ee59b9bSJunchao Zhang PetscFunctionBegin; 46247ee59b9bSJunchao Zhang PetscCheck(mat->preallocated,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"matrix is not preallocated"); 46257ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46267ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat,i,j,a,mtype)); 46277ee59b9bSJunchao Zhang } else { 46287ee59b9bSJunchao Zhang if (i) *i = aij->i; 46297ee59b9bSJunchao Zhang if (j) *j = aij->j; 46307ee59b9bSJunchao Zhang if (a) *a = aij->a; 46317ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46327ee59b9bSJunchao Zhang } 46337ee59b9bSJunchao Zhang PetscFunctionReturn(0); 46347ee59b9bSJunchao Zhang } 46357ee59b9bSJunchao Zhang 46367ee59b9bSJunchao Zhang /*@C 463721e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 463821e72a00SBarry Smith 463921e72a00SBarry Smith Not Collective 464021e72a00SBarry Smith 464121e72a00SBarry Smith Input Parameter: 4642579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 464321e72a00SBarry Smith 464421e72a00SBarry Smith Output Parameter: 464521e72a00SBarry Smith . nz - the maximum number of nonzeros in any row 464621e72a00SBarry Smith 464721e72a00SBarry Smith Level: intermediate 464821e72a00SBarry Smith 4649db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 465021e72a00SBarry Smith @*/ 465121e72a00SBarry Smith PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz) 465221e72a00SBarry Smith { 465321e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 465421e72a00SBarry Smith 465521e72a00SBarry Smith PetscFunctionBegin; 465621e72a00SBarry Smith *nz = aij->rmax; 465721e72a00SBarry Smith PetscFunctionReturn(0); 465821e72a00SBarry Smith } 465921e72a00SBarry Smith 4660394ed5ebSJunchao Zhang PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, const PetscInt coo_i[], const PetscInt coo_j[]) 4661394ed5ebSJunchao Zhang { 4662394ed5ebSJunchao Zhang MPI_Comm comm; 4663394ed5ebSJunchao Zhang PetscInt *i,*j; 4664394ed5ebSJunchao Zhang PetscInt M,N,row; 4665394ed5ebSJunchao Zhang PetscCount k,p,q,nneg,nnz,start,end; /* Index the coo array, so use PetscCount as their type */ 4666394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4667394ed5ebSJunchao Zhang PetscInt *Aj; 4668394ed5ebSJunchao Zhang PetscScalar *Aa; 4669cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ*)(mat->data); 4670cbc6b225SStefano Zampini MatType rtype; 4671394ed5ebSJunchao Zhang PetscCount *perm,*jmap; 4672394ed5ebSJunchao Zhang 4673394ed5ebSJunchao Zhang PetscFunctionBegin; 46749566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46759566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat,&comm)); 46769566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&M,&N)); 46779566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(coo_n,&i,coo_n,&j)); 46789566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(i,coo_i,coo_n)); /* Make a copy since we'll modify it */ 46799566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(j,coo_j,coo_n)); 46809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n,&perm)); 4681394ed5ebSJunchao Zhang for (k=0; k<coo_n; k++) { /* Ignore entries with negative row or col indices */ 4682394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4683394ed5ebSJunchao Zhang perm[k] = k; 4684394ed5ebSJunchao Zhang } 4685394ed5ebSJunchao Zhang 4686394ed5ebSJunchao Zhang /* Sort by row */ 46879566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n,i,j,perm)); 4688394ed5ebSJunchao Zhang for (k=0; k<coo_n; k++) {if (i[k] >= 0) break;} /* Advance k to the first row with a non-negative index */ 4689394ed5ebSJunchao Zhang nneg = k; 46909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg+1,&jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4691394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4692394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4693394ed5ebSJunchao Zhang 46949566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M+1,&Ai)); /* CSR of A */ 46959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg,&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4696394ed5ebSJunchao Zhang 4697394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4698394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4699394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4700394ed5ebSJunchao Zhang while (k<coo_n) { 4701394ed5ebSJunchao Zhang row = i[k]; 4702394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4703394ed5ebSJunchao Zhang while (k<coo_n && i[k] == row) k++; 4704394ed5ebSJunchao Zhang end = k; 47059566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end-start,j+start,perm+start)); 4706394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4707394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4708394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4709394ed5ebSJunchao Zhang Ai[row] = 1; 4710394ed5ebSJunchao Zhang nnz++; 4711394ed5ebSJunchao Zhang 4712394ed5ebSJunchao Zhang for (p=start+1; p<end; p++) { /* Scan remaining nonzero in this row */ 4713394ed5ebSJunchao Zhang if (j[p] != j[p-1]) { /* Meet a new nonzero */ 4714394ed5ebSJunchao Zhang q++; 4715394ed5ebSJunchao Zhang jmap[q] = 1; 4716394ed5ebSJunchao Zhang Aj[q] = j[p]; 4717394ed5ebSJunchao Zhang Ai[row]++; 4718394ed5ebSJunchao Zhang nnz++; 4719394ed5ebSJunchao Zhang } else { 4720394ed5ebSJunchao Zhang jmap[q]++; 4721394ed5ebSJunchao Zhang } 4722394ed5ebSJunchao Zhang } 4723394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4724394ed5ebSJunchao Zhang } 47259566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4726394ed5ebSJunchao Zhang 4727394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4728394ed5ebSJunchao Zhang for (k=0; k<M; k++) Ai[k+1] += Ai[k]; 4729394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4730394ed5ebSJunchao Zhang jmap[0] = 0; 4731394ed5ebSJunchao Zhang for (k=0; k<nnz; k++) jmap[k+1] += jmap[k]; 4732394ed5ebSJunchao Zhang if (nnz < coo_n-nneg) { /* Realloc with actual number of unique nonzeros */ 4733394ed5ebSJunchao Zhang PetscCount *jmap_new; 4734394ed5ebSJunchao Zhang PetscInt *Aj_new; 4735394ed5ebSJunchao Zhang 47369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz+1,&jmap_new)); 47379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new,jmap,nnz+1)); 47389566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4739394ed5ebSJunchao Zhang jmap = jmap_new; 4740394ed5ebSJunchao Zhang 47419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz,&Aj_new)); 47429566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new,Aj,nnz)); 47439566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4744394ed5ebSJunchao Zhang Aj = Aj_new; 4745394ed5ebSJunchao Zhang } 4746394ed5ebSJunchao Zhang 4747394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4748394ed5ebSJunchao Zhang PetscCount *perm_new; 4749cbc6b225SStefano Zampini 47509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg,&perm_new)); 47519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new,perm+nneg,coo_n-nneg)); 47529566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4753394ed5ebSJunchao Zhang perm = perm_new; 4754394ed5ebSJunchao Zhang } 4755394ed5ebSJunchao Zhang 47569566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat,&rtype)); 47579566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz,&Aa)); /* Zero the matrix */ 47589566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF,M,N,Ai,Aj,Aa,rtype,mat)); 4759394ed5ebSJunchao Zhang 4760394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4761394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4762394ed5ebSJunchao Zhang /* Record COO fields */ 4763394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4764394ed5ebSJunchao Zhang seqaij->Atot = coo_n-nneg; /* Annz is seqaij->nz, so no need to record that again */ 4765394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4766394ed5ebSJunchao Zhang seqaij->perm = perm; 4767394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4768394ed5ebSJunchao Zhang } 4769394ed5ebSJunchao Zhang 4770394ed5ebSJunchao Zhang static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A,const PetscScalar v[],InsertMode imode) 4771394ed5ebSJunchao Zhang { 4772394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ*)A->data; 4773394ed5ebSJunchao Zhang PetscCount i,j,Annz = aseq->nz; 4774394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm,*jmap = aseq->jmap; 4775394ed5ebSJunchao Zhang PetscScalar *Aa; 4776394ed5ebSJunchao Zhang 4777394ed5ebSJunchao Zhang PetscFunctionBegin; 47789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&Aa)); 4779394ed5ebSJunchao Zhang for (i=0; i<Annz; i++) { 4780b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4781b6c38306SJunchao Zhang for (j=jmap[i]; j<jmap[i+1]; j++) sum += v[perm[j]]; 4782b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES? 0.0 : Aa[i]) + sum; 4783394ed5ebSJunchao Zhang } 47849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&Aa)); 4785394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4786394ed5ebSJunchao Zhang } 4787394ed5ebSJunchao Zhang 478834b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47895063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat,MatType,MatReuse,Mat*); 479002fe1965SBarry Smith #endif 47913d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47925063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat,MatType,MatReuse,Mat*); 47933d0639e7SStefano Zampini #endif 479402fe1965SBarry Smith 47958cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4796273d9f13SBarry Smith { 4797273d9f13SBarry Smith Mat_SeqAIJ *b; 479838baddfdSBarry Smith PetscMPIInt size; 4799273d9f13SBarry Smith 4800273d9f13SBarry Smith PetscFunctionBegin; 48019566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B),&size)); 480208401ef6SPierre Jolivet PetscCheck(size <= 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4803273d9f13SBarry Smith 48049566063dSJacob Faibussowitsch PetscCall(PetscNewLog(B,&b)); 48052205254eSKarl Rupp 4806b0a32e0cSBarry Smith B->data = (void*)b; 48072205254eSKarl Rupp 48089566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps))); 4809071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48102205254eSKarl Rupp 4811f4259b30SLisandro Dalcin b->row = NULL; 4812f4259b30SLisandro Dalcin b->col = NULL; 4813f4259b30SLisandro Dalcin b->icol = NULL; 4814b810aeb4SBarry Smith b->reallocs = 0; 481536db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4816f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4817416022c9SBarry Smith b->nonew = 0; 4818f4259b30SLisandro Dalcin b->diag = NULL; 4819f4259b30SLisandro Dalcin b->solve_work = NULL; 4820f4259b30SLisandro Dalcin B->spptr = NULL; 4821f4259b30SLisandro Dalcin b->saved_values = NULL; 4822f4259b30SLisandro Dalcin b->idiag = NULL; 4823f4259b30SLisandro Dalcin b->mdiag = NULL; 4824f4259b30SLisandro Dalcin b->ssor_work = NULL; 482571f1c65dSBarry Smith b->omega = 1.0; 482671f1c65dSBarry Smith b->fshift = 0.0; 482771f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4828bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4829a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 483017ab2063SBarry Smith 48319566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 4832b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 48339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ)); 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ)); 4835b3866ffcSBarry Smith #endif 48369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ)); 48379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ)); 48389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ)); 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ)); 48409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ)); 48419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM)); 48429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL)); 48439779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL)); 4845191b95cbSRichard Tran Mills #endif 484634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",MatProductSetFromOptions_SeqAIJ)); 485002fe1965SBarry Smith #endif 48513d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijkokkos_C",MatConvert_SeqAIJ_SeqAIJKokkos)); 48533d0639e7SStefano Zampini #endif 48549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL)); 4855af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental)); 4857af8000cdSHong Zhang #endif 4858d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_scalapack_C",MatConvert_AIJ_ScaLAPACK)); 4860d24d4204SJose E. Roman #endif 486163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE)); 48639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ)); 486463c07aadSStefano Zampini #endif 48659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense)); 48669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL)); 48679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS)); 48689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ)); 48699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ)); 48709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ)); 48719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ)); 48729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ)); 48749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ)); 48759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ)); 48769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJKron_C",MatSeqAIJKron_SeqAIJ)); 48789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_SeqAIJ)); 48799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_SeqAIJ)); 48809566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48819566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 48829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48833a40ed3dSBarry Smith PetscFunctionReturn(0); 488417ab2063SBarry Smith } 488517ab2063SBarry Smith 4886b24902e0SBarry Smith /* 4887b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4888b24902e0SBarry Smith */ 4889ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 489017ab2063SBarry Smith { 48912a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data,*a = (Mat_SeqAIJ*)A->data; 4892071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 489317ab2063SBarry Smith 48943a40ed3dSBarry Smith PetscFunctionBegin; 4895aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot duplicate unassembled matrix"); 4896273d9f13SBarry Smith 4897d5f3da31SBarry Smith C->factortype = A->factortype; 4898f4259b30SLisandro Dalcin c->row = NULL; 4899f4259b30SLisandro Dalcin c->col = NULL; 4900f4259b30SLisandro Dalcin c->icol = NULL; 49016ad4291fSHong Zhang c->reallocs = 0; 490217ab2063SBarry Smith 490369272f91SPierre Jolivet C->assembled = A->assembled; 490469272f91SPierre Jolivet C->preallocated = A->preallocated; 490517ab2063SBarry Smith 490669272f91SPierre Jolivet if (A->preallocated) { 49079566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap,&C->rmap)); 49089566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap,&C->cmap)); 4909eec197d1SBarry Smith 49109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->imax)); 49119566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt))); 49129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->ilen)); 49139566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt))); 49149566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt))); 491517ab2063SBarry Smith 491617ab2063SBarry Smith /* allocate the matrix space */ 4917f77e22a1SHong Zhang if (mallocmatspace) { 49189566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i)); 49199566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt))); 49202205254eSKarl Rupp 4921f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 49222205254eSKarl Rupp 49239566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i,a->i,m+1)); 492417ab2063SBarry Smith if (m > 0) { 49259566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j,a->j,a->i[m])); 4926be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49272e5835c6SStefano Zampini const PetscScalar *aa; 49282e5835c6SStefano Zampini 49299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 49309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a,aa,a->i[m])); 49319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 4932be6bf707SBarry Smith } else { 49339566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a,a->i[m])); 493417ab2063SBarry Smith } 493508480c60SBarry Smith } 4936f77e22a1SHong Zhang } 493717ab2063SBarry Smith 49386ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4939416022c9SBarry Smith c->roworiented = a->roworiented; 4940416022c9SBarry Smith c->nonew = a->nonew; 4941416022c9SBarry Smith if (a->diag) { 49429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&c->diag)); 49439566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt))); 49449566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt))); 4945071fcb05SBarry Smith } else c->diag = NULL; 49462205254eSKarl Rupp 4947f4259b30SLisandro Dalcin c->solve_work = NULL; 4948f4259b30SLisandro Dalcin c->saved_values = NULL; 4949f4259b30SLisandro Dalcin c->idiag = NULL; 4950f4259b30SLisandro Dalcin c->ssor_work = NULL; 4951a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4952e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4953e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49546ad4291fSHong Zhang 4955893ad86cSHong Zhang c->rmax = a->rmax; 4956416022c9SBarry Smith c->nz = a->nz; 49578ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4958754ec7b1SSatish Balay 49596ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49606ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4961cd6b891eSBarry Smith if (a->compressedrow.use) { 49626ad4291fSHong Zhang i = a->compressedrow.nrows; 49639566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex)); 49649566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1)); 49659566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i)); 496627ea64f8SHong Zhang } else { 496727ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49680298fd71SBarry Smith c->compressedrow.i = NULL; 49690298fd71SBarry Smith c->compressedrow.rindex = NULL; 49706ad4291fSHong Zhang } 4971ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4972e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49734846f1f5SKris Buschelman 49749566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C)); 497569272f91SPierre Jolivet } 49769566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist)); 49773a40ed3dSBarry Smith PetscFunctionReturn(0); 497817ab2063SBarry Smith } 497917ab2063SBarry Smith 4980b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4981b24902e0SBarry Smith { 4982b24902e0SBarry Smith PetscFunctionBegin; 49839566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 49849566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n)); 4985cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 49869566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 4987cfd3f464SBarry Smith } 49889566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 49899566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE)); 4990b24902e0SBarry Smith PetscFunctionReturn(0); 4991b24902e0SBarry Smith } 4992b24902e0SBarry Smith 4993112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4994fbdbba38SShri Abhyankar { 499552f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 499652f91c60SVaclav Hapla 499752f91c60SVaclav Hapla PetscFunctionBegin; 499852f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 499952f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 5000c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50019566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 50039566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5)); 500452f91c60SVaclav Hapla if (isbinary) { 50059566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat,viewer)); 500652f91c60SVaclav Hapla } else if (ishdf5) { 500752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50089566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat,viewer)); 500952f91c60SVaclav Hapla #else 501052f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 501152f91c60SVaclav Hapla #endif 501252f91c60SVaclav Hapla } else { 501398921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 501452f91c60SVaclav Hapla } 501552f91c60SVaclav Hapla PetscFunctionReturn(0); 501652f91c60SVaclav Hapla } 501752f91c60SVaclav Hapla 50183ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 501952f91c60SVaclav Hapla { 50203ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 50213ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 5022fbdbba38SShri Abhyankar 5023fbdbba38SShri Abhyankar PetscFunctionBegin; 50249566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5025bbead8a2SBarry Smith 50263ea6fe3dSLisandro Dalcin /* read in matrix header */ 50279566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT)); 502808401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 5029fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 503008401ef6SPierre Jolivet PetscCheck(M >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%" PetscInt_FMT ") in file is negative",M); 503108401ef6SPierre Jolivet PetscCheck(N >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%" PetscInt_FMT ") in file is negative",N); 503208401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 5033fbdbba38SShri Abhyankar 50343ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50359566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat,viewer)); 50363ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50373ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50383ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50393ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50403ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50419566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50429566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50433ea6fe3dSLisandro Dalcin 50443ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50459566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 5046aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50473ea6fe3dSLisandro Dalcin 5048fbdbba38SShri Abhyankar /* read in row lengths */ 50499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M,&rowlens)); 50509566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT)); 50513ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50523ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 505308401ef6SPierre Jolivet PetscCheck(sum == nz,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT,nz,sum); 50543ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens)); 50569566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 5057aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50583ea6fe3dSLisandro Dalcin /* store row lengths */ 50599566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen,rowlens,M)); 50609566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5061fbdbba38SShri Abhyankar 50623ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50633ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 50643ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT)); 50663ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50679566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR)); 5068fbdbba38SShri Abhyankar 50699566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY)); 50709566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); 5071fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5072fbdbba38SShri Abhyankar } 5073fbdbba38SShri Abhyankar 5074ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 50757264ac53SSatish Balay { 50767264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 5077fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 5078eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5079eeffb40dSHong Zhang PetscInt k; 5080eeffb40dSHong Zhang #endif 50817264ac53SSatish Balay 50823a40ed3dSBarry Smith PetscFunctionBegin; 5083bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5084d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 5085ca44d042SBarry Smith *flg = PETSC_FALSE; 5086ca44d042SBarry Smith PetscFunctionReturn(0); 5087bcd2baecSBarry Smith } 50887264ac53SSatish Balay 50897264ac53SSatish Balay /* if the a->i are the same */ 50909566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i,b->i,A->rmap->n+1,flg)); 5091abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50927264ac53SSatish Balay 50937264ac53SSatish Balay /* if a->j are the same */ 50949566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j,b->j,a->nz,flg)); 5095abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5096bcd2baecSBarry Smith 50979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 50989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 5099bcd2baecSBarry Smith /* if a->a are the same */ 5100eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5101eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 5102fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5103eeffb40dSHong Zhang *flg = PETSC_FALSE; 51043a40ed3dSBarry Smith PetscFunctionReturn(0); 5105eeffb40dSHong Zhang } 5106eeffb40dSHong Zhang } 5107eeffb40dSHong Zhang #else 51089566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa,ba,a->nz,flg)); 5109eeffb40dSHong Zhang #endif 51109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 51119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 5112eeffb40dSHong Zhang PetscFunctionReturn(0); 51137264ac53SSatish Balay } 511436db0b34SBarry Smith 511505869f15SSatish Balay /*@ 511636db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 511736db0b34SBarry Smith provided by the user. 511836db0b34SBarry Smith 5119d083f849SBarry Smith Collective 512036db0b34SBarry Smith 512136db0b34SBarry Smith Input Parameters: 512236db0b34SBarry Smith + comm - must be an MPI communicator of size 1 512336db0b34SBarry Smith . m - number of rows 512436db0b34SBarry Smith . n - number of columns 5125483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 512636db0b34SBarry Smith . j - column indices 512736db0b34SBarry Smith - a - matrix values 512836db0b34SBarry Smith 512936db0b34SBarry Smith Output Parameter: 513036db0b34SBarry Smith . mat - the matrix 513136db0b34SBarry Smith 513236db0b34SBarry Smith Level: intermediate 513336db0b34SBarry Smith 513436db0b34SBarry Smith Notes: 51350551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5136292fb18eSBarry Smith once the matrix is destroyed and not before 513736db0b34SBarry Smith 513836db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 513936db0b34SBarry Smith 5140bfeeae90SHong Zhang The i and j indices are 0 based 514136db0b34SBarry Smith 5142a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5143a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51448eef79e4SBarry Smith as shown 5145a4552177SSatish Balay 51468eef79e4SBarry Smith $ 1 0 0 51478eef79e4SBarry Smith $ 2 0 3 51488eef79e4SBarry Smith $ 4 5 6 51498eef79e4SBarry Smith $ 51508eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51518eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51528eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5153a4552177SSatish Balay 5154db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 515536db0b34SBarry Smith 515636db0b34SBarry Smith @*/ 5157c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 515836db0b34SBarry Smith { 5159cbcfb4deSHong Zhang PetscInt ii; 516036db0b34SBarry Smith Mat_SeqAIJ *aij; 5161cbcfb4deSHong Zhang PetscInt jj; 516236db0b34SBarry Smith 516336db0b34SBarry Smith PetscFunctionBegin; 5164aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 51659566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 51669566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 51679566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51689566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 51699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,NULL)); 5170ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 51719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->imax)); 51729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->ilen)); 5173ab93d7beSBarry Smith 517436db0b34SBarry Smith aij->i = i; 517536db0b34SBarry Smith aij->j = j; 517636db0b34SBarry Smith aij->a = a; 517736db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 517836db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5179e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5180e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 518136db0b34SBarry Smith 5182cbc6b225SStefano Zampini for (ii=0,aij->nonzerorowcnt=0,aij->rmax=0; ii<m; ii++) { 518336db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 518476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5185aed4548fSBarry Smith PetscCheck(i[ii+1] - i[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT,ii,i[ii+1] - i[ii]); 51869985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 518708401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted",jj-i[ii],j[jj],ii); 518808401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry",jj-i[ii],j[jj],ii); 51899985e31cSBarry Smith } 519036db0b34SBarry Smith } 519176bd3646SJed Brown } 519276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 519336db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 519408401ef6SPierre Jolivet PetscCheck(j[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 5195aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 519636db0b34SBarry Smith } 519776bd3646SJed Brown } 519836db0b34SBarry Smith 51999566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 52009566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 520136db0b34SBarry Smith PetscFunctionReturn(0); 520236db0b34SBarry Smith } 5203cbc6b225SStefano Zampini 5204f62e3866SBarry Smith /*@ 5205d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 52068a0b0e6bSVictor Minden provided by the user. 52078a0b0e6bSVictor Minden 5208d083f849SBarry Smith Collective 52098a0b0e6bSVictor Minden 52108a0b0e6bSVictor Minden Input Parameters: 52118a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52128a0b0e6bSVictor Minden . m - number of rows 52138a0b0e6bSVictor Minden . n - number of columns 52148a0b0e6bSVictor Minden . i - row indices 52158a0b0e6bSVictor Minden . j - column indices 52161230e6d1SVictor Minden . a - matrix values 52171230e6d1SVictor Minden . nz - number of nonzeros 5218f62e3866SBarry Smith - idx - if the i and j indices start with 1 use PETSC_TRUE otherwise use PETSC_FALSE 52198a0b0e6bSVictor Minden 52208a0b0e6bSVictor Minden Output Parameter: 52218a0b0e6bSVictor Minden . mat - the matrix 52228a0b0e6bSVictor Minden 52238a0b0e6bSVictor Minden Level: intermediate 52248a0b0e6bSVictor Minden 5225f62e3866SBarry Smith Example: 5226f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52279e99939fSJunchao Zhang .vb 52288a0b0e6bSVictor Minden 1 0 0 52298a0b0e6bSVictor Minden 2 0 3 52308a0b0e6bSVictor Minden 4 5 6 52318a0b0e6bSVictor Minden 52328a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52338a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52348a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52359e99939fSJunchao Zhang .ve 52368a0b0e6bSVictor Minden 5237db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()` 52388a0b0e6bSVictor Minden 52398a0b0e6bSVictor Minden @*/ 5240c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 52418a0b0e6bSVictor Minden { 5242d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 52438a0b0e6bSVictor Minden 52448a0b0e6bSVictor Minden PetscFunctionBegin; 52459566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m,&nnz)); 52461230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 5247c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 52481230e6d1SVictor Minden } 52499566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 52509566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 52519566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 52529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz)); 52531230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52541230e6d1SVictor Minden if (idx) { 52551230e6d1SVictor Minden row = i[ii] - 1; 52561230e6d1SVictor Minden col = j[ii] - 1; 52571230e6d1SVictor Minden } else { 52581230e6d1SVictor Minden row = i[ii]; 52591230e6d1SVictor Minden col = j[ii]; 52608a0b0e6bSVictor Minden } 52619566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES)); 52628a0b0e6bSVictor Minden } 52639566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 52649566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 52659566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52668a0b0e6bSVictor Minden PetscFunctionReturn(0); 52678a0b0e6bSVictor Minden } 526836db0b34SBarry Smith 5269acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5270acf2f550SJed Brown { 5271acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 5272acf2f550SJed Brown 5273acf2f550SJed Brown PetscFunctionBegin; 5274acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5275acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52762205254eSKarl Rupp 52779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5278acf2f550SJed Brown PetscFunctionReturn(0); 5279acf2f550SJed Brown } 5280acf2f550SJed Brown 52819c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 52829c8f2541SHong Zhang { 52838761c3d6SHong Zhang PetscMPIInt size; 52849c8f2541SHong Zhang 52859c8f2541SHong Zhang PetscFunctionBegin; 52869566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm,&size)); 52877bbdc51dSHong Zhang if (size == 1) { 52887bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 52899566063dSJacob Faibussowitsch PetscCall(MatDuplicate(inmat,MAT_COPY_VALUES,outmat)); 52907bbdc51dSHong Zhang } else { 52919566063dSJacob Faibussowitsch PetscCall(MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN)); 52927bbdc51dSHong Zhang } 52938761c3d6SHong Zhang } else { 52949566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat)); 52958761c3d6SHong Zhang } 52969c8f2541SHong Zhang PetscFunctionReturn(0); 52979c8f2541SHong Zhang } 52989c8f2541SHong Zhang 529981824310SBarry Smith /* 530053dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 530153dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 530253dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 530353dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 530453dd7562SDmitry Karpeev */ 530553dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 530653dd7562SDmitry Karpeev { 530753dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 530853dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 530953dd7562SDmitry Karpeev PetscBool seqaij; 531053dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 531153dd7562SDmitry Karpeev PetscScalar v; 531253dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 531353dd7562SDmitry Karpeev 531453dd7562SDmitry Karpeev PetscFunctionBegin; 531553dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 531653dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 53179566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij)); 531828b400f6SJacob Faibussowitsch PetscCheck(seqaij,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 531953dd7562SDmitry Karpeev if (rowemb) { 53209566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb,&m)); 532108401ef6SPierre Jolivet PetscCheck(m == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT,m,B->rmap->n); 532253dd7562SDmitry Karpeev } else { 532308401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 532453dd7562SDmitry Karpeev } 532553dd7562SDmitry Karpeev if (colemb) { 53269566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb,&n)); 532708401ef6SPierre Jolivet PetscCheck(n == B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT,n,B->cmap->n); 532853dd7562SDmitry Karpeev } else { 532908401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 533053dd7562SDmitry Karpeev } 533153dd7562SDmitry Karpeev 533253dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 533353dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&nz)); 533553dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 533653dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 533753dd7562SDmitry Karpeev } 53389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C,0,nz)); 53399566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 534053dd7562SDmitry Karpeev } 534153dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 53429566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(C)); 534353dd7562SDmitry Karpeev } 534453dd7562SDmitry Karpeev count = 0; 534553dd7562SDmitry Karpeev rowindices = NULL; 534653dd7562SDmitry Karpeev colindices = NULL; 534753dd7562SDmitry Karpeev if (rowemb) { 53489566063dSJacob Faibussowitsch PetscCall(ISGetIndices(rowemb,&rowindices)); 534953dd7562SDmitry Karpeev } 535053dd7562SDmitry Karpeev if (colemb) { 53519566063dSJacob Faibussowitsch PetscCall(ISGetIndices(colemb,&colindices)); 535253dd7562SDmitry Karpeev } 535353dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 535453dd7562SDmitry Karpeev PetscInt row; 535553dd7562SDmitry Karpeev row = i; 535653dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 535753dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 535853dd7562SDmitry Karpeev PetscInt col; 535953dd7562SDmitry Karpeev col = Baij->j[count]; 536053dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 536153dd7562SDmitry Karpeev v = Baij->a[count]; 53629566063dSJacob Faibussowitsch PetscCall(MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES)); 536353dd7562SDmitry Karpeev ++count; 536453dd7562SDmitry Karpeev } 536553dd7562SDmitry Karpeev } 536653dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 536753dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 536853dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 536953dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 537053dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 537153dd7562SDmitry Karpeev PetscFunctionReturn(0); 537253dd7562SDmitry Karpeev } 537353dd7562SDmitry Karpeev 53744099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53754099cc6bSBarry Smith 53764099cc6bSBarry Smith /*@C 53774099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 53784099cc6bSBarry Smith 53794099cc6bSBarry Smith Collective on Mat 53804099cc6bSBarry Smith 53814099cc6bSBarry Smith Input Parameters: 53824099cc6bSBarry Smith + mat - the matrix object 53834099cc6bSBarry Smith - matype - matrix type 53844099cc6bSBarry Smith 53854099cc6bSBarry Smith Options Database Key: 53864099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 53874099cc6bSBarry Smith 53884099cc6bSBarry Smith Level: intermediate 53894099cc6bSBarry Smith 5390db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53914099cc6bSBarry Smith @*/ 53924099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 53934099cc6bSBarry Smith { 53944099cc6bSBarry Smith PetscBool sametype; 53955f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat,MatType,MatReuse,Mat*); 53964099cc6bSBarry Smith 53974099cc6bSBarry Smith PetscFunctionBegin; 53984099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 53999566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat,matype,&sametype)); 54004099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 54014099cc6bSBarry Smith 54029566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList,matype,&r)); 54035f80ce2aSJacob Faibussowitsch PetscCheck(r,PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 54049566063dSJacob Faibussowitsch PetscCall((*r)(mat,matype,MAT_INPLACE_MATRIX,&mat)); 54054099cc6bSBarry Smith PetscFunctionReturn(0); 54064099cc6bSBarry Smith } 54074099cc6bSBarry Smith 54084099cc6bSBarry Smith /*@C 54094099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 54104099cc6bSBarry Smith 54114099cc6bSBarry Smith Not Collective 54124099cc6bSBarry Smith 54134099cc6bSBarry Smith Input Parameters: 54144099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 54154099cc6bSBarry Smith - function - routine to convert to subtype 54164099cc6bSBarry Smith 54174099cc6bSBarry Smith Notes: 54184099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 54194099cc6bSBarry Smith 54204099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54214099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54224099cc6bSBarry Smith 54234099cc6bSBarry Smith Level: advanced 54244099cc6bSBarry Smith 5425db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 54264099cc6bSBarry Smith 54274099cc6bSBarry Smith Level: advanced 54284099cc6bSBarry Smith @*/ 5429388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 54304099cc6bSBarry Smith { 54314099cc6bSBarry Smith PetscFunctionBegin; 54329566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54339566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList,sname,function)); 54344099cc6bSBarry Smith PetscFunctionReturn(0); 54354099cc6bSBarry Smith } 54364099cc6bSBarry Smith 54374099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54384099cc6bSBarry Smith 54394099cc6bSBarry Smith /*@C 54404099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 54414099cc6bSBarry Smith 54424099cc6bSBarry Smith Not Collective 54434099cc6bSBarry Smith 54444099cc6bSBarry Smith Level: advanced 54454099cc6bSBarry Smith 5446db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 54474099cc6bSBarry Smith @*/ 54484099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 54494099cc6bSBarry Smith { 54504099cc6bSBarry Smith PetscFunctionBegin; 54514099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 54524099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54534099cc6bSBarry Smith 54549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54579779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5459485f9817SRichard Tran Mills #endif 54605063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54625063d097SStefano Zampini #endif 54635063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54655063d097SStefano Zampini #endif 54664099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54684099cc6bSBarry Smith #endif 54694099cc6bSBarry Smith PetscFunctionReturn(0); 54704099cc6bSBarry Smith } 547153dd7562SDmitry Karpeev 547253dd7562SDmitry Karpeev /* 547381824310SBarry Smith Special version for direct calls from Fortran 547481824310SBarry Smith */ 5475af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 547681824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 547781824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 547881824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 547981824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 548081824310SBarry Smith #endif 548181824310SBarry Smith 548281824310SBarry Smith /* Change these macros so can be used in void function */ 548398921bdaSJacob Faibussowitsch 548498921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54859566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54869566063dSJacob Faibussowitsch #undef PetscCall 54879566063dSJacob Faibussowitsch #define PetscCall(...) do { \ 54885f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 548998921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 549098921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr_msv_mpiaij,PETSC_ERROR_REPEAT," "); \ 549198921bdaSJacob Faibussowitsch return; \ 549298921bdaSJacob Faibussowitsch } \ 549398921bdaSJacob Faibussowitsch } while (0) 549498921bdaSJacob Faibussowitsch 549598921bdaSJacob Faibussowitsch #undef SETERRQ 549698921bdaSJacob Faibussowitsch #define SETERRQ(comm,ierr,...) do { \ 549798921bdaSJacob Faibussowitsch *_ierr = PetscError(comm,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr,PETSC_ERROR_INITIAL,__VA_ARGS__); \ 549898921bdaSJacob Faibussowitsch return; \ 549998921bdaSJacob Faibussowitsch } while (0) 550081824310SBarry Smith 550119caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 550281824310SBarry Smith { 550381824310SBarry Smith Mat A = *AA; 550481824310SBarry Smith PetscInt m = *mm, n = *nn; 550581824310SBarry Smith InsertMode is = *isis; 550681824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 550781824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 550881824310SBarry Smith PetscInt *imax,*ai,*ailen; 550981824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 551054f21887SBarry Smith MatScalar *ap,value,*aa; 5511ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5512ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 551381824310SBarry Smith 551481824310SBarry Smith PetscFunctionBegin; 55154994cf47SJed Brown MatCheckPreallocated(A,1); 551681824310SBarry Smith imax = a->imax; 551781824310SBarry Smith ai = a->i; 551881824310SBarry Smith ailen = a->ilen; 551981824310SBarry Smith aj = a->j; 552081824310SBarry Smith aa = a->a; 552181824310SBarry Smith 552281824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 552381824310SBarry Smith row = im[k]; 552481824310SBarry Smith if (row < 0) continue; 55255f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 552681824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 552781824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 552881824310SBarry Smith low = 0; 552981824310SBarry Smith high = nrow; 553081824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 553181824310SBarry Smith if (in[l] < 0) continue; 55325f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 553381824310SBarry Smith col = in[l]; 55342205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 55352205254eSKarl Rupp else value = v[k + l*m]; 55362205254eSKarl Rupp 553781824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 553881824310SBarry Smith 55392205254eSKarl Rupp if (col <= lastcol) low = 0; 55402205254eSKarl Rupp else high = nrow; 554181824310SBarry Smith lastcol = col; 554281824310SBarry Smith while (high-low > 5) { 554381824310SBarry Smith t = (low+high)/2; 554481824310SBarry Smith if (rp[t] > col) high = t; 554581824310SBarry Smith else low = t; 554681824310SBarry Smith } 554781824310SBarry Smith for (i=low; i<high; i++) { 554881824310SBarry Smith if (rp[i] > col) break; 554981824310SBarry Smith if (rp[i] == col) { 555081824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 555181824310SBarry Smith else ap[i] = value; 555281824310SBarry Smith goto noinsert; 555381824310SBarry Smith } 555481824310SBarry Smith } 555581824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 555681824310SBarry Smith if (nonew == 1) goto noinsert; 55575f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 5558fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 555981824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 556081824310SBarry Smith /* shift up all the later entries in this row */ 556181824310SBarry Smith for (ii=N; ii>=i; ii--) { 556281824310SBarry Smith rp[ii+1] = rp[ii]; 556381824310SBarry Smith ap[ii+1] = ap[ii]; 556481824310SBarry Smith } 556581824310SBarry Smith rp[i] = col; 556681824310SBarry Smith ap[i] = value; 5567e56f5c9eSBarry Smith A->nonzerostate++; 556881824310SBarry Smith noinsert:; 556981824310SBarry Smith low = i + 1; 557081824310SBarry Smith } 557181824310SBarry Smith ailen[row] = nrow; 557281824310SBarry Smith } 557381824310SBarry Smith PetscFunctionReturnVoid(); 557481824310SBarry Smith } 557598921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 557698921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 557798921bdaSJacob Faibussowitsch * original definitions */ 55789566063dSJacob Faibussowitsch #undef PetscCall 557998921bdaSJacob Faibussowitsch #undef SETERRQ 5580