1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 114099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 124099cc6bSBarry Smith { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A,type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24857cbf51SRichard Tran Mills PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A,PetscInt type,PetscReal *reductions) 250716a85fSBarry Smith { 260716a85fSBarry Smith PetscInt i,m,n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&m,&n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions,n)); 320716a85fSBarry Smith if (type == NORM_2) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 34a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else if (type == NORM_1) { 370716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 38a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 390716a85fSBarry Smith } 400716a85fSBarry Smith } else if (type == NORM_INFINITY) { 410716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 42a873a8cdSSam Reynolds reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),reductions[aij->j[i]]); 430716a85fSBarry Smith } 44857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 45a873a8cdSSam Reynolds for (i=0; i<aij->i[m]; i++) { 46857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 47a873a8cdSSam Reynolds } 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49857cbf51SRichard Tran Mills for (i=0; i<aij->i[m]; i++) { 50857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 51857cbf51SRichard Tran Mills } 52857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown reduction type"); 530716a85fSBarry Smith 540716a85fSBarry Smith if (type == NORM_2) { 55a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 56857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 57a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] /= m; 580716a85fSBarry Smith } 590716a85fSBarry Smith PetscFunctionReturn(0); 600716a85fSBarry Smith } 610716a85fSBarry Smith 623a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 633a062f41SBarry Smith { 643a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 653a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 663a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 673a062f41SBarry Smith PetscInt *rows; 683a062f41SBarry Smith 693a062f41SBarry Smith PetscFunctionBegin; 703a062f41SBarry Smith for (i=0; i<m; i++) { 713a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 723a062f41SBarry Smith cnt++; 733a062f41SBarry Smith } 743a062f41SBarry Smith } 759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 763a062f41SBarry Smith cnt = 0; 773a062f41SBarry Smith for (i=0; i<m; i++) { 783a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 793a062f41SBarry Smith rows[cnt] = i; 803a062f41SBarry Smith cnt++; 813a062f41SBarry Smith } 823a062f41SBarry Smith } 839566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is)); 843a062f41SBarry Smith PetscFunctionReturn(0); 853a062f41SBarry Smith } 863a062f41SBarry Smith 87f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 886ce1633cSBarry Smith { 896ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 90fff043a9SJunchao Zhang const MatScalar *aa; 916ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 92b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 936ce1633cSBarry Smith PetscInt *rows; 946ce1633cSBarry Smith 956ce1633cSBarry Smith PetscFunctionBegin; 969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 979566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 986ce1633cSBarry Smith diag = a->diag; 996ce1633cSBarry Smith for (i=0; i<m; i++) { 100b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1016ce1633cSBarry Smith cnt++; 1026ce1633cSBarry Smith } 1036ce1633cSBarry Smith } 1049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 1056ce1633cSBarry Smith cnt = 0; 1066ce1633cSBarry Smith for (i=0; i<m; i++) { 107b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1086ce1633cSBarry Smith rows[cnt++] = i; 1096ce1633cSBarry Smith } 1106ce1633cSBarry Smith } 111f1f41ecbSJed Brown *nrows = cnt; 112f1f41ecbSJed Brown *zrows = rows; 1139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 114f1f41ecbSJed Brown PetscFunctionReturn(0); 115f1f41ecbSJed Brown } 116f1f41ecbSJed Brown 117f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 118f1f41ecbSJed Brown { 119f1f41ecbSJed Brown PetscInt nrows,*rows; 120f1f41ecbSJed Brown 121f1f41ecbSJed Brown PetscFunctionBegin; 1220298fd71SBarry Smith *zrows = NULL; 1239566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows)); 1249566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows)); 1256ce1633cSBarry Smith PetscFunctionReturn(0); 1266ce1633cSBarry Smith } 1276ce1633cSBarry Smith 128b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 129b3a44c85SBarry Smith { 130b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 131b3a44c85SBarry Smith const MatScalar *aa; 132b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 133b3a44c85SBarry Smith const PetscInt *ii; 134b3a44c85SBarry Smith PetscInt n,i,j,*rows; 135b3a44c85SBarry Smith 136b3a44c85SBarry Smith PetscFunctionBegin; 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 138f4259b30SLisandro Dalcin *keptrows = NULL; 139b3a44c85SBarry Smith ii = a->i; 140b3a44c85SBarry Smith for (i=0; i<m; i++) { 141b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 142b3a44c85SBarry Smith if (!n) { 143b3a44c85SBarry Smith cnt++; 144b3a44c85SBarry Smith goto ok1; 145b3a44c85SBarry Smith } 1462e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 147b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 148b3a44c85SBarry Smith } 149b3a44c85SBarry Smith cnt++; 150b3a44c85SBarry Smith ok1:; 151b3a44c85SBarry Smith } 1522e5835c6SStefano Zampini if (!cnt) { 1539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1542e5835c6SStefano Zampini PetscFunctionReturn(0); 1552e5835c6SStefano Zampini } 1569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n-cnt,&rows)); 157b3a44c85SBarry Smith cnt = 0; 158b3a44c85SBarry Smith for (i=0; i<m; i++) { 159b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 160b3a44c85SBarry Smith if (!n) continue; 1612e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 162b3a44c85SBarry Smith if (aa[j] != 0.0) { 163b3a44c85SBarry Smith rows[cnt++] = i; 164b3a44c85SBarry Smith break; 165b3a44c85SBarry Smith } 166b3a44c85SBarry Smith } 167b3a44c85SBarry Smith } 1689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1699566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows)); 170b3a44c85SBarry Smith PetscFunctionReturn(0); 171b3a44c85SBarry Smith } 172b3a44c85SBarry Smith 1737087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 17479299369SBarry Smith { 17579299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17699e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17799e65526SBarry Smith const PetscInt *diag; 1782e5835c6SStefano Zampini MatScalar *aa; 17999e65526SBarry Smith const PetscScalar *v; 180ace3abfcSBarry Smith PetscBool missing; 18179299369SBarry Smith 18279299369SBarry Smith PetscFunctionBegin; 18309f38230SBarry Smith if (Y->assembled) { 1849566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y,&missing,NULL)); 18509f38230SBarry Smith if (!missing) { 18679299369SBarry Smith diag = aij->diag; 1879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D,&v)); 1889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&aa)); 18979299369SBarry Smith if (is == INSERT_VALUES) { 19079299369SBarry Smith for (i=0; i<m; i++) { 19179299369SBarry Smith aa[diag[i]] = v[i]; 19279299369SBarry Smith } 19379299369SBarry Smith } else { 19479299369SBarry Smith for (i=0; i<m; i++) { 19579299369SBarry Smith aa[diag[i]] += v[i]; 19679299369SBarry Smith } 19779299369SBarry Smith } 1989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&aa)); 1999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D,&v)); 20079299369SBarry Smith PetscFunctionReturn(0); 20179299369SBarry Smith } 2029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 20309f38230SBarry Smith } 2049566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y,D,is)); 20509f38230SBarry Smith PetscFunctionReturn(0); 20609f38230SBarry Smith } 20779299369SBarry Smith 2081a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 20917ab2063SBarry Smith { 210416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21197f1f81fSBarry Smith PetscInt i,ishift; 21217ab2063SBarry Smith 2133a40ed3dSBarry Smith PetscFunctionBegin; 214d0f46423SBarry Smith *m = A->rmap->n; 2153a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 216bfeeae90SHong Zhang ishift = 0; 21753e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2189566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja)); 219bfeeae90SHong Zhang } else if (oshift == 1) { 2201a83f524SJed Brown PetscInt *tia; 221d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2223b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&tia)); 2241a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2251a83f524SJed Brown *ia = tia; 226ecc77c7aSBarry Smith if (ja) { 2271a83f524SJed Brown PetscInt *tja; 2289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&tja)); 2291a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2301a83f524SJed Brown *ja = tja; 231ecc77c7aSBarry Smith } 2326945ee14SBarry Smith } else { 233ecc77c7aSBarry Smith *ia = a->i; 234ecc77c7aSBarry Smith if (ja) *ja = a->j; 235a2ce50c7SBarry Smith } 2363a40ed3dSBarry Smith PetscFunctionReturn(0); 237a2744918SBarry Smith } 238a2744918SBarry Smith 2391a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2406945ee14SBarry Smith { 2413a40ed3dSBarry Smith PetscFunctionBegin; 2423a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 243bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 2449566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2459566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 246bcd2baecSBarry Smith } 2473a40ed3dSBarry Smith PetscFunctionReturn(0); 24817ab2063SBarry Smith } 24917ab2063SBarry Smith 2501a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2513b2fbd54SBarry Smith { 2523b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 253d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25497f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2553b2fbd54SBarry Smith 2563a40ed3dSBarry Smith PetscFunctionBegin; 257899cda47SBarry Smith *nn = n; 2583a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2593b2fbd54SBarry Smith if (symmetric) { 2609566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja)); 2613b2fbd54SBarry Smith } else { 2629566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 2639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 2649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 2653b2fbd54SBarry Smith jj = a->j; 2663b2fbd54SBarry Smith for (i=0; i<nz; i++) { 267bfeeae90SHong Zhang collengths[jj[i]]++; 2683b2fbd54SBarry Smith } 2693b2fbd54SBarry Smith cia[0] = oshift; 2703b2fbd54SBarry Smith for (i=0; i<n; i++) { 2713b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2723b2fbd54SBarry Smith } 2739566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 2743b2fbd54SBarry Smith jj = a->j; 275a93ec695SBarry Smith for (row=0; row<m; row++) { 276a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 277a93ec695SBarry Smith for (i=0; i<mr; i++) { 278bfeeae90SHong Zhang col = *jj++; 2792205254eSKarl Rupp 2803b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2813b2fbd54SBarry Smith } 2823b2fbd54SBarry Smith } 2839566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2843b2fbd54SBarry Smith *ia = cia; *ja = cja; 2853b2fbd54SBarry Smith } 2863a40ed3dSBarry Smith PetscFunctionReturn(0); 2873b2fbd54SBarry Smith } 2883b2fbd54SBarry Smith 2891a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2903b2fbd54SBarry Smith { 2913a40ed3dSBarry Smith PetscFunctionBegin; 2923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2933b2fbd54SBarry Smith 2949566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2963a40ed3dSBarry Smith PetscFunctionReturn(0); 2973b2fbd54SBarry Smith } 2983b2fbd54SBarry Smith 2997cee066cSHong Zhang /* 3007cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 302040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3037cee066cSHong Zhang */ 3047cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3057cee066cSHong Zhang { 3067cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3077cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 308071fcb05SBarry Smith PetscInt nz = a->i[m],row,mr,col,tmp; 3097cee066cSHong Zhang PetscInt *cspidx; 310071fcb05SBarry Smith const PetscInt *jj; 3117cee066cSHong Zhang 3127cee066cSHong Zhang PetscFunctionBegin; 3137cee066cSHong Zhang *nn = n; 3147cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 315625f6d37SHong Zhang 3169566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 3179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 3189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cspidx)); 3207cee066cSHong Zhang jj = a->j; 3217cee066cSHong Zhang for (i=0; i<nz; i++) { 3227cee066cSHong Zhang collengths[jj[i]]++; 3237cee066cSHong Zhang } 3247cee066cSHong Zhang cia[0] = oshift; 3257cee066cSHong Zhang for (i=0; i<n; i++) { 3267cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3277cee066cSHong Zhang } 3289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 3297cee066cSHong Zhang jj = a->j; 3307cee066cSHong Zhang for (row=0; row<m; row++) { 3317cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3327cee066cSHong Zhang for (i=0; i<mr; i++) { 3337cee066cSHong Zhang col = *jj++; 334071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 335071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 336071fcb05SBarry Smith cja[tmp] = row + oshift; 3377cee066cSHong Zhang } 3387cee066cSHong Zhang } 3399566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 340071fcb05SBarry Smith *ia = cia; 341071fcb05SBarry Smith *ja = cja; 3427cee066cSHong Zhang *spidx = cspidx; 3437cee066cSHong Zhang PetscFunctionReturn(0); 3447cee066cSHong Zhang } 3457cee066cSHong Zhang 3467cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3477cee066cSHong Zhang { 3487cee066cSHong Zhang PetscFunctionBegin; 3499566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done)); 3509566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3517cee066cSHong Zhang PetscFunctionReturn(0); 3527cee066cSHong Zhang } 3537cee066cSHong Zhang 35487d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 35587d4246cSBarry Smith { 35687d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35787d4246cSBarry Smith PetscInt *ai = a->i; 358fff043a9SJunchao Zhang PetscScalar *aa; 35987d4246cSBarry Smith 36087d4246cSBarry Smith PetscFunctionBegin; 3619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 3629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa+ai[row],v,ai[row+1]-ai[row])); 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 36487d4246cSBarry Smith PetscFunctionReturn(0); 36587d4246cSBarry Smith } 36687d4246cSBarry Smith 367bd04181cSBarry Smith /* 368bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 369bd04181cSBarry Smith 370bd04181cSBarry Smith - a single row of values is set with each call 371bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 372bd04181cSBarry Smith - the values are always added to the matrix, not set 373bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 374bd04181cSBarry Smith 3751f763a69SBarry Smith This does NOT assume the global column indices are sorted 376bd04181cSBarry Smith 3771f763a69SBarry Smith */ 378bd04181cSBarry Smith 379af0996ceSBarry Smith #include <petsc/private/isimpl.h> 380189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 381189e4007SBarry Smith { 382189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3831f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3841f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 3851f763a69SBarry Smith PetscInt lastcol = -1; 386fff043a9SJunchao Zhang MatScalar *ap,value,*aa; 387189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 388189e4007SBarry Smith 389fff043a9SJunchao Zhang PetscFunctionBegin; 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 391f38dd0b8SBarry Smith row = ridx[im[0]]; 3921f763a69SBarry Smith rp = aj + ai[row]; 3931f763a69SBarry Smith ap = aa + ai[row]; 3941f763a69SBarry Smith nrow = ailen[row]; 395189e4007SBarry Smith low = 0; 396189e4007SBarry Smith high = nrow; 397189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 398189e4007SBarry Smith col = cidx[in[l]]; 399f38dd0b8SBarry Smith value = v[l]; 400189e4007SBarry Smith 401189e4007SBarry Smith if (col <= lastcol) low = 0; 402189e4007SBarry Smith else high = nrow; 403189e4007SBarry Smith lastcol = col; 404189e4007SBarry Smith while (high-low > 5) { 405189e4007SBarry Smith t = (low+high)/2; 406189e4007SBarry Smith if (rp[t] > col) high = t; 407189e4007SBarry Smith else low = t; 408189e4007SBarry Smith } 409189e4007SBarry Smith for (i=low; i<high; i++) { 410189e4007SBarry Smith if (rp[i] == col) { 4111f763a69SBarry Smith ap[i] += value; 412189e4007SBarry Smith low = i + 1; 4131f763a69SBarry Smith break; 414189e4007SBarry Smith } 415189e4007SBarry Smith } 416189e4007SBarry Smith } 4179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 418f38dd0b8SBarry Smith return 0; 419189e4007SBarry Smith } 420189e4007SBarry Smith 42197f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 42217ab2063SBarry Smith { 423416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 424e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 42597f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 426e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 427ce496241SStefano Zampini MatScalar *ap=NULL,value=0.0,*aa; 428ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 429ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 43017ab2063SBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 4329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 43317ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 434416022c9SBarry Smith row = im[k]; 4355ef9f2a5SBarry Smith if (row < 0) continue; 4366bdcaf15SBarry Smith PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 437720833daSHong Zhang rp = aj + ai[row]; 438876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 43917ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 440416022c9SBarry Smith low = 0; 441c71e6ed7SBarry Smith high = nrow; 44217ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4435ef9f2a5SBarry Smith if (in[l] < 0) continue; 4446bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 445bfeeae90SHong Zhang col = in[l]; 446071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m]; 447071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 44836db0b34SBarry Smith 4492205254eSKarl Rupp if (col <= lastcol) low = 0; 4502205254eSKarl Rupp else high = nrow; 451e2ee6c50SBarry Smith lastcol = col; 452416022c9SBarry Smith while (high-low > 5) { 453416022c9SBarry Smith t = (low+high)/2; 454416022c9SBarry Smith if (rp[t] > col) high = t; 455416022c9SBarry Smith else low = t; 45617ab2063SBarry Smith } 457416022c9SBarry Smith for (i=low; i<high; i++) { 45817ab2063SBarry Smith if (rp[i] > col) break; 45917ab2063SBarry Smith if (rp[i] == col) { 460876c6284SHong Zhang if (!A->structure_only) { 4610c0d7e18SFande Kong if (is == ADD_VALUES) { 4620c0d7e18SFande Kong ap[i] += value; 4630c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4640c0d7e18SFande Kong } 46517ab2063SBarry Smith else ap[i] = value; 466720833daSHong Zhang } 467e44c0bd4SBarry Smith low = i + 1; 46817ab2063SBarry Smith goto noinsert; 46917ab2063SBarry Smith } 47017ab2063SBarry Smith } 471dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 472c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 47308401ef6SPierre Jolivet PetscCheck(nonew != -1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix",row,col); 474720833daSHong Zhang if (A->structure_only) { 475876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 476720833daSHong Zhang } else { 477fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 478720833daSHong Zhang } 479c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 480416022c9SBarry Smith /* shift up all the later entries in this row */ 4819566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp+i+1,rp+i,N-i+1)); 48217ab2063SBarry Smith rp[i] = col; 483580bdb30SBarry Smith if (!A->structure_only) { 4849566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap+i+1,ap+i,N-i+1)); 485580bdb30SBarry Smith ap[i] = value; 486580bdb30SBarry Smith } 487416022c9SBarry Smith low = i + 1; 488e56f5c9eSBarry Smith A->nonzerostate++; 489e44c0bd4SBarry Smith noinsert:; 49017ab2063SBarry Smith } 49117ab2063SBarry Smith ailen[row] = nrow; 49217ab2063SBarry Smith } 4939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 4943a40ed3dSBarry Smith PetscFunctionReturn(0); 49517ab2063SBarry Smith } 49617ab2063SBarry Smith 49719b08ed1SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 49819b08ed1SBarry Smith { 49919b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 50019b08ed1SBarry Smith PetscInt *rp,k,row; 50119b08ed1SBarry Smith PetscInt *ai = a->i; 50219b08ed1SBarry Smith PetscInt *aj = a->j; 503fff043a9SJunchao Zhang MatScalar *aa,*ap; 50419b08ed1SBarry Smith 50519b08ed1SBarry Smith PetscFunctionBegin; 50628b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot call on assembled matrix."); 50708401ef6SPierre Jolivet PetscCheck(m*n+a->nz <= a->maxnz,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()",a->maxnz); 508fff043a9SJunchao Zhang 5099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 51019b08ed1SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 51119b08ed1SBarry Smith row = im[k]; 51219b08ed1SBarry Smith rp = aj + ai[row]; 51319b08ed1SBarry Smith ap = aa + ai[row]; 51419b08ed1SBarry Smith 5159566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 51619b08ed1SBarry Smith if (!A->structure_only) { 51719b08ed1SBarry Smith if (v) { 5189566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 51919b08ed1SBarry Smith v += n; 52019b08ed1SBarry Smith } else { 5219566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 52219b08ed1SBarry Smith } 52319b08ed1SBarry Smith } 52419b08ed1SBarry Smith a->ilen[row] = n; 52519b08ed1SBarry Smith a->imax[row] = n; 52619b08ed1SBarry Smith a->i[row+1] = a->i[row]+n; 52719b08ed1SBarry Smith a->nz += n; 52819b08ed1SBarry Smith } 5299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 53019b08ed1SBarry Smith PetscFunctionReturn(0); 53119b08ed1SBarry Smith } 53219b08ed1SBarry Smith 53319b08ed1SBarry Smith /*@ 53419b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith Input Parameters: 53719b08ed1SBarry Smith + A - the SeqAIJ matrix 53819b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith Level: advanced 54119b08ed1SBarry Smith 54219b08ed1SBarry Smith Notes: 54319b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 54419b08ed1SBarry Smith Simply call MatSetValues() after this call to provide the matrix entries in the usual manner. This matrix may be used 54519b08ed1SBarry Smith as always with multiple matrix assemblies. 54619b08ed1SBarry Smith 547db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 54819b08ed1SBarry Smith @*/ 54919b08ed1SBarry Smith 55019b08ed1SBarry Smith PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A,PetscInt nztotal) 55119b08ed1SBarry Smith { 55219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 55319b08ed1SBarry Smith 55419b08ed1SBarry Smith PetscFunctionBegin; 5559566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 55719b08ed1SBarry Smith a->maxnz = nztotal; 55819b08ed1SBarry Smith if (!a->imax) { 5599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->imax)); 5609566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith if (!a->ilen) { 5639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->ilen)); 5649566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56519b08ed1SBarry Smith } else { 5669566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen,A->rmap->n*sizeof(PetscInt))); 56719b08ed1SBarry Smith } 56819b08ed1SBarry Smith 56919b08ed1SBarry Smith /* allocate the matrix space */ 57019b08ed1SBarry Smith if (A->structure_only) { 5719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal,&a->j)); 5729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&a->i)); 5739566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*sizeof(PetscInt))); 57419b08ed1SBarry Smith } else { 5759566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal,&a->a,nztotal,&a->j,A->rmap->n+1,&a->i)); 5769566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*(sizeof(PetscScalar)+sizeof(PetscInt)))); 57719b08ed1SBarry Smith } 57819b08ed1SBarry Smith a->i[0] = 0; 57919b08ed1SBarry Smith if (A->structure_only) { 58019b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 58119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 58219b08ed1SBarry Smith } else { 58319b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 58419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 58519b08ed1SBarry Smith } 58619b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 58719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 58819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 58919b08ed1SBarry Smith PetscFunctionReturn(0); 59019b08ed1SBarry Smith } 59119b08ed1SBarry Smith 592071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 593071fcb05SBarry Smith { 594071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 595071fcb05SBarry Smith PetscInt *rp,k,row; 596071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 597071fcb05SBarry Smith PetscInt *aj = a->j; 598fff043a9SJunchao Zhang MatScalar *aa,*ap; 599071fcb05SBarry Smith 600071fcb05SBarry Smith PetscFunctionBegin; 6019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 602071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 603071fcb05SBarry Smith row = im[k]; 6046bdcaf15SBarry Smith PetscCheck(n <= a->imax[row],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Preallocation for row %" PetscInt_FMT " does not match number of columns provided",n); 605071fcb05SBarry Smith rp = aj + ai[row]; 606071fcb05SBarry Smith ap = aa + ai[row]; 607071fcb05SBarry Smith if (!A->was_assembled) { 6089566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 609071fcb05SBarry Smith } 610071fcb05SBarry Smith if (!A->structure_only) { 611071fcb05SBarry Smith if (v) { 6129566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 613071fcb05SBarry Smith v += n; 614071fcb05SBarry Smith } else { 6159566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 616071fcb05SBarry Smith } 617071fcb05SBarry Smith } 618071fcb05SBarry Smith ailen[row] = n; 619071fcb05SBarry Smith a->nz += n; 620071fcb05SBarry Smith } 6219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 622071fcb05SBarry Smith PetscFunctionReturn(0); 623071fcb05SBarry Smith } 624071fcb05SBarry Smith 625a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 6267eb43aa7SLois Curfman McInnes { 6277eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 62897f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 62997f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 630fff043a9SJunchao Zhang MatScalar *ap,*aa; 6317eb43aa7SLois Curfman McInnes 6323a40ed3dSBarry Smith PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 6347eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 6357eb43aa7SLois Curfman McInnes row = im[k]; 63654c59aa7SJacob Faibussowitsch if (row < 0) {v += n; continue;} /* negative row */ 63754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 638bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 6397eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6407eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 64154c59aa7SJacob Faibussowitsch if (in[l] < 0) {v++; continue;} /* negative column */ 64254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 643bfeeae90SHong Zhang col = in[l]; 6447eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 6457eb43aa7SLois Curfman McInnes while (high-low > 5) { 6467eb43aa7SLois Curfman McInnes t = (low+high)/2; 6477eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6487eb43aa7SLois Curfman McInnes else low = t; 6497eb43aa7SLois Curfman McInnes } 6507eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 6517eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6527eb43aa7SLois Curfman McInnes if (rp[i] == col) { 653b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6547eb43aa7SLois Curfman McInnes goto finished; 6557eb43aa7SLois Curfman McInnes } 6567eb43aa7SLois Curfman McInnes } 65797e567efSBarry Smith *v++ = 0.0; 6587eb43aa7SLois Curfman McInnes finished:; 6597eb43aa7SLois Curfman McInnes } 6607eb43aa7SLois Curfman McInnes } 6619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 6623a40ed3dSBarry Smith PetscFunctionReturn(0); 6637eb43aa7SLois Curfman McInnes } 6647eb43aa7SLois Curfman McInnes 6653ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 66617ab2063SBarry Smith { 6673ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 668c898d852SStefano Zampini const PetscScalar *av; 6693ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6703ea6fe3dSLisandro Dalcin PetscInt *rowlens; 67117ab2063SBarry Smith 6723a40ed3dSBarry Smith PetscFunctionBegin; 6739566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6742205254eSKarl Rupp 6753ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6763ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6773ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6783ea6fe3dSLisandro Dalcin nz = A->nz; 679416022c9SBarry Smith 6803ea6fe3dSLisandro Dalcin /* write matrix header */ 6813ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6823ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6839566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,header,4,PETSC_INT)); 684416022c9SBarry Smith 6853ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&rowlens)); 6873ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6889566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT)); 6899566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6903ea6fe3dSLisandro Dalcin /* store column indices */ 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT)); 692416022c9SBarry Smith /* store nonzero values */ 6939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat,&av)); 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,av,nz,PETSC_SCALAR)); 6959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat,&av)); 696b37d52dbSMark F. Adams 6973ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6989566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat,viewer)); 6993a40ed3dSBarry Smith PetscFunctionReturn(0); 70017ab2063SBarry Smith } 701416022c9SBarry Smith 7027dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 7037dc0baabSHong Zhang { 7047dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7057dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 7067dc0baabSHong Zhang 7077dc0baabSHong Zhang PetscFunctionBegin; 7089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7097dc0baabSHong Zhang for (i=0; i<m; i++) { 7109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 7117dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 7129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ") ",a->j[k])); 7137dc0baabSHong Zhang } 7149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 7157dc0baabSHong Zhang } 7169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 7177dc0baabSHong Zhang PetscFunctionReturn(0); 7187dc0baabSHong Zhang } 7197dc0baabSHong Zhang 72009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 721cd155464SBarry Smith 722dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 723416022c9SBarry Smith { 724416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 725c898d852SStefano Zampini const PetscScalar *av; 72660e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 727e060cb09SBarry Smith const char *name; 728f3ef73ceSBarry Smith PetscViewerFormat format; 72917ab2063SBarry Smith 7303a40ed3dSBarry Smith PetscFunctionBegin; 7317dc0baabSHong Zhang if (A->structure_only) { 7329566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A,viewer)); 7337dc0baabSHong Zhang PetscFunctionReturn(0); 7347dc0baabSHong Zhang } 73543e49210SHong Zhang 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 7372e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7382e5835c6SStefano Zampini 739c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 7419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 74271c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 74397f1f81fSBarry Smith PetscInt nofinalvalue = 0; 74460e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 745c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 746d00d2cf4SBarry Smith nofinalvalue = 1; 747d00d2cf4SBarry Smith } 7489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n",m,A->cmap->n)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %" PetscInt_FMT " \n",a->nz)); 751fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",4);\n",a->nz+nofinalvalue)); 753fbfe6fa7SJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",3);\n",a->nz+nofinalvalue)); 755fbfe6fa7SJed Brown #endif 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = [\n")); 75717ab2063SBarry Smith 75817ab2063SBarry Smith for (i=0; i<m; i++) { 75960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 760aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 76217ab2063SBarry Smith #else 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",i+1,a->j[j]+1,(double)a->a[j])); 76417ab2063SBarry Smith #endif 76517ab2063SBarry Smith } 76617ab2063SBarry Smith } 767d00d2cf4SBarry Smith if (nofinalvalue) { 768c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",m,A->cmap->n,0.,0.)); 770c337ccceSJed Brown #else 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",m,A->cmap->n,0.0)); 772c337ccceSJed Brown #endif 773d00d2cf4SBarry Smith } 7749566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A,&name)); 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name)); 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 777fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 77944cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 78160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 78536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 78736db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 7896831982aSBarry Smith } 79044cd7ae7SLois Curfman McInnes #else 7919566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 79244cd7ae7SLois Curfman McInnes #endif 79344cd7ae7SLois Curfman McInnes } 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 79544cd7ae7SLois Curfman McInnes } 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 797fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 79897f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&sptr)); 801496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 802496be53dSLois Curfman McInnes sptr[i] = nzd+1; 80360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 804496be53dSLois Curfman McInnes if (a->j[j] >= i) { 805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 807496be53dSLois Curfman McInnes #else 808496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 809496be53dSLois Curfman McInnes #endif 810496be53dSLois Curfman McInnes } 811496be53dSLois Curfman McInnes } 812496be53dSLois Curfman McInnes } 8132e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 8149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n\n",m,nzd)); 8152e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 8162205254eSKarl Rupp if (i+4<m) { 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5])); 8182205254eSKarl Rupp } else if (i+3<m) { 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4])); 8202205254eSKarl Rupp } else if (i+2<m) { 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3])); 8222205254eSKarl Rupp } else if (i+1<m) { 8239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2])); 8242205254eSKarl Rupp } else if (i<m) { 8259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1])); 8262205254eSKarl Rupp } else { 8279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT "\n",sptr[i])); 8282205254eSKarl Rupp } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 8319566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 832496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 83360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8349566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " ",a->j[j]+fshift)); 835496be53dSLois Curfman McInnes } 8369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 837496be53dSLois Curfman McInnes } 8389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 839496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 84060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 841496be53dSLois Curfman McInnes if (a->j[j] >= i) { 842aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 8449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 8456831982aSBarry Smith } 846496be53dSLois Curfman McInnes #else 8479566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j])); 848496be53dSLois Curfman McInnes #endif 849496be53dSLois Curfman McInnes } 850496be53dSLois Curfman McInnes } 8519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 852496be53dSLois Curfman McInnes } 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 854fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 85597f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 85687828ca2SBarry Smith PetscScalar value; 85768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 85968f1ed48SBarry Smith 86068f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 86168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 86268f1ed48SBarry Smith realonly = PETSC_FALSE; 86368f1ed48SBarry Smith break; 86468f1ed48SBarry Smith } 86568f1ed48SBarry Smith } 86668f1ed48SBarry Smith #endif 86702594712SBarry Smith 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 86902594712SBarry Smith for (i=0; i<m; i++) { 87002594712SBarry Smith jcnt = 0; 871d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 872e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 87302594712SBarry Smith value = a->a[cnt++]; 874e24b481bSBarry Smith jcnt++; 87502594712SBarry Smith } else { 87602594712SBarry Smith value = 0.0; 87702594712SBarry Smith } 878aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 87968f1ed48SBarry Smith if (realonly) { 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value))); 88168f1ed48SBarry Smith } else { 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value))); 88368f1ed48SBarry Smith } 88402594712SBarry Smith #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value)); 88602594712SBarry Smith #endif 88702594712SBarry Smith } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 88902594712SBarry Smith } 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 8913c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 892150b93efSMatthew G. Knepley PetscInt fshift=1; 8939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8943c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n")); 8963c215bfdSMatthew Knepley #else 8979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n")); 8983c215bfdSMatthew Knepley #endif 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 9003c215bfdSMatthew Knepley for (i=0; i<m; i++) { 90160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 9023c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 9043c215bfdSMatthew Knepley #else 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j])); 9063c215bfdSMatthew Knepley #endif 9073c215bfdSMatthew Knepley } 9083c215bfdSMatthew Knepley } 9099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 9103a40ed3dSBarry Smith } else { 9119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 912d5f3da31SBarry Smith if (A->factortype) { 91316cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 91516cd7e1dSShri Abhyankar /* L part */ 91660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 91716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 92016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 92216cd7e1dSShri Abhyankar } else { 9239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 92416cd7e1dSShri Abhyankar } 92516cd7e1dSShri Abhyankar #else 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 92716cd7e1dSShri Abhyankar #endif 92816cd7e1dSShri Abhyankar } 92916cd7e1dSShri Abhyankar /* diagonal */ 93016cd7e1dSShri Abhyankar j = a->diag[i]; 93116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 93216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]))); 93416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])))); 93616cd7e1dSShri Abhyankar } else { 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]))); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar #else 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)(1.0/a->a[j]))); 94116cd7e1dSShri Abhyankar #endif 94216cd7e1dSShri Abhyankar 94316cd7e1dSShri Abhyankar /* U part */ 94460e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 94516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 94616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 94816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 95016cd7e1dSShri Abhyankar } else { 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 95216cd7e1dSShri Abhyankar } 95316cd7e1dSShri Abhyankar #else 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 95516cd7e1dSShri Abhyankar #endif 95616cd7e1dSShri Abhyankar } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 95816cd7e1dSShri Abhyankar } 95916cd7e1dSShri Abhyankar } else { 96017ab2063SBarry Smith for (i=0; i<m; i++) { 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 96260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 963aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 96436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 96636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 9683a40ed3dSBarry Smith } else { 9699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 97017ab2063SBarry Smith } 97117ab2063SBarry Smith #else 9729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 97317ab2063SBarry Smith #endif 97417ab2063SBarry Smith } 9759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 97617ab2063SBarry Smith } 97716cd7e1dSShri Abhyankar } 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 97917ab2063SBarry Smith } 9809566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9813a40ed3dSBarry Smith PetscFunctionReturn(0); 982416022c9SBarry Smith } 983416022c9SBarry Smith 9849804daf3SBarry Smith #include <petscdraw.h> 985dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 986416022c9SBarry Smith { 987480ef9eaSBarry Smith Mat A = (Mat) Aa; 988416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 989383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 990383922c3SLisandro Dalcin int color; 991b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 992b0a32e0cSBarry Smith PetscViewer viewer; 993f3ef73ceSBarry Smith PetscViewerFormat format; 994fff043a9SJunchao Zhang const PetscScalar *aa; 995cddf8d76SBarry Smith 9963a40ed3dSBarry Smith PetscFunctionBegin; 9979566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer)); 9989566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 9999566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr)); 1000383922c3SLisandro Dalcin 1001416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 10029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1003fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1004d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10050513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 1006b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1007416022c9SBarry Smith for (i=0; i<m; i++) { 1008cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1009bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1010bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1011fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 10129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1013cddf8d76SBarry Smith } 1014cddf8d76SBarry Smith } 1015b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 1016cddf8d76SBarry Smith for (i=0; i<m; i++) { 1017cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1018bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1019bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1020fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10219566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1022cddf8d76SBarry Smith } 1023cddf8d76SBarry Smith } 1024b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1025cddf8d76SBarry Smith for (i=0; i<m; i++) { 1026cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1027bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1028bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1029fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10309566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1031416022c9SBarry Smith } 1032416022c9SBarry Smith } 1033d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10340513a670SBarry Smith } else { 10350513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10360513a670SBarry Smith /* first determine max of all nonzero values */ 1037b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1038383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1039b0a32e0cSBarry Smith PetscDraw popup; 10400513a670SBarry Smith 10410513a670SBarry Smith for (i=0; i<nz; i++) { 1042fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10430513a670SBarry Smith } 1044383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10459566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw,&popup)); 10469566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup,minv,maxv)); 1047383922c3SLisandro Dalcin 1048d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10490513a670SBarry Smith for (i=0; i<m; i++) { 1050383922c3SLisandro Dalcin y_l = m - i - 1.0; 1051383922c3SLisandro Dalcin y_r = y_l + 1.0; 1052bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1053383922c3SLisandro Dalcin x_l = a->j[j]; 1054383922c3SLisandro Dalcin x_r = x_l + 1.0; 1055fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]),minv,maxv); 10569566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 10570513a670SBarry Smith count++; 10580513a670SBarry Smith } 10590513a670SBarry Smith } 1060d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10610513a670SBarry Smith } 10629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1063480ef9eaSBarry Smith PetscFunctionReturn(0); 1064480ef9eaSBarry Smith } 1065cddf8d76SBarry Smith 10669804daf3SBarry Smith #include <petscdraw.h> 1067dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 1068480ef9eaSBarry Smith { 1069b0a32e0cSBarry Smith PetscDraw draw; 107036db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1071ace3abfcSBarry Smith PetscBool isnull; 1072480ef9eaSBarry Smith 1073480ef9eaSBarry Smith PetscFunctionBegin; 10749566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer,0,&draw)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw,&isnull)); 1076480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1077480ef9eaSBarry Smith 1078d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1079480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 10809566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw,xl,yl,xr,yr)); 10819566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer)); 10829566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A)); 10839566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL)); 10849566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 1086416022c9SBarry Smith } 1087416022c9SBarry Smith 1088dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1089416022c9SBarry Smith { 1090ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1091416022c9SBarry Smith 10923a40ed3dSBarry Smith PetscFunctionBegin; 10939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii)); 10949566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw)); 1096c45a1595SBarry Smith if (iascii) { 10979566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII(A,viewer)); 10980f5bd95cSBarry Smith } else if (isbinary) { 10999566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Binary(A,viewer)); 11000f5bd95cSBarry Smith } else if (isdraw) { 11019566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Draw(A,viewer)); 110211aeaf0aSBarry Smith } 11039566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A,viewer)); 11043a40ed3dSBarry Smith PetscFunctionReturn(0); 110517ab2063SBarry Smith } 110619bcc07fSBarry Smith 1107dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 110817ab2063SBarry Smith { 1109416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1110580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1111d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 111254f21887SBarry Smith MatScalar *aa = a->a,*ap; 11133447b6efSHong Zhang PetscReal ratio = 0.6; 111417ab2063SBarry Smith 11153a40ed3dSBarry Smith PetscFunctionBegin; 11163a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 11179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1118b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1119b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11209566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 1121b215bc84SStefano Zampini PetscFunctionReturn(0); 1122b215bc84SStefano Zampini } 112317ab2063SBarry Smith 112443ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 112517ab2063SBarry Smith for (i=1; i<m; i++) { 1126416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 112717ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 112894a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 112917ab2063SBarry Smith if (fshift) { 1130bfeeae90SHong Zhang ip = aj + ai[i]; 1131bfeeae90SHong Zhang ap = aa + ai[i]; 113217ab2063SBarry Smith N = ailen[i]; 11339566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip-fshift,ip,N)); 1134580bdb30SBarry Smith if (!A->structure_only) { 11359566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap-fshift,ap,N)); 113617ab2063SBarry Smith } 113717ab2063SBarry Smith } 113817ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 113917ab2063SBarry Smith } 114017ab2063SBarry Smith if (m) { 114117ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 114217ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 114317ab2063SBarry Smith } 11447b083b7cSBarry Smith 114517ab2063SBarry Smith /* reset ilen and imax for each row */ 11467b083b7cSBarry Smith a->nonzerorowcnt = 0; 1147396832f4SHong Zhang if (A->structure_only) { 11489566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11499566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1150396832f4SHong Zhang } else { /* !A->structure_only */ 115117ab2063SBarry Smith for (i=0; i<m; i++) { 115217ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 11537b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 115417ab2063SBarry Smith } 1155396832f4SHong Zhang } 1156bfeeae90SHong Zhang a->nz = ai[m]; 1157aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1,PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 115817ab2063SBarry Smith 11599566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11609566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n",m,A->cmap->n,fshift,a->nz)); 11619566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n",a->reallocs)); 11629566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Maximum nonzeros in any row is %" PetscInt_FMT "\n",rmax)); 11632205254eSKarl Rupp 11648e58a170SBarry Smith A->info.mallocs += a->reallocs; 1165dd5f02e7SSatish Balay a->reallocs = 0; 11666712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 116736db0b34SBarry Smith a->rmax = rmax; 11684e220ebcSLois Curfman McInnes 1169396832f4SHong Zhang if (!A->structure_only) { 11709566063dSJacob Faibussowitsch PetscCall(MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio)); 1171396832f4SHong Zhang } 11729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 11733a40ed3dSBarry Smith PetscFunctionReturn(0); 117417ab2063SBarry Smith } 117517ab2063SBarry Smith 117699cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 117799cafbc1SBarry Smith { 117899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 117999cafbc1SBarry Smith PetscInt i,nz = a->nz; 11802e5835c6SStefano Zampini MatScalar *aa; 118199cafbc1SBarry Smith 118299cafbc1SBarry Smith PetscFunctionBegin; 11839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 118499cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 11859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 118799cafbc1SBarry Smith PetscFunctionReturn(0); 118899cafbc1SBarry Smith } 118999cafbc1SBarry Smith 119099cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 119199cafbc1SBarry Smith { 119299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 119399cafbc1SBarry Smith PetscInt i,nz = a->nz; 11942e5835c6SStefano Zampini MatScalar *aa; 119599cafbc1SBarry Smith 119699cafbc1SBarry Smith PetscFunctionBegin; 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 119899cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 120199cafbc1SBarry Smith PetscFunctionReturn(0); 120299cafbc1SBarry Smith } 120399cafbc1SBarry Smith 1204dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 120517ab2063SBarry Smith { 1206fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1207fff043a9SJunchao Zhang MatScalar *aa; 12083a40ed3dSBarry Smith 12093a40ed3dSBarry Smith PetscFunctionBegin; 12109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A,&aa)); 12119566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa,a->i[A->rmap->n])); 12129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A,&aa)); 12139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12143a40ed3dSBarry Smith PetscFunctionReturn(0); 121517ab2063SBarry Smith } 1216416022c9SBarry Smith 1217cbc6b225SStefano Zampini PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1218cbc6b225SStefano Zampini { 1219cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1220cbc6b225SStefano Zampini 1221cbc6b225SStefano Zampini PetscFunctionBegin; 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1224cbc6b225SStefano Zampini PetscFunctionReturn(0); 1225cbc6b225SStefano Zampini } 1226cbc6b225SStefano Zampini 1227dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 122817ab2063SBarry Smith { 1229416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1230d5d45c9bSBarry Smith 12313a40ed3dSBarry Smith PetscFunctionBegin; 1232aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1233c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A,"Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT,A->rmap->n,A->cmap->n,a->nz); 123417ab2063SBarry Smith #endif 12359566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i)); 12369566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12389566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12399566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12409566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12419566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12429566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12439566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12449566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag,a->mdiag,a->ssor_work)); 12459566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12469566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12479566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12489566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i,a->compressedrow.rindex)); 12499566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12509566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1251901853e0SKris Buschelman 12526718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12536718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12546718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12556718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12566718818eSStefano Zampini due to different matrix sizes */ 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL)); 12586718818eSStefano Zampini 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A,NULL)); 1260*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEnginePut_C",NULL)); 1261*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEngineGet_C",NULL)); 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL)); 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL)); 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL)); 1268*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijsell_C",NULL)); 1269*2e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 1270*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijmkl_C",NULL)); 1271*2e956fe4SStefano Zampini #endif 12724222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",NULL)); 12764222ddf1SHong Zhang #endif 12773d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijkokkos_C",NULL)); 12793d0639e7SStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL)); 1281af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL)); 1283af8000cdSHong Zhang #endif 1284d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_scalapack_C",NULL)); 1286d24d4204SJose E. Roman #endif 128763c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL)); 129063c07aadSStefano Zampini #endif 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL)); 1295*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsHermitianTranspose_C",NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL)); 13029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL)); 13039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJKron_C",NULL)); 13049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL)); 13059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL)); 1306*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverType_C",NULL)); 1307*2e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 1308*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijsell_seqaij_C",NULL)); 1309*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijperm_seqaij_C",NULL)); 1310*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijviennacl_C",NULL)); 1311*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqdense_C",NULL)); 1312*2e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqaij_C",NULL)); 13133a40ed3dSBarry Smith PetscFunctionReturn(0); 131417ab2063SBarry Smith } 131517ab2063SBarry Smith 1316ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 131717ab2063SBarry Smith { 1318416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 13193a40ed3dSBarry Smith 13203a40ed3dSBarry Smith PetscFunctionBegin; 1321a65d3064SKris Buschelman switch (op) { 1322a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 13234e0d8c25SBarry Smith a->roworiented = flg; 1324a65d3064SKris Buschelman break; 1325a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1326a9817697SBarry Smith a->keepnonzeropattern = flg; 1327a65d3064SKris Buschelman break; 1328512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1329512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1330a65d3064SKris Buschelman break; 1331a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13324e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1333a65d3064SKris Buschelman break; 1334a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 13354e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1336a65d3064SKris Buschelman break; 133728b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 133828b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 133928b2fa4aSMatthew Knepley break; 1340a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 13414e0d8c25SBarry Smith a->ignorezeroentries = flg; 13420df259c2SBarry Smith break; 13433d472b54SHong Zhang case MAT_SPD: 1344b1646e73SJed Brown case MAT_SYMMETRIC: 1345b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1346b1646e73SJed Brown case MAT_HERMITIAN: 1347b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1348957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 13495021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 13505021d80fSJed Brown break; 13518c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1352a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1353a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 13549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Option %s ignored\n",MatOptions[op])); 1355a65d3064SKris Buschelman break; 1356b87ac2d8SJed Brown case MAT_USE_INODES: 13579566063dSJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A,MAT_USE_INODES,flg)); 1358b87ac2d8SJed Brown break; 1359c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1360c10200c1SHong Zhang A->submat_singleis = flg; 1361c10200c1SHong Zhang break; 1362071fcb05SBarry Smith case MAT_SORTED_FULL: 1363071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1364071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1365071fcb05SBarry Smith break; 13661a2c6b5cSJunchao Zhang case MAT_FORM_EXPLICIT_TRANSPOSE: 13671a2c6b5cSJunchao Zhang A->form_explicit_transpose = flg; 13681a2c6b5cSJunchao Zhang break; 1369a65d3064SKris Buschelman default: 137098921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1371a65d3064SKris Buschelman } 13723a40ed3dSBarry Smith PetscFunctionReturn(0); 137317ab2063SBarry Smith } 137417ab2063SBarry Smith 1375dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 137617ab2063SBarry Smith { 1377416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1378fdc842d1SBarry Smith PetscInt i,j,n,*ai=a->i,*aj=a->j; 1379c898d852SStefano Zampini PetscScalar *x; 1380c898d852SStefano Zampini const PetscScalar *aa; 138117ab2063SBarry Smith 13823a40ed3dSBarry Smith PetscFunctionBegin; 13839566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 138408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 13859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1386d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1387d3e70bfaSHong Zhang PetscInt *diag=a->diag; 13889566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 13892c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 13909566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 13919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 139235e7444dSHong Zhang PetscFunctionReturn(0); 139335e7444dSHong Zhang } 139435e7444dSHong Zhang 13959566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 139635e7444dSHong Zhang for (i=0; i<n; i++) { 1397fdc842d1SBarry Smith x[i] = 0.0; 139835e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 139935e7444dSHong Zhang if (aj[j] == i) { 140035e7444dSHong Zhang x[i] = aa[j]; 140117ab2063SBarry Smith break; 140217ab2063SBarry Smith } 140317ab2063SBarry Smith } 140417ab2063SBarry Smith } 14059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 14069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14073a40ed3dSBarry Smith PetscFunctionReturn(0); 140817ab2063SBarry Smith } 140917ab2063SBarry Smith 1410c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1411dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 141217ab2063SBarry Smith { 1413416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14145f22a7b3SSebastian Grimberg const MatScalar *aa; 1415d9ca1df4SBarry Smith PetscScalar *y; 1416d9ca1df4SBarry Smith const PetscScalar *x; 1417d0f46423SBarry Smith PetscInt m = A->rmap->n; 14185c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14195f22a7b3SSebastian Grimberg const MatScalar *v; 1420a77337e4SBarry Smith PetscScalar alpha; 1421d9ca1df4SBarry Smith PetscInt n,i,j; 1422d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 14233447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1424ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14255c897100SBarry Smith #endif 142617ab2063SBarry Smith 14273a40ed3dSBarry Smith PetscFunctionBegin; 14289566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz,yy)); 14299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14309566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 14319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 14325c897100SBarry Smith 14335c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1434fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,aa,y); 14355c897100SBarry Smith #else 14363447b6efSHong Zhang if (usecprow) { 14373447b6efSHong Zhang m = cprow.nrows; 14383447b6efSHong Zhang ii = cprow.i; 14397b2bb3b9SHong Zhang ridx = cprow.rindex; 14403447b6efSHong Zhang } else { 14413447b6efSHong Zhang ii = a->i; 14423447b6efSHong Zhang } 144317ab2063SBarry Smith for (i=0; i<m; i++) { 14443447b6efSHong Zhang idx = a->j + ii[i]; 1445fff043a9SJunchao Zhang v = aa + ii[i]; 14463447b6efSHong Zhang n = ii[i+1] - ii[i]; 14473447b6efSHong Zhang if (usecprow) { 14487b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14493447b6efSHong Zhang } else { 145017ab2063SBarry Smith alpha = x[i]; 14513447b6efSHong Zhang } 145204fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 145317ab2063SBarry Smith } 14545c897100SBarry Smith #endif 14559566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 14569566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 14579566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 14589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14593a40ed3dSBarry Smith PetscFunctionReturn(0); 146017ab2063SBarry Smith } 146117ab2063SBarry Smith 1462dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 14635c897100SBarry Smith { 14645c897100SBarry Smith PetscFunctionBegin; 14659566063dSJacob Faibussowitsch PetscCall(VecSet(yy,0.0)); 14669566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy)); 14675c897100SBarry Smith PetscFunctionReturn(0); 14685c897100SBarry Smith } 14695c897100SBarry Smith 1470c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 147178b84d54SShri Abhyankar 1472dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 147317ab2063SBarry Smith { 1474416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1475d9fead3dSBarry Smith PetscScalar *y; 147654f21887SBarry Smith const PetscScalar *x; 1477fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1478003131ecSBarry Smith PetscInt m=A->rmap->n; 14790298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 14807b083b7cSBarry Smith PetscInt n,i; 1481362ced78SSatish Balay PetscScalar sum; 1482ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 148317ab2063SBarry Smith 1484b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 148597952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1486fee21e36SBarry Smith #endif 1487fee21e36SBarry Smith 14883a40ed3dSBarry Smith PetscFunctionBegin; 1489b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14909566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A,xx,yy)); 1491b215bc84SStefano Zampini PetscFunctionReturn(0); 1492b215bc84SStefano Zampini } 14939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 14949566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14959566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1496416022c9SBarry Smith ii = a->i; 14974eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14989566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y,m)); 149997952fefSHong Zhang m = a->compressedrow.nrows; 150097952fefSHong Zhang ii = a->compressedrow.i; 150197952fefSHong Zhang ridx = a->compressedrow.rindex; 150297952fefSHong Zhang for (i=0; i<m; i++) { 150397952fefSHong Zhang n = ii[i+1] - ii[i]; 150497952fefSHong Zhang aj = a->j + ii[i]; 1505fff043a9SJunchao Zhang aa = a_a + ii[i]; 150697952fefSHong Zhang sum = 0.0; 1507003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1508003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150997952fefSHong Zhang y[*ridx++] = sum; 151097952fefSHong Zhang } 151197952fefSHong Zhang } else { /* do not use compressed row format */ 1512b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15133d3eaba7SBarry Smith aj = a->j; 1514fff043a9SJunchao Zhang aa = a_a; 1515b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1516b05257ddSBarry Smith #else 151717ab2063SBarry Smith for (i=0; i<m; i++) { 1518003131ecSBarry Smith n = ii[i+1] - ii[i]; 1519003131ecSBarry Smith aj = a->j + ii[i]; 1520fff043a9SJunchao Zhang aa = a_a + ii[i]; 152117ab2063SBarry Smith sum = 0.0; 1522003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 152317ab2063SBarry Smith y[i] = sum; 152417ab2063SBarry Smith } 15258d195f9aSBarry Smith #endif 1526b05257ddSBarry Smith } 15279566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - a->nonzerorowcnt)); 15289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15299566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 15313a40ed3dSBarry Smith PetscFunctionReturn(0); 153217ab2063SBarry Smith } 153317ab2063SBarry Smith 1534b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1535b434eb95SMatthew G. Knepley { 1536b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1537b434eb95SMatthew G. Knepley PetscScalar *y; 1538b434eb95SMatthew G. Knepley const PetscScalar *x; 1539fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1540b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1541b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1542b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1543b434eb95SMatthew G. Knepley PetscScalar sum; 1544b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1545b434eb95SMatthew G. Knepley 1546b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1547b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1548b434eb95SMatthew G. Knepley #endif 1549b434eb95SMatthew G. Knepley 1550b434eb95SMatthew G. Knepley PetscFunctionBegin; 15519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15529566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15539566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1554b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1555b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1556b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1557b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1558b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1559b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1560b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1561fff043a9SJunchao Zhang aa = a_a + ii[i]; 1562b434eb95SMatthew G. Knepley sum = 0.0; 1563b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1564b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1565b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1566b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1567b434eb95SMatthew G. Knepley } 1568b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15693d3eaba7SBarry Smith ii = a->i; 1570b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1571b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1572b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1573fff043a9SJunchao Zhang aa = a_a + ii[i]; 1574b434eb95SMatthew G. Knepley sum = 0.0; 1575b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1576b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1577b434eb95SMatthew G. Knepley y[i] = sum; 1578b434eb95SMatthew G. Knepley } 1579b434eb95SMatthew G. Knepley } 15809566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - nonzerorow)); 15819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15829566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1584b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1585b434eb95SMatthew G. Knepley } 1586b434eb95SMatthew G. Knepley 1587b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1588b434eb95SMatthew G. Knepley { 1589b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1590b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1591b434eb95SMatthew G. Knepley const PetscScalar *x; 1592fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1593b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1594b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1595b434eb95SMatthew G. Knepley PetscScalar sum; 1596b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1597b434eb95SMatthew G. Knepley 1598b434eb95SMatthew G. Knepley PetscFunctionBegin; 15999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16009566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16019566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 1602b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1603b434eb95SMatthew G. Knepley if (zz != yy) { 16049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 1605b434eb95SMatthew G. Knepley } 1606b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1607b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1608b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1609b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1610b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1611b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1612fff043a9SJunchao Zhang aa = a_a + ii[i]; 1613b434eb95SMatthew G. Knepley sum = y[*ridx]; 1614b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1615b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1616b434eb95SMatthew G. Knepley } 1617b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16183d3eaba7SBarry Smith ii = a->i; 1619b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1620b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1621b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1622fff043a9SJunchao Zhang aa = a_a + ii[i]; 1623b434eb95SMatthew G. Knepley sum = y[i]; 1624b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1625b434eb95SMatthew G. Knepley z[i] = sum; 1626b434eb95SMatthew G. Knepley } 1627b434eb95SMatthew G. Knepley } 16289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16299566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16309566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1632b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1633b434eb95SMatthew G. Knepley } 1634b434eb95SMatthew G. Knepley 1635c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1636dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 163717ab2063SBarry Smith { 1638416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1639f15663dcSBarry Smith PetscScalar *y,*z; 1640f15663dcSBarry Smith const PetscScalar *x; 1641fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1642d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1643d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1644362ced78SSatish Balay PetscScalar sum; 1645ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 16469ea0dfa2SSatish Balay 16473a40ed3dSBarry Smith PetscFunctionBegin; 1648b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16499566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A,xx,yy,zz)); 1650b215bc84SStefano Zampini PetscFunctionReturn(0); 1651b215bc84SStefano Zampini } 16529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16539566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16549566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 16554eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 16564eb6d288SHong Zhang if (zz != yy) { 16579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 16584eb6d288SHong Zhang } 165997952fefSHong Zhang m = a->compressedrow.nrows; 166097952fefSHong Zhang ii = a->compressedrow.i; 166197952fefSHong Zhang ridx = a->compressedrow.rindex; 166297952fefSHong Zhang for (i=0; i<m; i++) { 166397952fefSHong Zhang n = ii[i+1] - ii[i]; 166497952fefSHong Zhang aj = a->j + ii[i]; 1665fff043a9SJunchao Zhang aa = a_a + ii[i]; 166697952fefSHong Zhang sum = y[*ridx]; 1667f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 166897952fefSHong Zhang z[*ridx++] = sum; 166997952fefSHong Zhang } 167097952fefSHong Zhang } else { /* do not use compressed row format */ 16713d3eaba7SBarry Smith ii = a->i; 1672f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16733d3eaba7SBarry Smith aj = a->j; 1674fff043a9SJunchao Zhang aa = a_a; 1675f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1676f15663dcSBarry Smith #else 167717ab2063SBarry Smith for (i=0; i<m; i++) { 1678f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1679f15663dcSBarry Smith aj = a->j + ii[i]; 1680fff043a9SJunchao Zhang aa = a_a + ii[i]; 168117ab2063SBarry Smith sum = y[i]; 1682f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 168317ab2063SBarry Smith z[i] = sum; 168417ab2063SBarry Smith } 168502ab625aSSatish Balay #endif 1686f15663dcSBarry Smith } 16879566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16889566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 16913a40ed3dSBarry Smith PetscFunctionReturn(0); 169217ab2063SBarry Smith } 169317ab2063SBarry Smith 169417ab2063SBarry Smith /* 169517ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 169617ab2063SBarry Smith */ 1697dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 169817ab2063SBarry Smith { 1699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1700d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 1701c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 170217ab2063SBarry Smith 17033a40ed3dSBarry Smith PetscFunctionBegin; 170409f38230SBarry Smith if (!a->diag) { 17059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&a->diag)); 17069566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt))); 1707c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 170809f38230SBarry Smith } 1709d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1710c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1711c0c07093SJunchao Zhang if (alreadySet) { 1712c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1713c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i+1] && a->j[pos] == i) continue; 1714c0c07093SJunchao Zhang } 1715c0c07093SJunchao Zhang 171609f38230SBarry Smith a->diag[i] = a->i[i+1]; 1717bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1718bfeeae90SHong Zhang if (a->j[j] == i) { 171909f38230SBarry Smith a->diag[i] = j; 172017ab2063SBarry Smith break; 172117ab2063SBarry Smith } 172217ab2063SBarry Smith } 172317ab2063SBarry Smith } 17243a40ed3dSBarry Smith PetscFunctionReturn(0); 172517ab2063SBarry Smith } 172617ab2063SBarry Smith 172761ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 172861ecd0c6SBarry Smith { 172961ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 173061ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 173161ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 173261ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 173361ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 173461ecd0c6SBarry Smith 173561ecd0c6SBarry Smith PetscFunctionBegin; 173661ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A,1,NULL)); 17389566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 173961ecd0c6SBarry Smith PetscFunctionReturn(0); 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith 174261ecd0c6SBarry Smith if (a->diagonaldense) { 174361ecd0c6SBarry Smith cnt = 0; 174461ecd0c6SBarry Smith } else { 17459566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&mdiag)); 174661ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 1747349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i+1]) { /* 'out of range' rows never have diagonals */ 174861ecd0c6SBarry Smith cnt++; 174961ecd0c6SBarry Smith mdiag[i] = 1; 175061ecd0c6SBarry Smith } 175161ecd0c6SBarry Smith } 175261ecd0c6SBarry Smith } 175361ecd0c6SBarry Smith if (!cnt) { 17549566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 175561ecd0c6SBarry Smith } else { 1756b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1757b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 175861ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 175961ecd0c6SBarry Smith 176061ecd0c6SBarry Smith a->a = NULL; 176161ecd0c6SBarry Smith a->j = NULL; 176261ecd0c6SBarry Smith a->i = NULL; 176361ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1764349d3b71SJunchao Zhang for (i=0; i<PetscMin(A->rmap->n,A->cmap->n); i++) { 176561ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 176661ecd0c6SBarry Smith } 17679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax)); 176861ecd0c6SBarry Smith 176961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 177061ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 17719566063dSJacob Faibussowitsch PetscCall(MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES)); 1772447d62f5SStefano Zampini if (i < A->cmap->n) { 17739566063dSJacob Faibussowitsch PetscCall(MatSetValue(A,i,i,v,ADD_VALUES)); 177461ecd0c6SBarry Smith } 1775447d62f5SStefano Zampini } 17769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY)); 17779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY)); 177861ecd0c6SBarry Smith if (singlemalloc) { 17799566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda,oldj,oldi)); 178061ecd0c6SBarry Smith } else { 17819566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17829566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17839566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 178461ecd0c6SBarry Smith } 178561ecd0c6SBarry Smith } 17869566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 178761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 178861ecd0c6SBarry Smith PetscFunctionReturn(0); 178961ecd0c6SBarry Smith } 179061ecd0c6SBarry Smith 1791be5855fcSBarry Smith /* 1792be5855fcSBarry Smith Checks for missing diagonals 1793be5855fcSBarry Smith */ 1794ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1795be5855fcSBarry Smith { 1796be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17977734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1798be5855fcSBarry Smith 1799be5855fcSBarry Smith PetscFunctionBegin; 180009f38230SBarry Smith *missing = PETSC_FALSE; 18017734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 180209f38230SBarry Smith *missing = PETSC_TRUE; 180309f38230SBarry Smith if (d) *d = 0; 18049566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n")); 180509f38230SBarry Smith } else { 180601445905SHong Zhang PetscInt n; 180701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1808f1e2ffcdSBarry Smith diag = a->diag; 180901445905SHong Zhang for (i=0; i<n; i++) { 18107734d3b5SMatthew G. Knepley if (diag[i] >= ii[i+1]) { 181109f38230SBarry Smith *missing = PETSC_TRUE; 181209f38230SBarry Smith if (d) *d = i; 18139566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix is missing diagonal number %" PetscInt_FMT "\n",i)); 1814358d2f5dSShri Abhyankar break; 181509f38230SBarry Smith } 1816be5855fcSBarry Smith } 1817be5855fcSBarry Smith } 1818be5855fcSBarry Smith PetscFunctionReturn(0); 1819be5855fcSBarry Smith } 1820be5855fcSBarry Smith 18210da83c2eSBarry Smith #include <petscblaslapack.h> 18220da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith /* 18250da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18260da83c2eSBarry Smith */ 18270da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 18280da83c2eSBarry Smith { 18290da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 18300da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 18310da83c2eSBarry Smith const PetscReal shift = 0.0; 18320da83c2eSBarry Smith PetscInt ipvt[5]; 18330da83c2eSBarry Smith PetscScalar work[25],*v_work; 18340da83c2eSBarry Smith 18350da83c2eSBarry Smith PetscFunctionBegin; 18360da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18370da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 183808401ef6SPierre Jolivet PetscCheck(ncnt == n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT,ncnt,n); 18390da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18400da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 18410da83c2eSBarry Smith } 18429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax,&indx)); 18430da83c2eSBarry Smith if (bsizemax > 7) { 18449566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots)); 18450da83c2eSBarry Smith } 18460da83c2eSBarry Smith ncnt = 0; 18470da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18480da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 18499566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag)); 18500da83c2eSBarry Smith switch (bsizes[i]) { 18510da83c2eSBarry Smith case 1: 18520da83c2eSBarry Smith *diag = 1.0/(*diag); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 2: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 3: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 4: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith case 5: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18730da83c2eSBarry Smith break; 18740da83c2eSBarry Smith case 6: 18759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 18760da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18779566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18780da83c2eSBarry Smith break; 18790da83c2eSBarry Smith case 7: 18809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 18810da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18830da83c2eSBarry Smith break; 18840da83c2eSBarry Smith default: 18859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 18860da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bsizes[i])); 18880da83c2eSBarry Smith } 18890da83c2eSBarry Smith ncnt += bsizes[i]; 18900da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 18910da83c2eSBarry Smith } 18920da83c2eSBarry Smith if (bsizemax > 7) { 18939566063dSJacob Faibussowitsch PetscCall(PetscFree2(v_work,v_pivots)); 18940da83c2eSBarry Smith } 18959566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18960da83c2eSBarry Smith PetscFunctionReturn(0); 18970da83c2eSBarry Smith } 18980da83c2eSBarry Smith 1899422a814eSBarry Smith /* 1900422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1901422a814eSBarry Smith */ 19027087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 190371f1c65dSBarry Smith { 190471f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 1905d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 19062e5835c6SStefano Zampini const MatScalar *v; 190754f21887SBarry Smith PetscScalar *idiag,*mdiag; 190871f1c65dSBarry Smith 190971f1c65dSBarry Smith PetscFunctionBegin; 191071f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 19119566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 191271f1c65dSBarry Smith diag = a->diag; 191371f1c65dSBarry Smith if (!a->idiag) { 19149566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work)); 19159566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,3*m*sizeof(PetscScalar))); 191671f1c65dSBarry Smith } 19172e5835c6SStefano Zampini 191871f1c65dSBarry Smith mdiag = a->mdiag; 191971f1c65dSBarry Smith idiag = a->idiag; 19209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 1921422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 192271f1c65dSBarry Smith for (i=0; i<m; i++) { 192371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1924899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1925899639b0SHong Zhang if (PetscRealPart(fshift)) { 19269566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero diagonal on row %" PetscInt_FMT "\n",i)); 19277b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19287b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19297b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 193098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %" PetscInt_FMT,i); 1931899639b0SHong Zhang } 193271f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 193371f1c65dSBarry Smith } 19349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 193571f1c65dSBarry Smith } else { 193671f1c65dSBarry Smith for (i=0; i<m; i++) { 193771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 193871f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 193971f1c65dSBarry Smith } 19409566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*m)); 194171f1c65dSBarry Smith } 194271f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 194471f1c65dSBarry Smith PetscFunctionReturn(0); 194571f1c65dSBarry Smith } 194671f1c65dSBarry Smith 1947c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 194841f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 194917ab2063SBarry Smith { 1950416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1951e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 19522e5835c6SStefano Zampini const MatScalar *v,*idiag=NULL,*mdiag,*aa; 195354f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 19543d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 195597f1f81fSBarry Smith const PetscInt *idx,*diag; 195617ab2063SBarry Smith 19573a40ed3dSBarry Smith PetscFunctionBegin; 1958b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19599566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A,bb,omega,flag,fshift,its,lits,xx)); 1960b215bc84SStefano Zampini PetscFunctionReturn(0); 1961b215bc84SStefano Zampini } 1962b965ef7fSBarry Smith its = its*lits; 196391723122SBarry Smith 196471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19659566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A,omega,fshift)); 196671f1c65dSBarry Smith a->fshift = fshift; 196771f1c65dSBarry Smith a->omega = omega; 1968ed480e8bSBarry Smith 196971f1c65dSBarry Smith diag = a->diag; 197071f1c65dSBarry Smith t = a->ssor_work; 1971ed480e8bSBarry Smith idiag = a->idiag; 197271f1c65dSBarry Smith mdiag = a->mdiag; 1973ed480e8bSBarry Smith 19749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 19759566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx,&x)); 19769566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb,&b)); 1977ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 197817ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 197917ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1980ed480e8bSBarry Smith bs = b; 198117ab2063SBarry Smith for (i=0; i<m; i++) { 198271f1c65dSBarry Smith d = fshift + mdiag[i]; 1983416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1984ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19852e5835c6SStefano Zampini v = aa + diag[i] + 1; 198617ab2063SBarry Smith sum = b[i]*d/omega; 1987003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 198817ab2063SBarry Smith x[i] = sum; 198917ab2063SBarry Smith } 19909566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 19919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 19929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 19939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19943a40ed3dSBarry Smith PetscFunctionReturn(0); 199517ab2063SBarry Smith } 1996c783ea89SBarry Smith 199708401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER,PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 19982205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 19994c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 2000887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 200117ab2063SBarry Smith 200217ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 200317ab2063SBarry Smith 2004887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 200517ab2063SBarry Smith */ 200617ab2063SBarry Smith scale = (2.0/omega) - 1.0; 200717ab2063SBarry Smith 200817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 200917ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2010416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2011ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20122e5835c6SStefano Zampini v = aa + diag[i] + 1; 201317ab2063SBarry Smith sum = b[i]; 2014e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2015ed480e8bSBarry Smith x[i] = sum*idiag[i]; 201617ab2063SBarry Smith } 201717ab2063SBarry Smith 201817ab2063SBarry Smith /* t = b - (2*E - D)x */ 20192e5835c6SStefano Zampini v = aa; 20202205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 202117ab2063SBarry Smith 202217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2023ed480e8bSBarry Smith ts = t; 2024416022c9SBarry Smith diag = a->diag; 202517ab2063SBarry Smith for (i=0; i<m; i++) { 2026416022c9SBarry Smith n = diag[i] - a->i[i]; 2027ed480e8bSBarry Smith idx = a->j + a->i[i]; 20282e5835c6SStefano Zampini v = aa + a->i[i]; 202917ab2063SBarry Smith sum = t[i]; 2030003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 2031ed480e8bSBarry Smith t[i] = sum*idiag[i]; 2032733d66baSBarry Smith /* x = x + t */ 2033733d66baSBarry Smith x[i] += t[i]; 203417ab2063SBarry Smith } 203517ab2063SBarry Smith 20369566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0*m-1 + 2.0*a->nz)); 20379566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 20389566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 20393a40ed3dSBarry Smith PetscFunctionReturn(0); 204017ab2063SBarry Smith } 204117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 204217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204317ab2063SBarry Smith for (i=0; i<m; i++) { 2044416022c9SBarry Smith n = diag[i] - a->i[i]; 2045ed480e8bSBarry Smith idx = a->j + a->i[i]; 20462e5835c6SStefano Zampini v = aa + a->i[i]; 204717ab2063SBarry Smith sum = b[i]; 2048e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20495c99c7daSBarry Smith t[i] = sum; 2050ed480e8bSBarry Smith x[i] = sum*idiag[i]; 205117ab2063SBarry Smith } 20525c99c7daSBarry Smith xb = t; 20539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20543a40ed3dSBarry Smith } else xb = b; 205517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205617ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2057416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2058ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20592e5835c6SStefano Zampini v = aa + diag[i] + 1; 206017ab2063SBarry Smith sum = xb[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20625c99c7daSBarry Smith if (xb == b) { 2063ed480e8bSBarry Smith x[i] = sum*idiag[i]; 20645c99c7daSBarry Smith } else { 2065b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 206617ab2063SBarry Smith } 20675c99c7daSBarry Smith } 20689566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 206917ab2063SBarry Smith } 207017ab2063SBarry Smith its--; 207117ab2063SBarry Smith } 207217ab2063SBarry Smith while (its--) { 207317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 207417ab2063SBarry Smith for (i=0; i<m; i++) { 2075b19a5dc2SMark Adams /* lower */ 2076b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2077ed480e8bSBarry Smith idx = a->j + a->i[i]; 20782e5835c6SStefano Zampini v = aa + a->i[i]; 207917ab2063SBarry Smith sum = b[i]; 2080e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2081b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2082b19a5dc2SMark Adams /* upper */ 2083b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2084b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20852e5835c6SStefano Zampini v = aa + diag[i] + 1; 2086b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2087b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 208817ab2063SBarry Smith } 2089b19a5dc2SMark Adams xb = t; 20909566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2091b19a5dc2SMark Adams } else xb = b; 209217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 209317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2094b19a5dc2SMark Adams sum = xb[i]; 2095b19a5dc2SMark Adams if (xb == b) { 2096b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2097416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 2098ed480e8bSBarry Smith idx = a->j + a->i[i]; 20992e5835c6SStefano Zampini v = aa + a->i[i]; 2100e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2101ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 2102b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2103b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2104b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 21052e5835c6SStefano Zampini v = aa + diag[i] + 1; 2106b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2107b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 210817ab2063SBarry Smith } 2109b19a5dc2SMark Adams } 2110b19a5dc2SMark Adams if (xb == b) { 21119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2112b19a5dc2SMark Adams } else { 21139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2114b19a5dc2SMark Adams } 211517ab2063SBarry Smith } 211617ab2063SBarry Smith } 21179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 21189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 21199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 2120365a8a9eSBarry Smith PetscFunctionReturn(0); 212117ab2063SBarry Smith } 212217ab2063SBarry Smith 2123dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 212417ab2063SBarry Smith { 2125416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21264e220ebcSLois Curfman McInnes 21273a40ed3dSBarry Smith PetscFunctionBegin; 21284e220ebcSLois Curfman McInnes info->block_size = 1.0; 21293966268fSBarry Smith info->nz_allocated = a->maxnz; 21303966268fSBarry Smith info->nz_used = a->nz; 21313966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21323966268fSBarry Smith info->assemblies = A->num_ass; 21333966268fSBarry Smith info->mallocs = A->info.mallocs; 21347adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2135d5f3da31SBarry Smith if (A->factortype) { 21364e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21374e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21384e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21394e220ebcSLois Curfman McInnes } else { 21404e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21414e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21424e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21434e220ebcSLois Curfman McInnes } 21443a40ed3dSBarry Smith PetscFunctionReturn(0); 214517ab2063SBarry Smith } 214617ab2063SBarry Smith 21472b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 214817ab2063SBarry Smith { 2149416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2150c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 215197b48c8fSBarry Smith const PetscScalar *xx; 21522e5835c6SStefano Zampini PetscScalar *bb,*aa; 2153c7da8527SEric Chamberland PetscInt d = 0; 215417ab2063SBarry Smith 21553a40ed3dSBarry Smith PetscFunctionBegin; 215697b48c8fSBarry Smith if (x && b) { 21579566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 21589566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 215997b48c8fSBarry Smith for (i=0; i<N; i++) { 2160aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2161447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216297b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 216397b48c8fSBarry Smith } 21649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 21659566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 216697b48c8fSBarry Smith } 216797b48c8fSBarry Smith 21689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 2169a9817697SBarry Smith if (a->keepnonzeropattern) { 2170f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2171aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21729566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 2173f1e2ffcdSBarry Smith } 2174f4df32b1SMatthew Knepley if (diag != 0.0) { 2175c7da8527SEric Chamberland for (i=0; i<N; i++) { 2176c7da8527SEric Chamberland d = rows[i]; 2177447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 217808401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d+1],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT,d); 2179c7da8527SEric Chamberland } 2180f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2181447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21822e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2183f1e2ffcdSBarry Smith } 2184f1e2ffcdSBarry Smith } 2185f1e2ffcdSBarry Smith } else { 2186f4df32b1SMatthew Knepley if (diag != 0.0) { 218717ab2063SBarry Smith for (i=0; i<N; i++) { 2188aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21897ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2190447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2191447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2192447d62f5SStefano Zampini } else { 2193416022c9SBarry Smith a->ilen[rows[i]] = 1; 21942e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2195bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2196447d62f5SStefano Zampini } 2197447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21989566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 219917ab2063SBarry Smith } 220017ab2063SBarry Smith } 22013a40ed3dSBarry Smith } else { 220217ab2063SBarry Smith for (i=0; i<N; i++) { 2203aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2204416022c9SBarry Smith a->ilen[rows[i]] = 0; 220517ab2063SBarry Smith } 220617ab2063SBarry Smith } 2207e56f5c9eSBarry Smith A->nonzerostate++; 2208f1e2ffcdSBarry Smith } 22099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 22109566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22113a40ed3dSBarry Smith PetscFunctionReturn(0); 221217ab2063SBarry Smith } 221317ab2063SBarry Smith 22146e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 22156e169961SBarry Smith { 22166e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22176e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 22182b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 22196e169961SBarry Smith const PetscScalar *xx; 22202e5835c6SStefano Zampini PetscScalar *bb,*aa; 22216e169961SBarry Smith 22226e169961SBarry Smith PetscFunctionBegin; 22232e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 22249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 22256e169961SBarry Smith if (x && b) { 22269566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 22279566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 22282b40b63fSBarry Smith vecs = PETSC_TRUE; 22296e169961SBarry Smith } 22309566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&zeroed)); 22316e169961SBarry Smith for (i=0; i<N; i++) { 2232aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 22339566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 22342205254eSKarl Rupp 22356e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22366e169961SBarry Smith } 22376e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 22386e169961SBarry Smith if (!zeroed[i]) { 22396e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 22404cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22412e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j]*xx[a->j[j]]; 22422e5835c6SStefano Zampini aa[j] = 0.0; 22436e169961SBarry Smith } 22446e169961SBarry Smith } 22454cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 22466e169961SBarry Smith } 22476e169961SBarry Smith if (x && b) { 22489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 22499566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 22506e169961SBarry Smith } 22519566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22526e169961SBarry Smith if (diag != 0.0) { 22539566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A,&missing,&d)); 22541d5a398dSstefano_zampini if (missing) { 22551d5a398dSstefano_zampini for (i=0; i<N; i++) { 22564cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2257aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")",d,rows[i]); 22589566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 22591d5a398dSstefano_zampini } 22601d5a398dSstefano_zampini } else { 22616e169961SBarry Smith for (i=0; i<N; i++) { 22622e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 22636e169961SBarry Smith } 22646e169961SBarry Smith } 22651d5a398dSstefano_zampini } 22669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 22679566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22686e169961SBarry Smith PetscFunctionReturn(0); 22696e169961SBarry Smith } 22706e169961SBarry Smith 2271a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 227217ab2063SBarry Smith { 2273fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2274fff043a9SJunchao Zhang const PetscScalar *aa; 2275fff043a9SJunchao Zhang PetscInt *itmp; 227617ab2063SBarry Smith 22773a40ed3dSBarry Smith PetscFunctionBegin; 22789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 2279416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 22802e5835c6SStefano Zampini if (v) *v = (PetscScalar*)(aa + a->i[row]); 228117ab2063SBarry Smith if (idx) { 2282bfeeae90SHong Zhang itmp = a->j + a->i[row]; 228326fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2284f4259b30SLisandro Dalcin else *idx = NULL; 228517ab2063SBarry Smith } 22869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 22873a40ed3dSBarry Smith PetscFunctionReturn(0); 228817ab2063SBarry Smith } 228917ab2063SBarry Smith 2290a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 229117ab2063SBarry Smith { 22923a40ed3dSBarry Smith PetscFunctionBegin; 2293cb4a9cd9SHong Zhang if (nz) *nz = 0; 22942e5835c6SStefano Zampini if (idx) *idx = NULL; 22952e5835c6SStefano Zampini if (v) *v = NULL; 22963a40ed3dSBarry Smith PetscFunctionReturn(0); 229717ab2063SBarry Smith } 229817ab2063SBarry Smith 2299dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 230017ab2063SBarry Smith { 2301416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23022e5835c6SStefano Zampini const MatScalar *v; 230336db0b34SBarry Smith PetscReal sum = 0.0; 230497f1f81fSBarry Smith PetscInt i,j; 230517ab2063SBarry Smith 23063a40ed3dSBarry Smith PetscFunctionBegin; 23079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 230817ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2309570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2310570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 231173cf7048SBarry Smith PetscStackCallBLAS("BLASnrm2",*nrm = BLASnrm2_(&nz,v,&one)); 2312570b7f6dSBarry Smith #else 2313416022c9SBarry Smith for (i=0; i<a->nz; i++) { 231436db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 231517ab2063SBarry Smith } 23168f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2317570b7f6dSBarry Smith #endif 23189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 23193a40ed3dSBarry Smith } else if (type == NORM_1) { 232036db0b34SBarry Smith PetscReal *tmp; 232197f1f81fSBarry Smith PetscInt *jj = a->j; 23229566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n+1,&tmp)); 2323064f8208SBarry Smith *nrm = 0.0; 2324416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2325bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 232617ab2063SBarry Smith } 2327d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2328064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 232917ab2063SBarry Smith } 23309566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23319566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 23323a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2333064f8208SBarry Smith *nrm = 0.0; 2334d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 23352e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 233617ab2063SBarry Smith sum = 0.0; 2337416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 23382e5835c6SStefano Zampini sum += PetscAbsScalar(*v2); v2++; 233917ab2063SBarry Smith } 2340064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 234117ab2063SBarry Smith } 23429566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 2343f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 23449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 23453a40ed3dSBarry Smith PetscFunctionReturn(0); 234617ab2063SBarry Smith } 234717ab2063SBarry Smith 23484e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? */ 23494e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 23504e938277SHong Zhang { 23514e938277SHong Zhang PetscInt i,j,anzj; 23524e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 23534e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 23544e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 23554e938277SHong Zhang 23564e938277SHong Zhang PetscFunctionBegin; 23574e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 23589566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(an+1,&ati)); 23599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ai[am],&atj)); 23609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(an,&atfill)); 23614e938277SHong Zhang 23624e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 23634e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 236426fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 23654e938277SHong Zhang /* Form ati for csr format of A^T. */ 236626fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 23674e938277SHong Zhang 23684e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 23699566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(atfill,ati,an)); 23704e938277SHong Zhang 23714e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 23724e938277SHong Zhang for (i=0;i<am;i++) { 23734e938277SHong Zhang anzj = ai[i+1] - ai[i]; 23744e938277SHong Zhang for (j=0;j<anzj;j++) { 23754e938277SHong Zhang atj[atfill[*aj]] = i; 23764e938277SHong Zhang atfill[*aj++] += 1; 23774e938277SHong Zhang } 23784e938277SHong Zhang } 23794e938277SHong Zhang 23804e938277SHong Zhang /* Clean up temporary space and complete requests. */ 23819566063dSJacob Faibussowitsch PetscCall(PetscFree(atfill)); 23829566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B)); 23839566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs))); 23849566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 2385a2f3521dSMark F. Adams 23864e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 23874e938277SHong Zhang b->free_a = PETSC_FALSE; 23884e938277SHong Zhang b->free_ij = PETSC_TRUE; 23894e938277SHong Zhang b->nonew = 0; 23904e938277SHong Zhang PetscFunctionReturn(0); 23914e938277SHong Zhang } 23924e938277SHong Zhang 23937087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2394cd0d46ebSvictorle { 23953d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 239654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 23972e5835c6SStefano Zampini const MatScalar *va,*vb; 239897f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2399cd0d46ebSvictorle 2400cd0d46ebSvictorle PetscFunctionBegin; 24019566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24029566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24035485867bSBarry Smith if (ma!=nb || na!=mb) { 24045485867bSBarry Smith *f = PETSC_FALSE; 24055485867bSBarry Smith PetscFunctionReturn(0); 24065485867bSBarry Smith } 24079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&va)); 24089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&vb)); 2409cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2410cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 24119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 2413cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2414cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2415cd0d46ebSvictorle 2416cd0d46ebSvictorle *f = PETSC_TRUE; 2417cd0d46ebSvictorle for (i=0; i<ma; i++) { 2418cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 241997f1f81fSBarry Smith PetscInt idc,idr; 24205485867bSBarry Smith PetscScalar vc,vr; 2421cd0d46ebSvictorle /* column/row index/value */ 24225485867bSBarry Smith idc = adx[aptr[i]]; 24235485867bSBarry Smith idr = bdx[bptr[idc]]; 24245485867bSBarry Smith vc = va[aptr[i]]; 24255485867bSBarry Smith vr = vb[bptr[idc]]; 24265485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 24275485867bSBarry Smith *f = PETSC_FALSE; 24285485867bSBarry Smith goto done; 2429cd0d46ebSvictorle } else { 24305485867bSBarry Smith aptr[i]++; 24315485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2432cd0d46ebSvictorle } 2433cd0d46ebSvictorle } 2434cd0d46ebSvictorle } 2435cd0d46ebSvictorle done: 24369566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24379566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&va)); 24399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&vb)); 2440cd0d46ebSvictorle PetscFunctionReturn(0); 2441cd0d46ebSvictorle } 2442cd0d46ebSvictorle 24437087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 24441cbb95d3SBarry Smith { 24453d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 244654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 244754f21887SBarry Smith MatScalar *va,*vb; 24481cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 24491cbb95d3SBarry Smith 24501cbb95d3SBarry Smith PetscFunctionBegin; 24519566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24529566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24531cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 24541cbb95d3SBarry Smith *f = PETSC_FALSE; 24551cbb95d3SBarry Smith PetscFunctionReturn(0); 24561cbb95d3SBarry Smith } 24571cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 24581cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 24591cbb95d3SBarry Smith va = aij->a; vb = bij->a; 24609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 24621cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 24631cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 24641cbb95d3SBarry Smith 24651cbb95d3SBarry Smith *f = PETSC_TRUE; 24661cbb95d3SBarry Smith for (i=0; i<ma; i++) { 24671cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 24681cbb95d3SBarry Smith PetscInt idc,idr; 24691cbb95d3SBarry Smith PetscScalar vc,vr; 24701cbb95d3SBarry Smith /* column/row index/value */ 24711cbb95d3SBarry Smith idc = adx[aptr[i]]; 24721cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24731cbb95d3SBarry Smith vc = va[aptr[i]]; 24741cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24751cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 24761cbb95d3SBarry Smith *f = PETSC_FALSE; 24771cbb95d3SBarry Smith goto done; 24781cbb95d3SBarry Smith } else { 24791cbb95d3SBarry Smith aptr[i]++; 24801cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 24811cbb95d3SBarry Smith } 24821cbb95d3SBarry Smith } 24831cbb95d3SBarry Smith } 24841cbb95d3SBarry Smith done: 24859566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24869566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24871cbb95d3SBarry Smith PetscFunctionReturn(0); 24881cbb95d3SBarry Smith } 24891cbb95d3SBarry Smith 2490ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24919e29f15eSvictorle { 24929e29f15eSvictorle PetscFunctionBegin; 24939566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A,A,tol,f)); 24949e29f15eSvictorle PetscFunctionReturn(0); 24959e29f15eSvictorle } 24969e29f15eSvictorle 2497ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24981cbb95d3SBarry Smith { 24991cbb95d3SBarry Smith PetscFunctionBegin; 25009566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A,A,tol,f)); 25011cbb95d3SBarry Smith PetscFunctionReturn(0); 25021cbb95d3SBarry Smith } 25031cbb95d3SBarry Smith 2504dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 250517ab2063SBarry Smith { 2506416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2507fff8e43fSBarry Smith const PetscScalar *l,*r; 2508fff8e43fSBarry Smith PetscScalar x; 250954f21887SBarry Smith MatScalar *v; 2510fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2511fff8e43fSBarry Smith const PetscInt *jj; 251217ab2063SBarry Smith 25133a40ed3dSBarry Smith PetscFunctionBegin; 251417ab2063SBarry Smith if (ll) { 25153ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 25163ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 25179566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll,&m)); 251808401ef6SPierre Jolivet PetscCheck(m == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 25199566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll,&l)); 25209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 252117ab2063SBarry Smith for (i=0; i<m; i++) { 252217ab2063SBarry Smith x = l[i]; 2523416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 25242205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 252517ab2063SBarry Smith } 25269566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll,&l)); 25279566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 25289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 252917ab2063SBarry Smith } 253017ab2063SBarry Smith if (rr) { 25319566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr,&n)); 253208401ef6SPierre Jolivet PetscCheck(n == A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 25339566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr,&r)); 25349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 25352e5835c6SStefano Zampini jj = a->j; 25362205254eSKarl Rupp for (i=0; i<nz; i++) (*v++) *= r[*jj++]; 25379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 25389566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr,&r)); 25399566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 254017ab2063SBarry Smith } 25419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 25423a40ed3dSBarry Smith PetscFunctionReturn(0); 254317ab2063SBarry Smith } 254417ab2063SBarry Smith 25457dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 254617ab2063SBarry Smith { 2547db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 2548d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 254997f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 25505d0c19d7SBarry Smith const PetscInt *irow,*icol; 25512e5835c6SStefano Zampini const PetscScalar *aa; 25525d0c19d7SBarry Smith PetscInt nrows,ncols; 255397f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 255454f21887SBarry Smith MatScalar *a_new,*mat_a; 2555416022c9SBarry Smith Mat C; 2556cdc6f3adSToby Isaac PetscBool stride; 255717ab2063SBarry Smith 25583a40ed3dSBarry Smith PetscFunctionBegin; 25599566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow,&irow)); 25609566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow,&nrows)); 25619566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol,&ncols)); 256217ab2063SBarry Smith 25639566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride)); 2564ff718158SBarry Smith if (stride) { 25659566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol,&first,&step)); 2566ff718158SBarry Smith } else { 2567ff718158SBarry Smith first = 0; 2568ff718158SBarry Smith step = 0; 2569ff718158SBarry Smith } 2570fee21e36SBarry Smith if (stride && step == 1) { 257102834360SBarry Smith /* special case of contiguous rows */ 25729566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows,&lens,nrows,&starts)); 257302834360SBarry Smith /* loop over new rows determining lens and starting points */ 257402834360SBarry Smith for (i=0; i<nrows; i++) { 2575bfeeae90SHong Zhang kstart = ai[irow[i]]; 2576a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2577a91a9bebSLisandro Dalcin starts[i] = kstart; 257802834360SBarry Smith for (k=kstart; k<kend; k++) { 2579bfeeae90SHong Zhang if (aj[k] >= first) { 258002834360SBarry Smith starts[i] = k; 258102834360SBarry Smith break; 258202834360SBarry Smith } 258302834360SBarry Smith } 2584a2744918SBarry Smith sum = 0; 258502834360SBarry Smith while (k < kend) { 2586bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2587a2744918SBarry Smith sum++; 258802834360SBarry Smith } 2589a2744918SBarry Smith lens[i] = sum; 259002834360SBarry Smith } 259102834360SBarry Smith /* create submatrix */ 2592cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 259397f1f81fSBarry Smith PetscInt n_cols,n_rows; 25949566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B,&n_rows,&n_cols)); 2595aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 25969566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 259708480c60SBarry Smith C = *B; 25983a40ed3dSBarry Smith } else { 25993bef6203SJed Brown PetscInt rbs,cbs; 26009566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26029566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26039566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26049566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26059566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 260708480c60SBarry Smith } 2608db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2609db02288aSLois Curfman McInnes 261002834360SBarry Smith /* loop over rows inserting into submatrix */ 2611db02288aSLois Curfman McInnes a_new = c->a; 2612db02288aSLois Curfman McInnes j_new = c->j; 2613db02288aSLois Curfman McInnes i_new = c->i; 26149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 261502834360SBarry Smith for (i=0; i<nrows; i++) { 2616a2744918SBarry Smith ii = starts[i]; 2617a2744918SBarry Smith lensi = lens[i]; 2618a2744918SBarry Smith for (k=0; k<lensi; k++) { 2619a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 262002834360SBarry Smith } 26219566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new,aa + starts[i],lensi)); 2622a2744918SBarry Smith a_new += lensi; 2623a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2624a2744918SBarry Smith c->ilen[i] = lensi; 262502834360SBarry Smith } 26269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 26279566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens,starts)); 26283a40ed3dSBarry Smith } else { 26299566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol,&icol)); 26309566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols,&smap)); 26319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1+nrows,&lens)); 26324dcab191SBarry Smith for (i=0; i<ncols; i++) { 26336bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT,i,icol[i],oldcols); 26344dcab191SBarry Smith smap[icol[i]] = i+1; 26354dcab191SBarry Smith } 26364dcab191SBarry Smith 263702834360SBarry Smith /* determine lens of each row */ 263802834360SBarry Smith for (i=0; i<nrows; i++) { 2639bfeeae90SHong Zhang kstart = ai[irow[i]]; 264002834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 264102834360SBarry Smith lens[i] = 0; 264202834360SBarry Smith for (k=kstart; k<kend; k++) { 2643bfeeae90SHong Zhang if (smap[aj[k]]) { 264402834360SBarry Smith lens[i]++; 264502834360SBarry Smith } 264602834360SBarry Smith } 264702834360SBarry Smith } 264817ab2063SBarry Smith /* Create and fill new matrix */ 2649a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2650ace3abfcSBarry Smith PetscBool equal; 26510f5bd95cSBarry Smith 265299141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2653aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 26549566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal)); 265528b400f6SJacob Faibussowitsch PetscCheck(equal,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 26569566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen,(*B)->rmap->n)); 265708480c60SBarry Smith C = *B; 26583a40ed3dSBarry Smith } else { 26593bef6203SJed Brown PetscInt rbs,cbs; 26609566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26619566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26629566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26639566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26649566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26659566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 266708480c60SBarry Smith } 26689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 266999141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 267017ab2063SBarry Smith for (i=0; i<nrows; i++) { 267199141d43SSatish Balay row = irow[i]; 2672bfeeae90SHong Zhang kstart = ai[row]; 267399141d43SSatish Balay kend = kstart + a->ilen[row]; 2674bfeeae90SHong Zhang mat_i = c->i[i]; 267599141d43SSatish Balay mat_j = c->j + mat_i; 267699141d43SSatish Balay mat_a = c->a + mat_i; 267799141d43SSatish Balay mat_ilen = c->ilen + i; 267817ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2679bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2680ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26812e5835c6SStefano Zampini *mat_a++ = aa[k]; 268299141d43SSatish Balay (*mat_ilen)++; 268399141d43SSatish Balay 268417ab2063SBarry Smith } 268517ab2063SBarry Smith } 268617ab2063SBarry Smith } 26879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 268802834360SBarry Smith /* Free work space */ 26899566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol,&icol)); 26909566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26919566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2692cdc6f3adSToby Isaac /* sort */ 2693cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2694cdc6f3adSToby Isaac PetscInt ilen; 2695cdc6f3adSToby Isaac 2696cdc6f3adSToby Isaac mat_i = c->i[i]; 2697cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2698cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2699cdc6f3adSToby Isaac ilen = c->ilen[i]; 27009566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen,mat_j,mat_a)); 2701cdc6f3adSToby Isaac } 270202834360SBarry Smith } 27038c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 27049566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C,A->boundtocpu)); 2705305c6ccfSStefano Zampini #endif 27069566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY)); 27079566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY)); 270817ab2063SBarry Smith 27099566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow,&irow)); 2710416022c9SBarry Smith *B = C; 27113a40ed3dSBarry Smith PetscFunctionReturn(0); 271217ab2063SBarry Smith } 271317ab2063SBarry Smith 2714fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 271582d44351SHong Zhang { 271682d44351SHong Zhang Mat B; 271782d44351SHong Zhang 271882d44351SHong Zhang PetscFunctionBegin; 2719c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 27209566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm,&B)); 27219566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n)); 27229566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B,mat,mat)); 27239566063dSJacob Faibussowitsch PetscCall(MatSetType(B,MATSEQAIJ)); 27249566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE)); 272582d44351SHong Zhang *subMat = B; 2726c2d650bdSHong Zhang } else { 27279566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN)); 2728c2d650bdSHong Zhang } 272982d44351SHong Zhang PetscFunctionReturn(0); 273082d44351SHong Zhang } 273182d44351SHong Zhang 27329a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2733a871dcd8SBarry Smith { 273463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 273563b91edcSBarry Smith Mat outA; 2736ace3abfcSBarry Smith PetscBool row_identity,col_identity; 273763b91edcSBarry Smith 27383a40ed3dSBarry Smith PetscFunctionBegin; 273908401ef6SPierre Jolivet PetscCheck(info->levels == 0,PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 27401df811f5SHong Zhang 27419566063dSJacob Faibussowitsch PetscCall(ISIdentity(row,&row_identity)); 27429566063dSJacob Faibussowitsch PetscCall(ISIdentity(col,&col_identity)); 2743a871dcd8SBarry Smith 274463b91edcSBarry Smith outA = inA; 2745d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 27479566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype)); 27482205254eSKarl Rupp 27499566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 27509566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 27512205254eSKarl Rupp 2752c3122656SLisandro Dalcin a->row = row; 27532205254eSKarl Rupp 27549566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 27559566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 27562205254eSKarl Rupp 2757c3122656SLisandro Dalcin a->col = col; 275863b91edcSBarry Smith 275936db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 27609566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27619566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col,PETSC_DECIDE,&a->icol)); 27629566063dSJacob Faibussowitsch PetscCall(PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol)); 2763f0ec6fceSSatish Balay 276494a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n+1,&a->solve_work)); 27669566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar))); 276794a9d846SBarry Smith } 276863b91edcSBarry Smith 27699566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2770137fb511SHong Zhang if (row_identity && col_identity) { 27719566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info)); 2772137fb511SHong Zhang } else { 27739566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info)); 2774137fb511SHong Zhang } 27753a40ed3dSBarry Smith PetscFunctionReturn(0); 2776a871dcd8SBarry Smith } 2777a871dcd8SBarry Smith 2778f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2779f0b747eeSBarry Smith { 2780f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2781dfa0f9e5SStefano Zampini PetscScalar *v; 2782c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 27833a40ed3dSBarry Smith 27843a40ed3dSBarry Smith PetscFunctionBegin; 27859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA,&v)); 27869566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz,&bnz)); 2787dfa0f9e5SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&alpha,v,&one)); 27889566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA,&v)); 27909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27913a40ed3dSBarry Smith PetscFunctionReturn(0); 2792f0b747eeSBarry Smith } 2793f0b747eeSBarry Smith 2794f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 279516b64355SHong Zhang { 279616b64355SHong Zhang PetscInt i; 279716b64355SHong Zhang 279816b64355SHong Zhang PetscFunctionBegin; 279916b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 28009566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr)); 280116b64355SHong Zhang 280216b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 28039566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->sbuf2[i])); 280416b64355SHong Zhang } 28059566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1)); 280616b64355SHong Zhang 280716b64355SHong Zhang if (submatj->rbuf1) { 28089566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 28099566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 281016b64355SHong Zhang } 281116b64355SHong Zhang 281216b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 28139566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf3[i])); 281416b64355SHong Zhang } 28159566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3)); 28169566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 281716b64355SHong Zhang } 281816b64355SHong Zhang 281916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28209566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->rmap)); 28219566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 28229566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 282316b64355SHong Zhang #else 28249566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 282516b64355SHong Zhang #endif 282616b64355SHong Zhang 282716b64355SHong Zhang if (!submatj->allcolumns) { 282816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28299566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->cmap)); 283016b64355SHong Zhang #else 28319566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 283216b64355SHong Zhang #endif 283316b64355SHong Zhang } 28349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 283516b64355SHong Zhang 28369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 283716b64355SHong Zhang PetscFunctionReturn(0); 283816b64355SHong Zhang } 283916b64355SHong Zhang 28400fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 284116b64355SHong Zhang { 284216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 28435c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 284416b64355SHong Zhang 284516b64355SHong Zhang PetscFunctionBegin; 28469566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28479566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 284816b64355SHong Zhang PetscFunctionReturn(0); 284916b64355SHong Zhang } 285016b64355SHong Zhang 28512d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 28522d033e1fSHong Zhang { 28532d033e1fSHong Zhang PetscInt i; 28540fb991dcSHong Zhang Mat C; 28550fb991dcSHong Zhang Mat_SeqAIJ *c; 28560fb991dcSHong Zhang Mat_SubSppt *submatj; 28572d033e1fSHong Zhang 28582d033e1fSHong Zhang PetscFunctionBegin; 28592d033e1fSHong Zhang for (i=0; i<n; i++) { 28600fb991dcSHong Zhang C = (*mat)[i]; 28610fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 28620fb991dcSHong Zhang submatj = c->submatis1; 28632d033e1fSHong Zhang if (submatj) { 2864682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 28659566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28669566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28679566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28689566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28699566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28709566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2871682e4c99SStefano Zampini } 28722d033e1fSHong Zhang } else { 28739566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28742d033e1fSHong Zhang } 28752d033e1fSHong Zhang } 287686e85357SHong Zhang 287763a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28789566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n,mat)); 287963a75b2aSHong Zhang 28809566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28812d033e1fSHong Zhang PetscFunctionReturn(0); 28822d033e1fSHong Zhang } 28832d033e1fSHong Zhang 28847dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2885cddf8d76SBarry Smith { 288697f1f81fSBarry Smith PetscInt i; 2887cddf8d76SBarry Smith 28883a40ed3dSBarry Smith PetscFunctionBegin; 2889cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 28909566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n+1,B)); 2891cddf8d76SBarry Smith } 2892cddf8d76SBarry Smith 2893cddf8d76SBarry Smith for (i=0; i<n; i++) { 28949566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i])); 2895cddf8d76SBarry Smith } 28963a40ed3dSBarry Smith PetscFunctionReturn(0); 2897cddf8d76SBarry Smith } 2898cddf8d76SBarry Smith 289997f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 29004dcbc457SBarry Smith { 2901e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29025d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 29035d0c19d7SBarry Smith const PetscInt *idx; 290497f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2905f1af5d2fSBarry Smith PetscBT table; 2906bbd702dbSSatish Balay 29073a40ed3dSBarry Smith PetscFunctionBegin; 2908d0f46423SBarry Smith m = A->rmap->n; 2909e4d965acSSatish Balay ai = a->i; 2910bfeeae90SHong Zhang aj = a->j; 29118a047759SSatish Balay 291208401ef6SPierre Jolivet PetscCheck(ov >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 291306763907SSatish Balay 29149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&nidx)); 29159566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m,&table)); 291606763907SSatish Balay 2917e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2918b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2919e4d965acSSatish Balay isz = 0; 29209566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m,table)); 2921e4d965acSSatish Balay 2922e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 29239566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i],&idx)); 29249566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i],&n)); 2925e4d965acSSatish Balay 2926dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2927e4d965acSSatish Balay for (j=0; j<n; ++j) { 29282205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 29294dcbc457SBarry Smith } 29309566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i],&idx)); 29319566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2932e4d965acSSatish Balay 293304a348a9SBarry Smith k = 0; 293404a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 293504a348a9SBarry Smith n = isz; 293606763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2937e4d965acSSatish Balay row = nidx[k]; 2938e4d965acSSatish Balay start = ai[row]; 2939e4d965acSSatish Balay end = ai[row+1]; 294004a348a9SBarry Smith for (l = start; l<end; l++) { 2941efb16452SHong Zhang val = aj[l]; 29422205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2943e4d965acSSatish Balay } 2944e4d965acSSatish Balay } 2945e4d965acSSatish Balay } 29469566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i))); 2947e4d965acSSatish Balay } 29489566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29499566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29503a40ed3dSBarry Smith PetscFunctionReturn(0); 29514dcbc457SBarry Smith } 295217ab2063SBarry Smith 29530513a670SBarry Smith /* -------------------------------------------------------------- */ 2954dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 29550513a670SBarry Smith { 29560513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29573b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 29585d0c19d7SBarry Smith const PetscInt *row,*col; 29595d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 296056cd22aeSBarry Smith IS icolp,irowp; 29610298fd71SBarry Smith PetscInt *cwork = NULL; 29620298fd71SBarry Smith PetscScalar *vwork = NULL; 29630513a670SBarry Smith 29643a40ed3dSBarry Smith PetscFunctionBegin; 29659566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp,PETSC_DECIDE,&irowp)); 29669566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp,&row)); 29679566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp,PETSC_DECIDE,&icolp)); 29689566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp,&col)); 29690513a670SBarry Smith 29700513a670SBarry Smith /* determine lengths of permuted rows */ 29719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&lens)); 29722205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 29739566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 29749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,m,n,m,n)); 29759566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 29769566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 29779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens)); 29789566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29790513a670SBarry Smith 29809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n,&cnew)); 29810513a670SBarry Smith for (i=0; i<m; i++) { 29829566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29832205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 29849566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES)); 29859566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29860513a670SBarry Smith } 29879566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29882205254eSKarl Rupp 29893c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29902205254eSKarl Rupp 29918c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29929566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B,A->boundtocpu)); 29939fe5e383SStefano Zampini #endif 29949566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 29959566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 29969566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp,&row)); 29979566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp,&col)); 29989566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29999566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 30006768869dSprj- if (rowp == colp) { 30019566063dSJacob Faibussowitsch PetscCall(MatPropagateSymmetryOptions(A,*B)); 30026768869dSprj- } 30033a40ed3dSBarry Smith PetscFunctionReturn(0); 30040513a670SBarry Smith } 30050513a670SBarry Smith 3006dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 3007cb5b572fSBarry Smith { 3008cb5b572fSBarry Smith PetscFunctionBegin; 300933f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 301033f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 3011be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3012be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 30132e5835c6SStefano Zampini const PetscScalar *aa; 3014be6bf707SBarry Smith 30159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 301608401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n],PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT,a->i[A->rmap->n],b->i[B->rmap->n]); 30179566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a,aa,a->i[A->rmap->n])); 30189566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 30199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 3020cb5b572fSBarry Smith } else { 30219566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A,B,str)); 3022cb5b572fSBarry Smith } 3023cb5b572fSBarry Smith PetscFunctionReturn(0); 3024cb5b572fSBarry Smith } 3025cb5b572fSBarry Smith 30264994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 3027273d9f13SBarry Smith { 3028273d9f13SBarry Smith PetscFunctionBegin; 30299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,NULL)); 3030273d9f13SBarry Smith PetscFunctionReturn(0); 3031273d9f13SBarry Smith } 3032273d9f13SBarry Smith 3033f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 30346c0721eeSBarry Smith { 30356c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 30366e111a19SKarl Rupp 30376c0721eeSBarry Smith PetscFunctionBegin; 30386c0721eeSBarry Smith *array = a->a; 30396c0721eeSBarry Smith PetscFunctionReturn(0); 30406c0721eeSBarry Smith } 30416c0721eeSBarry Smith 3042f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 30436c0721eeSBarry Smith { 30446c0721eeSBarry Smith PetscFunctionBegin; 3045f38c1e66SStefano Zampini *array = NULL; 30466c0721eeSBarry Smith PetscFunctionReturn(0); 30476c0721eeSBarry Smith } 3048273d9f13SBarry Smith 30498229c054SShri Abhyankar /* 30508229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 30518229c054SShri Abhyankar have different nonzero structure. 30528229c054SShri Abhyankar */ 3053b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 3054ec7775f6SShri Abhyankar { 3055b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 3056ec7775f6SShri Abhyankar 3057ec7775f6SShri Abhyankar PetscFunctionBegin; 3058ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3059ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 3060b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 3061b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 3062b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 30638af7cee1SJed Brown nnz[i] = 0; 30648af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 3065b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3066b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 30678af7cee1SJed Brown nnz[i]++; 30688af7cee1SJed Brown } 30698af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 3070ec7775f6SShri Abhyankar } 3071ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3072ec7775f6SShri Abhyankar } 3073ec7775f6SShri Abhyankar 3074b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 3075b264fe52SHong Zhang { 3076b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3077b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 3078b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 3079b264fe52SHong Zhang 3080b264fe52SHong Zhang PetscFunctionBegin; 3081b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30829566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz)); 3083b264fe52SHong Zhang PetscFunctionReturn(0); 3084b264fe52SHong Zhang } 3085b264fe52SHong Zhang 3086f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 3087ac90fabeSBarry Smith { 3088ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 3089ac90fabeSBarry Smith 3090ac90fabeSBarry Smith PetscFunctionBegin; 3091134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3092134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3093134adf20SPierre Jolivet if (e) { 30949566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i,y->i,Y->rmap->n+1,&e)); 309581fa06acSBarry Smith if (e) { 30969566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j,y->j,y->nz,&e)); 3097134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 309881fa06acSBarry Smith } 309981fa06acSBarry Smith } 310054c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"MatStructure is not SAME_NONZERO_PATTERN"); 310181fa06acSBarry Smith } 3102ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 31032e5835c6SStefano Zampini const PetscScalar *xa; 31042e5835c6SStefano Zampini PetscScalar *ya,alpha = a; 310581fa06acSBarry Smith PetscBLASInt one = 1,bnz; 310681fa06acSBarry Smith 31079566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz,&bnz)); 31089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&ya)); 31099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X,&xa)); 31102e5835c6SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,xa,&one,ya,&one)); 31119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X,&xa)); 31129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&ya)); 31139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*bnz)); 31149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 31159566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3116ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 31179566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y,a,X,str)); 3118ac90fabeSBarry Smith } else { 31198229c054SShri Abhyankar Mat B; 31208229c054SShri Abhyankar PetscInt *nnz; 31219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N,&nnz)); 31229566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y),&B)); 31239566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name)); 31249566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B,Y->rmap,Y->cmap)); 31259566063dSJacob Faibussowitsch PetscCall(MatSetType(B,((PetscObject)Y)->type_name)); 31269566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz)); 31279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B,0,nnz)); 31289566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 31299566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y,&B)); 31309566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3131ac90fabeSBarry Smith } 3132ac90fabeSBarry Smith PetscFunctionReturn(0); 3133ac90fabeSBarry Smith } 3134ac90fabeSBarry Smith 31352726fb6dSPierre Jolivet PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3136354c94deSBarry Smith { 3137354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3138354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3139354c94deSBarry Smith PetscInt i,nz; 3140354c94deSBarry Smith PetscScalar *a; 3141354c94deSBarry Smith 3142354c94deSBarry Smith PetscFunctionBegin; 3143354c94deSBarry Smith nz = aij->nz; 31449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat,&a)); 31452205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 31469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat,&a)); 3147354c94deSBarry Smith #else 3148354c94deSBarry Smith PetscFunctionBegin; 3149354c94deSBarry Smith #endif 3150354c94deSBarry Smith PetscFunctionReturn(0); 3151354c94deSBarry Smith } 3152354c94deSBarry Smith 3153985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3154e34fafa9SBarry Smith { 3155e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3156d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3157e34fafa9SBarry Smith PetscReal atmp; 3158985db425SBarry Smith PetscScalar *x; 3159ce496241SStefano Zampini const MatScalar *aa,*av; 3160e34fafa9SBarry Smith 3161e34fafa9SBarry Smith PetscFunctionBegin; 316228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3164ce496241SStefano Zampini aa = av; 3165e34fafa9SBarry Smith ai = a->i; 3166e34fafa9SBarry Smith aj = a->j; 3167e34fafa9SBarry Smith 31689566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31699566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31709566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 317108401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3172e34fafa9SBarry Smith for (i=0; i<m; i++) { 3173e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 3174e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3175985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3176985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3177985db425SBarry Smith aa++; aj++; 3178985db425SBarry Smith } 3179985db425SBarry Smith } 31809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 31819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3182985db425SBarry Smith PetscFunctionReturn(0); 3183985db425SBarry Smith } 3184985db425SBarry Smith 3185985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3186985db425SBarry Smith { 3187985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3188d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3189985db425SBarry Smith PetscScalar *x; 3190ce496241SStefano Zampini const MatScalar *aa,*av; 3191985db425SBarry Smith 3192985db425SBarry Smith PetscFunctionBegin; 319328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3195ce496241SStefano Zampini aa = av; 3196985db425SBarry Smith ai = a->i; 3197985db425SBarry Smith aj = a->j; 3198985db425SBarry Smith 31999566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32009566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32019566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 320208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3203985db425SBarry Smith for (i=0; i<m; i++) { 3204985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3205d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3206985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3207985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3208985db425SBarry Smith x[i] = 0.0; 3209985db425SBarry Smith if (idx) { 3210985db425SBarry Smith for (j=0; j<ncols; j++) { /* find first implicit 0.0 in the row */ 3211985db425SBarry Smith if (aj[j] > j) { 3212985db425SBarry Smith idx[i] = j; 3213985db425SBarry Smith break; 3214985db425SBarry Smith } 3215985db425SBarry Smith } 32161a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 32171a254869SHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3218985db425SBarry Smith } 3219985db425SBarry Smith } 3220985db425SBarry Smith for (j=0; j<ncols; j++) { 3221985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3222985db425SBarry Smith aa++; aj++; 3223985db425SBarry Smith } 3224985db425SBarry Smith } 32259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3227985db425SBarry Smith PetscFunctionReturn(0); 3228985db425SBarry Smith } 3229985db425SBarry Smith 3230c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3231c87e5d42SMatthew Knepley { 3232c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3233c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3234ce496241SStefano Zampini PetscScalar *x; 3235ce496241SStefano Zampini const MatScalar *aa,*av; 3236c87e5d42SMatthew Knepley 3237c87e5d42SMatthew Knepley PetscFunctionBegin; 32389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3239ce496241SStefano Zampini aa = av; 3240c87e5d42SMatthew Knepley ai = a->i; 3241c87e5d42SMatthew Knepley aj = a->j; 3242c87e5d42SMatthew Knepley 32439566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32449566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32459566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 324608401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3247c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3248c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3249f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 3250f07e67edSHong Zhang x[i] = *aa; if (idx) idx[i] = 0; 3251f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3252f07e67edSHong Zhang x[i] = 0.0; 3253f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3254289a08f5SMatthew Knepley for (j=0; j<ncols; j++) { 3255f07e67edSHong Zhang if (aj[j] > j) { 3256f07e67edSHong Zhang idx[i] = j; 32572205254eSKarl Rupp break; 32582205254eSKarl Rupp } 3259289a08f5SMatthew Knepley } 3260f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3261f07e67edSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3262f07e67edSHong Zhang } 3263289a08f5SMatthew Knepley } 3264c87e5d42SMatthew Knepley for (j=0; j<ncols; j++) { 3265f07e67edSHong Zhang if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3266c87e5d42SMatthew Knepley aa++; aj++; 3267c87e5d42SMatthew Knepley } 3268c87e5d42SMatthew Knepley } 32699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3271c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3272c87e5d42SMatthew Knepley } 3273c87e5d42SMatthew Knepley 3274985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3275985db425SBarry Smith { 3276985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3277d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3278d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3279985db425SBarry Smith PetscScalar *x; 3280ce496241SStefano Zampini const MatScalar *aa,*av; 3281985db425SBarry Smith 3282985db425SBarry Smith PetscFunctionBegin; 328328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 32849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3285ce496241SStefano Zampini aa = av; 3286985db425SBarry Smith ai = a->i; 3287985db425SBarry Smith aj = a->j; 3288985db425SBarry Smith 32899566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32909566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32919566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 329208401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3293985db425SBarry Smith for (i=0; i<m; i++) { 3294985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3295d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3296985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3297985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3298985db425SBarry Smith x[i] = 0.0; 3299985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3300985db425SBarry Smith for (j=0; j<ncols; j++) { 3301985db425SBarry Smith if (aj[j] > j) { 3302985db425SBarry Smith idx[i] = j; 3303985db425SBarry Smith break; 3304985db425SBarry Smith } 3305985db425SBarry Smith } 3306fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3307fa213d2fSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3308985db425SBarry Smith } 3309985db425SBarry Smith } 3310985db425SBarry Smith for (j=0; j<ncols; j++) { 3311985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3312985db425SBarry Smith aa++; aj++; 3313e34fafa9SBarry Smith } 3314e34fafa9SBarry Smith } 33159566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 33169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3317e34fafa9SBarry Smith PetscFunctionReturn(0); 3318e34fafa9SBarry Smith } 3319bbead8a2SBarry Smith 3320713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3321bbead8a2SBarry Smith { 3322bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 332333d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3324bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 33250da83c2eSBarry Smith const PetscReal shift = 0.0; 33261a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3327bbead8a2SBarry Smith 3328bbead8a2SBarry Smith PetscFunctionBegin; 3329a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33304a0d0026SBarry Smith if (a->ibdiagvalid) { 33314a0d0026SBarry Smith if (values) *values = a->ibdiag; 33324a0d0026SBarry Smith PetscFunctionReturn(0); 33334a0d0026SBarry Smith } 33349566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 3335bbead8a2SBarry Smith if (!a->ibdiag) { 33369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2*mbs,&a->ibdiag)); 33379566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar))); 3338bbead8a2SBarry Smith } 3339bbead8a2SBarry Smith diag = a->ibdiag; 3340bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3341bbead8a2SBarry Smith /* factor and invert each block */ 3342bbead8a2SBarry Smith switch (bs) { 3343bbead8a2SBarry Smith case 1: 3344bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 33459566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,1,&i,1,&i,diag+i)); 3346ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3347ec1892c8SHong Zhang if (allowzeropivot) { 33487b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33497b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33507b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON)); 335298921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3353ec1892c8SHong Zhang } 3354bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3355bbead8a2SBarry Smith } 3356bbead8a2SBarry Smith break; 3357bbead8a2SBarry Smith case 2: 3358bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3359bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 33609566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,2,ij,2,ij,diag)); 33619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 33627b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3364bbead8a2SBarry Smith diag += 4; 3365bbead8a2SBarry Smith } 3366bbead8a2SBarry Smith break; 3367bbead8a2SBarry Smith case 3: 3368bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3369bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 33709566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,3,ij,3,ij,diag)); 33719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 33727b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3374bbead8a2SBarry Smith diag += 9; 3375bbead8a2SBarry Smith } 3376bbead8a2SBarry Smith break; 3377bbead8a2SBarry Smith case 4: 3378bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3379bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 33809566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,4,ij,4,ij,diag)); 33819566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 33827b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33839566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3384bbead8a2SBarry Smith diag += 16; 3385bbead8a2SBarry Smith } 3386bbead8a2SBarry Smith break; 3387bbead8a2SBarry Smith case 5: 3388bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3389bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 33909566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,5,ij,5,ij,diag)); 33919566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 33927b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33939566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3394bbead8a2SBarry Smith diag += 25; 3395bbead8a2SBarry Smith } 3396bbead8a2SBarry Smith break; 3397bbead8a2SBarry Smith case 6: 3398bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3399bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 34009566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,6,ij,6,ij,diag)); 34019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 34027b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3404bbead8a2SBarry Smith diag += 36; 3405bbead8a2SBarry Smith } 3406bbead8a2SBarry Smith break; 3407bbead8a2SBarry Smith case 7: 3408bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3409bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 34109566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,7,ij,7,ij,diag)); 34119566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 34127b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34139566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3414bbead8a2SBarry Smith diag += 49; 3415bbead8a2SBarry Smith } 3416bbead8a2SBarry Smith break; 3417bbead8a2SBarry Smith default: 34189566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ)); 3419bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3420bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3421bbead8a2SBarry Smith IJ[j] = bs*i + j; 3422bbead8a2SBarry Smith } 34239566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bs,IJ,bs,IJ,diag)); 34249566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 34257b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bs)); 3427bbead8a2SBarry Smith diag += bs2; 3428bbead8a2SBarry Smith } 34299566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work,v_pivots,IJ)); 3430bbead8a2SBarry Smith } 3431bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3432bbead8a2SBarry Smith PetscFunctionReturn(0); 3433bbead8a2SBarry Smith } 3434bbead8a2SBarry Smith 343573a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 343673a71a0fSBarry Smith { 343773a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3438fff043a9SJunchao Zhang PetscScalar a,*aa; 343973a71a0fSBarry Smith PetscInt m,n,i,j,col; 344073a71a0fSBarry Smith 344173a71a0fSBarry Smith PetscFunctionBegin; 344273a71a0fSBarry Smith if (!x->assembled) { 34439566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 344473a71a0fSBarry Smith for (i=0; i<m; i++) { 344573a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 34469566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 344773a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 34489566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 344973a71a0fSBarry Smith } 345073a71a0fSBarry Smith } 3451e2ce353bSJunchao Zhang } else { 34529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x,&aa)); 34539566063dSJacob Faibussowitsch for (i=0; i<aij->nz; i++) PetscCall(PetscRandomGetValue(rctx,aa+i)); 34549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x,&aa)); 3455e2ce353bSJunchao Zhang } 34569566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34579566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 345873a71a0fSBarry Smith PetscFunctionReturn(0); 345973a71a0fSBarry Smith } 346073a71a0fSBarry Smith 3461679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3462679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3463679944adSJunchao Zhang { 3464679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3465679944adSJunchao Zhang PetscScalar a; 3466679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3467679944adSJunchao Zhang 3468679944adSJunchao Zhang PetscFunctionBegin; 3469679944adSJunchao Zhang nskip = high - low; 34709566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 3471679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3472679944adSJunchao Zhang for (i=0; i<m; i++) { 3473679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 34749566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 3475679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3476679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34779566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 3478679944adSJunchao Zhang } 3479e2ce353bSJunchao Zhang } 34809566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34819566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 3482679944adSJunchao Zhang PetscFunctionReturn(0); 3483679944adSJunchao Zhang } 3484679944adSJunchao Zhang 3485682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34860a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3487cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3488cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3489cb5b572fSBarry Smith MatMult_SeqAIJ, 349097304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34917c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34927c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3493f4259b30SLisandro Dalcin NULL, 3494f4259b30SLisandro Dalcin NULL, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin /* 10*/ NULL, 3497cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3498f4259b30SLisandro Dalcin NULL, 349941f059aeSBarry Smith MatSOR_SeqAIJ, 350091e9d3e2SHong Zhang MatTranspose_SeqAIJ, 350197304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3502cb5b572fSBarry Smith MatEqual_SeqAIJ, 3503cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3504cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3505cb5b572fSBarry Smith MatNorm_SeqAIJ, 3506f4259b30SLisandro Dalcin /* 20*/ NULL, 3507cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3508cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3509cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3510d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3511f4259b30SLisandro Dalcin NULL, 3512f4259b30SLisandro Dalcin NULL, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 35154994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3516f4259b30SLisandro Dalcin NULL, 3517f4259b30SLisandro Dalcin NULL, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3521f4259b30SLisandro Dalcin NULL, 3522f4259b30SLisandro Dalcin NULL, 3523cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3524f4259b30SLisandro Dalcin NULL, 3525d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35267dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3527cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3528cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3529cb5b572fSBarry Smith MatCopy_SeqAIJ, 3530d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3531cb5b572fSBarry Smith MatScale_SeqAIJ, 35327d68702bSBarry Smith MatShift_SeqAIJ, 353379299369SBarry Smith MatDiagonalSet_SeqAIJ, 35346e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 353573a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35363b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35373b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35383b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3539a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 354093dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3541f4259b30SLisandro Dalcin NULL, 3542f4259b30SLisandro Dalcin NULL, 3543cda55fadSBarry Smith MatPermute_SeqAIJ, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin /* 59*/ NULL, 3546b9b97703SBarry Smith MatDestroy_SeqAIJ, 3547b9b97703SBarry Smith MatView_SeqAIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin /* 64*/ NULL, 3551321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3556c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin /* 74*/ NULL, 35613acb8795SBarry Smith MatFDColoringApply_AIJ, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 35656ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3566f4259b30SLisandro Dalcin NULL, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 3569bc011b1eSHong Zhang MatLoad_SeqAIJ, 3570d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35711cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3572f4259b30SLisandro Dalcin NULL, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin /* 89*/ NULL, 3576f4259b30SLisandro Dalcin NULL, 357726be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3578f4259b30SLisandro Dalcin NULL, 3579f4259b30SLisandro Dalcin NULL, 35808fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3581f4259b30SLisandro Dalcin NULL, 3582f4259b30SLisandro Dalcin NULL, 35836fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3584f4259b30SLisandro Dalcin NULL, 35854222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3586f4259b30SLisandro Dalcin NULL, 3587f4259b30SLisandro Dalcin NULL, 358887d4246cSBarry Smith MatConjugate_SeqAIJ, 3589f4259b30SLisandro Dalcin NULL, 3590d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 359199cafbc1SBarry Smith MatRealPart_SeqAIJ, 3592f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3596f4259b30SLisandro Dalcin NULL, 35972af78befSBarry Smith MatGetRowMin_SeqAIJ, 3598f4259b30SLisandro Dalcin NULL, 3599599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3600f4259b30SLisandro Dalcin /*114*/ NULL, 3601f4259b30SLisandro Dalcin NULL, 3602f4259b30SLisandro Dalcin NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 3605f4259b30SLisandro Dalcin /*119*/ NULL, 3606f4259b30SLisandro Dalcin NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin NULL, 3609b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36100716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3611a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 361237868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36130da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3614f4259b30SLisandro Dalcin NULL, 3615f4259b30SLisandro Dalcin /*129*/ NULL, 3616f4259b30SLisandro Dalcin NULL, 3617f4259b30SLisandro Dalcin NULL, 361875648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3619b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3620b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36212b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3622f4259b30SLisandro Dalcin NULL, 3623f4259b30SLisandro Dalcin NULL, 36243964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3625f4259b30SLisandro Dalcin /*139*/NULL, 3626f4259b30SLisandro Dalcin NULL, 3627f4259b30SLisandro Dalcin NULL, 36283a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36299c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36304222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36314222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 3632f4259b30SLisandro Dalcin NULL, 3633f4259b30SLisandro Dalcin NULL 36349e29f15eSvictorle }; 363517ab2063SBarry Smith 36367087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3637bef8e0ddSBarry Smith { 3638bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 363997f1f81fSBarry Smith PetscInt i,nz,n; 3640bef8e0ddSBarry Smith 3641bef8e0ddSBarry Smith PetscFunctionBegin; 3642bef8e0ddSBarry Smith nz = aij->maxnz; 3643d0f46423SBarry Smith n = mat->rmap->n; 3644bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3645bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3646bef8e0ddSBarry Smith } 3647bef8e0ddSBarry Smith aij->nz = nz; 3648bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3649bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3650bef8e0ddSBarry Smith } 3651bef8e0ddSBarry Smith PetscFunctionReturn(0); 3652bef8e0ddSBarry Smith } 3653bef8e0ddSBarry Smith 3654a3bb6f32SFande Kong /* 3655ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3656ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3657ddea5d60SJunchao Zhang */ 3658a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3659a3bb6f32SFande Kong { 3660a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3661a3bb6f32SFande Kong PetscTable gid1_lid1; 3662a3bb6f32SFande Kong PetscTablePosition tpos; 366325b670f0SStefano Zampini PetscInt gid,lid,i,ec,nz = aij->nz; 366425b670f0SStefano Zampini PetscInt *garray,*jj = aij->j; 3665a3bb6f32SFande Kong 3666a3bb6f32SFande Kong PetscFunctionBegin; 3667a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3668a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3669a3bb6f32SFande Kong /* use a table */ 36709566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1)); 3671a3bb6f32SFande Kong ec = 0; 367225b670f0SStefano Zampini for (i=0; i<nz; i++) { 367325b670f0SStefano Zampini PetscInt data,gid1 = jj[i] + 1; 36749566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&data)); 3675a3bb6f32SFande Kong if (!data) { 3676a3bb6f32SFande Kong /* one based table */ 36779566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES)); 3678a3bb6f32SFande Kong } 3679a3bb6f32SFande Kong } 3680a3bb6f32SFande Kong /* form array of columns we need */ 36819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec,&garray)); 36829566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1,&tpos)); 3683a3bb6f32SFande Kong while (tpos) { 36849566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid)); 3685a3bb6f32SFande Kong gid--; 3686a3bb6f32SFande Kong lid--; 3687a3bb6f32SFande Kong garray[lid] = gid; 3688a3bb6f32SFande Kong } 36899566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec,garray)); /* sort, and rebuild */ 36909566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 3691a3bb6f32SFande Kong for (i=0; i<ec; i++) { 36929566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES)); 3693a3bb6f32SFande Kong } 3694a3bb6f32SFande Kong /* compact out the extra columns in B */ 369525b670f0SStefano Zampini for (i=0; i<nz; i++) { 369625b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36979566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&lid)); 3698a3bb6f32SFande Kong lid--; 369925b670f0SStefano Zampini jj[i] = lid; 3700a3bb6f32SFande Kong } 37019566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 37029566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 37039566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap)); 37049566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping)); 37059566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH)); 3706a3bb6f32SFande Kong PetscFunctionReturn(0); 3707a3bb6f32SFande Kong } 3708a3bb6f32SFande Kong 3709bef8e0ddSBarry Smith /*@ 3710bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3711bef8e0ddSBarry Smith in the matrix. 3712bef8e0ddSBarry Smith 3713bef8e0ddSBarry Smith Input Parameters: 3714bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3715bef8e0ddSBarry Smith - indices - the column indices 3716bef8e0ddSBarry Smith 371715091d37SBarry Smith Level: advanced 371815091d37SBarry Smith 3719bef8e0ddSBarry Smith Notes: 3720bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3721bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3722bef8e0ddSBarry Smith of the MatSetValues() operation. 3723bef8e0ddSBarry Smith 3724bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3725d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3726bef8e0ddSBarry Smith 3727bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3728bef8e0ddSBarry Smith 3729b9617806SBarry Smith The indices should start with zero, not one. 3730b9617806SBarry Smith 3731bef8e0ddSBarry Smith @*/ 37327087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3733bef8e0ddSBarry Smith { 3734bef8e0ddSBarry Smith PetscFunctionBegin; 37350700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3736dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices,2); 3737cac4c232SBarry Smith PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices)); 3738bef8e0ddSBarry Smith PetscFunctionReturn(0); 3739bef8e0ddSBarry Smith } 3740bef8e0ddSBarry Smith 3741be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3742be6bf707SBarry Smith 37437087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3744be6bf707SBarry Smith { 3745be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3746d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3747be6bf707SBarry Smith 3748be6bf707SBarry Smith PetscFunctionBegin; 374928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3750be6bf707SBarry Smith 3751be6bf707SBarry Smith /* allocate space for values if not already there */ 3752be6bf707SBarry Smith if (!aij->saved_values) { 37539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&aij->saved_values)); 37549566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar))); 3755be6bf707SBarry Smith } 3756be6bf707SBarry Smith 3757be6bf707SBarry Smith /* copy values over */ 37589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values,aij->a,nz)); 3759be6bf707SBarry Smith PetscFunctionReturn(0); 3760be6bf707SBarry Smith } 3761be6bf707SBarry Smith 3762be6bf707SBarry Smith /*@ 3763be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3764be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3765be6bf707SBarry Smith nonlinear portion. 3766be6bf707SBarry Smith 3767be6bf707SBarry Smith Collect on Mat 3768be6bf707SBarry Smith 3769be6bf707SBarry Smith Input Parameters: 37700e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3771be6bf707SBarry Smith 377215091d37SBarry Smith Level: advanced 377315091d37SBarry Smith 3774be6bf707SBarry Smith Common Usage, with SNESSolve(): 3775be6bf707SBarry Smith $ Create Jacobian matrix 3776be6bf707SBarry Smith $ Set linear terms into matrix 3777be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3778be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3779be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3780512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3781be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3782be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3783be6bf707SBarry Smith $ In your Jacobian routine 3784be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3785be6bf707SBarry Smith $ Set nonlinear terms in matrix 3786be6bf707SBarry Smith 3787be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3788be6bf707SBarry Smith $ // build linear portion of Jacobian 3789512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3790be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3791be6bf707SBarry Smith $ loop over nonlinear iterations 3792be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3793be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3794be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3795be6bf707SBarry Smith $ Solve linear system with Jacobian 3796be6bf707SBarry Smith $ endloop 3797be6bf707SBarry Smith 3798be6bf707SBarry Smith Notes: 3799be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3800512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3801be6bf707SBarry Smith calling this routine. 3802be6bf707SBarry Smith 38030c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 38040c468ba9SBarry Smith and does not allocated additional space. 38050c468ba9SBarry Smith 3806db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3807be6bf707SBarry Smith 3808be6bf707SBarry Smith @*/ 38097087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3810be6bf707SBarry Smith { 3811be6bf707SBarry Smith PetscFunctionBegin; 38120700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 381328b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 381428b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3815cac4c232SBarry Smith PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat)); 3816be6bf707SBarry Smith PetscFunctionReturn(0); 3817be6bf707SBarry Smith } 3818be6bf707SBarry Smith 38197087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3820be6bf707SBarry Smith { 3821be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3822d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3823be6bf707SBarry Smith 3824be6bf707SBarry Smith PetscFunctionBegin; 382528b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 382628b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3827be6bf707SBarry Smith /* copy values over */ 38289566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a,aij->saved_values,nz)); 3829be6bf707SBarry Smith PetscFunctionReturn(0); 3830be6bf707SBarry Smith } 3831be6bf707SBarry Smith 3832be6bf707SBarry Smith /*@ 3833be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3834be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3835be6bf707SBarry Smith nonlinear portion. 3836be6bf707SBarry Smith 3837be6bf707SBarry Smith Collect on Mat 3838be6bf707SBarry Smith 3839be6bf707SBarry Smith Input Parameters: 3840386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3841be6bf707SBarry Smith 384215091d37SBarry Smith Level: advanced 384315091d37SBarry Smith 3844db781477SPatrick Sanan .seealso: `MatStoreValues()` 3845be6bf707SBarry Smith 3846be6bf707SBarry Smith @*/ 38477087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3848be6bf707SBarry Smith { 3849be6bf707SBarry Smith PetscFunctionBegin; 38500700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 385128b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 385228b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3853cac4c232SBarry Smith PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat)); 3854be6bf707SBarry Smith PetscFunctionReturn(0); 3855be6bf707SBarry Smith } 3856be6bf707SBarry Smith 3857be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 385817ab2063SBarry Smith /*@C 3859682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 38600d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38616e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 386251c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38632bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 386417ab2063SBarry Smith 3865d083f849SBarry Smith Collective 3866db81eaa0SLois Curfman McInnes 386717ab2063SBarry Smith Input Parameters: 3868db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 386917ab2063SBarry Smith . m - number of rows 387017ab2063SBarry Smith . n - number of columns 387117ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 387251c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38730298fd71SBarry Smith (possibly different for each row) or NULL 387417ab2063SBarry Smith 387517ab2063SBarry Smith Output Parameter: 3876416022c9SBarry Smith . A - the matrix 387717ab2063SBarry Smith 3878175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3879f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3880175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3881175b88e8SBarry Smith 3882b259b22eSLois Curfman McInnes Notes: 388349a6f317SBarry Smith If nnz is given then nz is ignored 388449a6f317SBarry Smith 388517ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 388617ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 38870002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 388844cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 388917ab2063SBarry Smith 389017ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38910298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 38923d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38936da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 389417ab2063SBarry Smith 3895682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38964fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3897682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38986c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38996c7ebb05SLois Curfman McInnes 39006c7ebb05SLois Curfman McInnes Options Database Keys: 3901698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 39029db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 390317ab2063SBarry Smith 3904027ccd11SLois Curfman McInnes Level: intermediate 3905027ccd11SLois Curfman McInnes 3906db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 390736db0b34SBarry Smith 390817ab2063SBarry Smith @*/ 39097087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 391017ab2063SBarry Smith { 39113a40ed3dSBarry Smith PetscFunctionBegin; 39129566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,A)); 39139566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A,m,n,m,n)); 39149566063dSJacob Faibussowitsch PetscCall(MatSetType(*A,MATSEQAIJ)); 39159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz)); 3916273d9f13SBarry Smith PetscFunctionReturn(0); 3917273d9f13SBarry Smith } 3918273d9f13SBarry Smith 3919273d9f13SBarry Smith /*@C 3920273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3921273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3922273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3923273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3924273d9f13SBarry Smith 3925d083f849SBarry Smith Collective 3926273d9f13SBarry Smith 3927273d9f13SBarry Smith Input Parameters: 39281c4f3114SJed Brown + B - The matrix 3929273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3930273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39310298fd71SBarry Smith (possibly different for each row) or NULL 3932273d9f13SBarry Smith 3933273d9f13SBarry Smith Notes: 393449a6f317SBarry Smith If nnz is given then nz is ignored 393549a6f317SBarry Smith 3936273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3937273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3938273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3939273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3940273d9f13SBarry Smith 3941273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 39420298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3943273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3944273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3945273d9f13SBarry Smith 3946aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3947aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3948aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3949aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3950aa95bbe8SBarry Smith 3951a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3952a96a251dSBarry Smith entries or columns indices 3953a96a251dSBarry Smith 3954273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3955273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3956273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3957273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3958273d9f13SBarry Smith 3959273d9f13SBarry Smith Options Database Keys: 3960698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 396147b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3962273d9f13SBarry Smith 3963273d9f13SBarry Smith Level: intermediate 3964273d9f13SBarry Smith 3965db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3966db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3967273d9f13SBarry Smith 3968273d9f13SBarry Smith @*/ 39697087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3970273d9f13SBarry Smith { 3971a23d5eceSKris Buschelman PetscFunctionBegin; 39726ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 39736ba663aaSJed Brown PetscValidType(B,1); 3974cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz)); 3975a23d5eceSKris Buschelman PetscFunctionReturn(0); 3976a23d5eceSKris Buschelman } 3977a23d5eceSKris Buschelman 39787087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3979a23d5eceSKris Buschelman { 3980273d9f13SBarry Smith Mat_SeqAIJ *b; 39812576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 398297f1f81fSBarry Smith PetscInt i; 3983273d9f13SBarry Smith 3984273d9f13SBarry Smith PetscFunctionBegin; 39852576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3986a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3987c461c341SBarry Smith skipallocation = PETSC_TRUE; 3988c461c341SBarry Smith nz = 0; 3989c461c341SBarry Smith } 39909566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39919566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3992899cda47SBarry Smith 3993435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 399408401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %" PetscInt_FMT,nz); 3995cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3996d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 399708401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT,i,nnz[i]); 399808401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT,i,nnz[i],B->cmap->n); 3999b73539f3SBarry Smith } 4000b73539f3SBarry Smith } 4001b73539f3SBarry Smith 4002273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 40032205254eSKarl Rupp 4004273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 4005273d9f13SBarry Smith 4006ab93d7beSBarry Smith if (!skipallocation) { 40072ee49352SLisandro Dalcin if (!b->imax) { 40089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->imax)); 40099566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4010071fcb05SBarry Smith } 4011071fcb05SBarry Smith if (!b->ilen) { 4012071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. */ 40139566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n,&b->ilen)); 40149566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4015071fcb05SBarry Smith } else { 40169566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt))); 40172ee49352SLisandro Dalcin } 4018846b4da1SFande Kong if (!b->ipre) { 40199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->ipre)); 40209566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4021846b4da1SFande Kong } 4022273d9f13SBarry Smith if (!nnz) { 4023435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4024c62bd62aSJed Brown else if (nz < 0) nz = 1; 40255d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 4026d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 4027d0f46423SBarry Smith nz = nz*B->rmap->n; 4028273d9f13SBarry Smith } else { 4029c73702f5SBarry Smith PetscInt64 nz64 = 0; 4030c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 40319566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64,&nz)); 4032273d9f13SBarry Smith } 4033ab93d7beSBarry Smith 4034273d9f13SBarry Smith /* allocate the matrix space */ 403553dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? */ 40369566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i)); 4037396832f4SHong Zhang if (B->structure_only) { 40389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&b->j)); 40399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n+1,&b->i)); 40409566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt))); 4041396832f4SHong Zhang } else { 40429566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i)); 40439566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)))); 4044396832f4SHong Zhang } 4045bfeeae90SHong Zhang b->i[0] = 0; 4046d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 40475da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 40485da197adSKris Buschelman } 4049396832f4SHong Zhang if (B->structure_only) { 4050396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4051396832f4SHong Zhang b->free_a = PETSC_FALSE; 4052396832f4SHong Zhang } else { 4053273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4054e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4055396832f4SHong Zhang } 4056e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4057c461c341SBarry Smith } else { 4058e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4059e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4060c461c341SBarry Smith } 4061273d9f13SBarry Smith 4062846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4063846b4da1SFande Kong /* reserve user-requested sparsity */ 40649566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre,b->imax,B->rmap->n)); 4065846b4da1SFande Kong } 4066846b4da1SFande Kong 4067273d9f13SBarry Smith b->nz = 0; 4068273d9f13SBarry Smith b->maxnz = nz; 4069273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40702205254eSKarl Rupp if (realalloc) { 40719566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE)); 40722205254eSKarl Rupp } 4073cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4074cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40755519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40765519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40775519a089SJose E. Roman */ 40785519a089SJose E. Roman B->nonzerostate++; 4079273d9f13SBarry Smith PetscFunctionReturn(0); 4080273d9f13SBarry Smith } 4081273d9f13SBarry Smith 4082846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4083846b4da1SFande Kong { 4084846b4da1SFande Kong Mat_SeqAIJ *a; 4085a5bbaf83SFande Kong PetscInt i; 4086846b4da1SFande Kong 4087846b4da1SFande Kong PetscFunctionBegin; 4088846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 408914d0e64fSAlex Lindsay 409014d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 409114d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 409214d0e64fSAlex Lindsay 4093846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 40942c814fdeSFande Kong /* if no saved info, we error out */ 409528b400f6SJacob Faibussowitsch PetscCheck(a->ipre,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info "); 40962c814fdeSFande Kong 4097aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation "); 40982c814fdeSFande Kong 40999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax,a->ipre,A->rmap->n)); 41009566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen,A->rmap->n)); 4101846b4da1SFande Kong a->i[0] = 0; 4102846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4103846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4104846b4da1SFande Kong } 4105846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4106846b4da1SFande Kong a->nz = 0; 4107846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4108846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4109846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4110846b4da1SFande Kong A->assembled = PETSC_FALSE; 4111846b4da1SFande Kong PetscFunctionReturn(0); 4112846b4da1SFande Kong } 4113846b4da1SFande Kong 411458d36128SBarry Smith /*@ 4115a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4116a1661176SMatthew Knepley 4117a1661176SMatthew Knepley Input Parameters: 4118a1661176SMatthew Knepley + B - the matrix 4119a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4120a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4121a1661176SMatthew Knepley - v - optional values in the matrix 4122a1661176SMatthew Knepley 4123a1661176SMatthew Knepley Level: developer 4124a1661176SMatthew Knepley 41256a9b8d82SBarry Smith Notes: 412658d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 412758d36128SBarry Smith 41286a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41296a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41306a9b8d82SBarry Smith 41316a9b8d82SBarry Smith Developer Notes: 41326a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 41336a9b8d82SBarry Smith then just copies the v values directly with PetscMemcpy(). 41346a9b8d82SBarry Smith 41356a9b8d82SBarry Smith This routine could also take a PetscCopyMode argument to allow sharing the values instead of always copying them. 41366a9b8d82SBarry Smith 4137db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4138a1661176SMatthew Knepley @*/ 4139a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4140a1661176SMatthew Knepley { 4141a1661176SMatthew Knepley PetscFunctionBegin; 41420700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 41436ba663aaSJed Brown PetscValidType(B,1); 4144cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v)); 4145a1661176SMatthew Knepley PetscFunctionReturn(0); 4146a1661176SMatthew Knepley } 4147a1661176SMatthew Knepley 41487087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4149a1661176SMatthew Knepley { 4150a1661176SMatthew Knepley PetscInt i; 4151a1661176SMatthew Knepley PetscInt m,n; 4152a1661176SMatthew Knepley PetscInt nz; 41536a9b8d82SBarry Smith PetscInt *nnz; 4154a1661176SMatthew Knepley 4155a1661176SMatthew Knepley PetscFunctionBegin; 4156aed4548fSBarry Smith PetscCheck(Ii[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4157779a8d59SSatish Balay 41589566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41599566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4160779a8d59SSatish Balay 41619566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1, &nnz)); 4163a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4164b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 416508401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4166a1661176SMatthew Knepley nnz[i] = nz; 4167a1661176SMatthew Knepley } 41689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41699566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4170a1661176SMatthew Knepley 4171a1661176SMatthew Knepley for (i = 0; i < m; i++) { 41729566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4173a1661176SMatthew Knepley } 4174a1661176SMatthew Knepley 41759566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 41769566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 4177a1661176SMatthew Knepley 41789566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE)); 4179a1661176SMatthew Knepley PetscFunctionReturn(0); 4180a1661176SMatthew Knepley } 4181a1661176SMatthew Knepley 4182ad7e164aSPierre Jolivet /*@ 4183ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4184ad7e164aSPierre Jolivet 4185ad7e164aSPierre Jolivet Input Parameters: 4186ad7e164aSPierre Jolivet + A - left-hand side matrix 4187ad7e164aSPierre Jolivet . B - right-hand side matrix 4188ad7e164aSPierre Jolivet - reuse - either MAT_INITIAL_MATRIX or MAT_REUSE_MATRIX 4189ad7e164aSPierre Jolivet 4190ad7e164aSPierre Jolivet Output Parameter: 4191ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4192ad7e164aSPierre Jolivet 4193ad7e164aSPierre Jolivet Level: intermediate 4194ad7e164aSPierre Jolivet 4195ad7e164aSPierre Jolivet Notes: 4196ad7e164aSPierre Jolivet MAT_REUSE_MATRIX can only be used when the nonzero structure of the product matrix has not changed from that last call to MatSeqAIJKron(). 4197ad7e164aSPierre Jolivet 4198db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4199ad7e164aSPierre Jolivet @*/ 4200ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron(Mat A,Mat B,MatReuse reuse,Mat *C) 4201ad7e164aSPierre Jolivet { 4202ad7e164aSPierre Jolivet PetscFunctionBegin; 4203ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A,MAT_CLASSID,1); 4204ad7e164aSPierre Jolivet PetscValidType(A,1); 4205ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B,MAT_CLASSID,2); 4206ad7e164aSPierre Jolivet PetscValidType(B,2); 4207ad7e164aSPierre Jolivet PetscValidPointer(C,4); 4208ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4209ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C,MAT_CLASSID,4); 4210ad7e164aSPierre Jolivet PetscValidType(*C,4); 4211ad7e164aSPierre Jolivet } 4212cac4c232SBarry Smith PetscTryMethod(A,"MatSeqAIJKron_C",(Mat,Mat,MatReuse,Mat*),(A,B,reuse,C)); 4213ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4214ad7e164aSPierre Jolivet } 4215ad7e164aSPierre Jolivet 4216ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A,Mat B,MatReuse reuse,Mat *C) 4217ad7e164aSPierre Jolivet { 4218ad7e164aSPierre Jolivet Mat newmat; 4219ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4220ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 4221ad7e164aSPierre Jolivet PetscScalar *v; 4222fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 4223ad7e164aSPierre Jolivet PetscInt *i,*j,m,n,p,q,nnz = 0,am = A->rmap->n,bm = B->rmap->n,an = A->cmap->n, bn = B->cmap->n; 4224ad7e164aSPierre Jolivet PetscBool flg; 4225ad7e164aSPierre Jolivet 4226ad7e164aSPierre Jolivet PetscFunctionBegin; 422728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 422828b400f6SJacob Faibussowitsch PetscCheck(A->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 422928b400f6SJacob Faibussowitsch PetscCheck(!B->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 423028b400f6SJacob Faibussowitsch PetscCheck(B->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 42319566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&flg)); 423228b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatType %s",((PetscObject)B)->type_name); 4233aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatReuse %d",(int)reuse); 4234ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42359566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am*bm+1,&i,a->i[am]*b->i[bm],&j)); 42369566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF,&newmat)); 42379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat,am*bm,an*bn,am*bm,an*bn)); 42389566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat,MATAIJ)); 4239ad7e164aSPierre Jolivet i[0] = 0; 4240ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4241ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4242ad7e164aSPierre Jolivet i[m*bm + p + 1] = i[m*bm + p] + (a->i[m+1] - a->i[m]) * (b->i[p+1] - b->i[p]); 4243ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4244ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4245ad7e164aSPierre Jolivet j[nnz++] = a->j[n]*bn + b->j[q]; 4246ad7e164aSPierre Jolivet } 4247ad7e164aSPierre Jolivet } 4248ad7e164aSPierre Jolivet } 4249ad7e164aSPierre Jolivet } 42509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat,i,j,NULL)); 4251ad7e164aSPierre Jolivet *C = newmat; 42529566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4253ad7e164aSPierre Jolivet nnz = 0; 4254ad7e164aSPierre Jolivet } 42559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C,&v)); 42569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 42579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 4258ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4259ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4260ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4261ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4262fff043a9SJunchao Zhang v[nnz++] = aa[n] * ba[q]; 4263ad7e164aSPierre Jolivet } 4264ad7e164aSPierre Jolivet } 4265ad7e164aSPierre Jolivet } 4266ad7e164aSPierre Jolivet } 42679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C,&v)); 42689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 42699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 4270ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4271ad7e164aSPierre Jolivet } 4272ad7e164aSPierre Jolivet 4273c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4274af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4275170fe5c8SBarry Smith 4276170fe5c8SBarry Smith /* 4277170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4278170fe5c8SBarry Smith 4279170fe5c8SBarry Smith n p p 42802da392ccSBarry Smith [ ] [ ] [ ] 42812da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42822da392ccSBarry Smith [ ] [ ] [ ] 4283170fe5c8SBarry Smith 4284170fe5c8SBarry Smith */ 4285170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4286170fe5c8SBarry Smith { 4287170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4288170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4289170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 429086214ceeSStefano Zampini PetscInt i,j,n,m,q,p; 4291170fe5c8SBarry Smith const PetscInt *ii,*idx; 4292170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4293170fe5c8SBarry Smith PetscScalar *c,*c_q; 429486214ceeSStefano Zampini PetscInt clda = sub_c->lda; 429586214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4296170fe5c8SBarry Smith 4297170fe5c8SBarry Smith PetscFunctionBegin; 4298d0f46423SBarry Smith m = A->rmap->n; 4299d0f46423SBarry Smith n = A->cmap->n; 4300d0f46423SBarry Smith p = B->cmap->n; 4301170fe5c8SBarry Smith a = sub_a->v; 4302170fe5c8SBarry Smith b = sub_b->a; 4303170fe5c8SBarry Smith c = sub_c->v; 430486214ceeSStefano Zampini if (clda == m) { 43059566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c,m*p)); 430686214ceeSStefano Zampini } else { 430786214ceeSStefano Zampini for (j=0;j<p;j++) 430886214ceeSStefano Zampini for (i=0;i<m;i++) 430986214ceeSStefano Zampini c[j*clda + i] = 0.0; 431086214ceeSStefano Zampini } 4311170fe5c8SBarry Smith ii = sub_b->i; 4312170fe5c8SBarry Smith idx = sub_b->j; 4313170fe5c8SBarry Smith for (i=0; i<n; i++) { 4314170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4315170fe5c8SBarry Smith while (q-->0) { 431686214ceeSStefano Zampini c_q = c + clda*(*idx); 431786214ceeSStefano Zampini a_q = a + alda*i; 4318854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4319170fe5c8SBarry Smith idx++; 4320170fe5c8SBarry Smith b++; 4321170fe5c8SBarry Smith } 4322170fe5c8SBarry Smith } 4323170fe5c8SBarry Smith PetscFunctionReturn(0); 4324170fe5c8SBarry Smith } 4325170fe5c8SBarry Smith 43264222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4327170fe5c8SBarry Smith { 4328d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 432986214ceeSStefano Zampini PetscBool cisdense; 4330170fe5c8SBarry Smith 4331170fe5c8SBarry Smith PetscFunctionBegin; 433208401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT,A->cmap->n,B->rmap->n); 43339566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,m,n,m,n)); 43349566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C,A,B)); 43359566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"")); 433686214ceeSStefano Zampini if (!cisdense) { 43379566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATDENSE)); 433886214ceeSStefano Zampini } 43399566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4340d73949e8SHong Zhang 43414222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4342170fe5c8SBarry Smith PetscFunctionReturn(0); 4343170fe5c8SBarry Smith } 4344170fe5c8SBarry Smith 4345170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 43460bad9183SKris Buschelman /*MC 4347fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43480bad9183SKris Buschelman based on compressed sparse row format. 43490bad9183SKris Buschelman 43500bad9183SKris Buschelman Options Database Keys: 43510bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43520bad9183SKris Buschelman 43530bad9183SKris Buschelman Level: beginner 43540bad9183SKris Buschelman 43550cd7f59aSBarry Smith Notes: 43560cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 43570cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43580cd7f59aSBarry Smith in the matrix 43590cd7f59aSBarry Smith 43600cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. In this no 43610cd7f59aSBarry Smith space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored 43620cd7f59aSBarry Smith 43630cd7f59aSBarry Smith Developer Notes: 43640cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 43650cd7f59aSBarry Smith 4366db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43670bad9183SKris Buschelman M*/ 43680bad9183SKris Buschelman 4369ccd284c7SBarry Smith /*MC 4370ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4371ccd284c7SBarry Smith 4372ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJ when constructed with a single process communicator, 4373ccd284c7SBarry Smith and MATMPIAIJ otherwise. As a result, for single process communicators, 4374ed73aabaSBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4375ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4376ccd284c7SBarry Smith the above preallocation routines for simplicity. 4377ccd284c7SBarry Smith 4378ccd284c7SBarry Smith Options Database Keys: 4379ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions() 4380ccd284c7SBarry Smith 438195452b02SPatrick Sanan Developer Notes: 4382ca9cdca7SRichard Tran Mills Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when 4383ccd284c7SBarry Smith enough exist. 4384ccd284c7SBarry Smith 4385ccd284c7SBarry Smith Level: beginner 4386ccd284c7SBarry Smith 4387db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4388ccd284c7SBarry Smith M*/ 4389ccd284c7SBarry Smith 4390ccd284c7SBarry Smith /*MC 4391ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4392ccd284c7SBarry Smith 4393ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4394ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4395ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4396ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4397ccd284c7SBarry Smith the above preallocation routines for simplicity. 4398ccd284c7SBarry Smith 4399ccd284c7SBarry Smith Options Database Keys: 4400ccd284c7SBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4401ccd284c7SBarry Smith 4402ccd284c7SBarry Smith Level: beginner 4403ccd284c7SBarry Smith 4404c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4405ccd284c7SBarry Smith M*/ 4406ccd284c7SBarry Smith 44077906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 44087906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 44097906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 44107906f579SHong Zhang #endif 4411d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4412d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*); 4413d24d4204SJose E. Roman #endif 44147906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 44157906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 44167906f579SHong Zhang #endif 44177906f579SHong Zhang 4418d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4419c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 44204222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 44217906f579SHong Zhang 44228c778c55SBarry Smith /*@C 44238f1ea47aSStefano Zampini MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored 44248c778c55SBarry Smith 44258c778c55SBarry Smith Not Collective 44268c778c55SBarry Smith 44278c778c55SBarry Smith Input Parameter: 4428579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 44298c778c55SBarry Smith 44308c778c55SBarry Smith Output Parameter: 44318c778c55SBarry Smith . array - pointer to the data 44328c778c55SBarry Smith 44338c778c55SBarry Smith Level: intermediate 44348c778c55SBarry Smith 4435db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44368c778c55SBarry Smith @*/ 44378c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 44388c778c55SBarry Smith { 4439d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44408c778c55SBarry Smith 44418c778c55SBarry Smith PetscFunctionBegin; 4442d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44439566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A,array)); 4444d67d9f35SJunchao Zhang } else { 4445d67d9f35SJunchao Zhang *array = aij->a; 4446d67d9f35SJunchao Zhang } 4447d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4448d67d9f35SJunchao Zhang } 4449d67d9f35SJunchao Zhang 4450d67d9f35SJunchao Zhang /*@C 4451d67d9f35SJunchao Zhang MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray() 4452d67d9f35SJunchao Zhang 4453d67d9f35SJunchao Zhang Not Collective 4454d67d9f35SJunchao Zhang 4455d67d9f35SJunchao Zhang Input Parameters: 4456d67d9f35SJunchao Zhang + mat - a MATSEQAIJ matrix 4457d67d9f35SJunchao Zhang - array - pointer to the data 4458d67d9f35SJunchao Zhang 4459d67d9f35SJunchao Zhang Level: intermediate 4460d67d9f35SJunchao Zhang 4461db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4462d67d9f35SJunchao Zhang @*/ 4463d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 4464d67d9f35SJunchao Zhang { 4465d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4466d67d9f35SJunchao Zhang 4467d67d9f35SJunchao Zhang PetscFunctionBegin; 4468d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44699566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A,array)); 4470d67d9f35SJunchao Zhang } else { 4471d67d9f35SJunchao Zhang *array = NULL; 4472d67d9f35SJunchao Zhang } 44739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44749566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44758c778c55SBarry Smith PetscFunctionReturn(0); 44768c778c55SBarry Smith } 44778c778c55SBarry Smith 447821e72a00SBarry Smith /*@C 44798f1ea47aSStefano Zampini MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini Not Collective 44828f1ea47aSStefano Zampini 44838f1ea47aSStefano Zampini Input Parameter: 44848f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44858f1ea47aSStefano Zampini 44868f1ea47aSStefano Zampini Output Parameter: 44878f1ea47aSStefano Zampini . array - pointer to the data 44888f1ea47aSStefano Zampini 44898f1ea47aSStefano Zampini Level: intermediate 44908f1ea47aSStefano Zampini 4491db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44928f1ea47aSStefano Zampini @*/ 44938f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 44948f1ea47aSStefano Zampini { 4495d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44968f1ea47aSStefano Zampini 44978f1ea47aSStefano Zampini PetscFunctionBegin; 4498d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44999566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A,array)); 4500d67d9f35SJunchao Zhang } else { 4501d67d9f35SJunchao Zhang *array = aij->a; 4502d67d9f35SJunchao Zhang } 45038f1ea47aSStefano Zampini PetscFunctionReturn(0); 45048f1ea47aSStefano Zampini } 45058f1ea47aSStefano Zampini 45068f1ea47aSStefano Zampini /*@C 45078f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 45088f1ea47aSStefano Zampini 45098f1ea47aSStefano Zampini Not Collective 45108f1ea47aSStefano Zampini 45118f1ea47aSStefano Zampini Input Parameter: 45128f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 45138f1ea47aSStefano Zampini 45148f1ea47aSStefano Zampini Output Parameter: 45158f1ea47aSStefano Zampini . array - pointer to the data 45168f1ea47aSStefano Zampini 45178f1ea47aSStefano Zampini Level: intermediate 45188f1ea47aSStefano Zampini 4519db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45208f1ea47aSStefano Zampini @*/ 45218f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 45228f1ea47aSStefano Zampini { 4523d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 45248f1ea47aSStefano Zampini 45258f1ea47aSStefano Zampini PetscFunctionBegin; 4526d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45279566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A,array)); 4528d67d9f35SJunchao Zhang } else { 4529d67d9f35SJunchao Zhang *array = NULL; 4530d67d9f35SJunchao Zhang } 4531d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4532d67d9f35SJunchao Zhang } 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang /*@C 4535d67d9f35SJunchao Zhang MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a MATSEQAIJ matrix is stored 4536d67d9f35SJunchao Zhang 4537d67d9f35SJunchao Zhang Not Collective 4538d67d9f35SJunchao Zhang 4539d67d9f35SJunchao Zhang Input Parameter: 4540d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4541d67d9f35SJunchao Zhang 4542d67d9f35SJunchao Zhang Output Parameter: 4543d67d9f35SJunchao Zhang . array - pointer to the data 4544d67d9f35SJunchao Zhang 4545d67d9f35SJunchao Zhang Level: intermediate 4546d67d9f35SJunchao Zhang 4547db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4548d67d9f35SJunchao Zhang @*/ 4549d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJGetArrayWrite(Mat A,PetscScalar **array) 4550d67d9f35SJunchao Zhang { 4551d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4552d67d9f35SJunchao Zhang 4553d67d9f35SJunchao Zhang PetscFunctionBegin; 4554d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45559566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A,array)); 4556d67d9f35SJunchao Zhang } else { 4557d67d9f35SJunchao Zhang *array = aij->a; 4558d67d9f35SJunchao Zhang } 45599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45609566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4561d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4562d67d9f35SJunchao Zhang } 4563d67d9f35SJunchao Zhang 4564d67d9f35SJunchao Zhang /*@C 4565d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4566d67d9f35SJunchao Zhang 4567d67d9f35SJunchao Zhang Not Collective 4568d67d9f35SJunchao Zhang 4569d67d9f35SJunchao Zhang Input Parameter: 4570d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4571d67d9f35SJunchao Zhang 4572d67d9f35SJunchao Zhang Output Parameter: 4573d67d9f35SJunchao Zhang . array - pointer to the data 4574d67d9f35SJunchao Zhang 4575d67d9f35SJunchao Zhang Level: intermediate 4576d67d9f35SJunchao Zhang 4577db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4578d67d9f35SJunchao Zhang @*/ 4579d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A,PetscScalar **array) 4580d67d9f35SJunchao Zhang { 4581d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4582d67d9f35SJunchao Zhang 4583d67d9f35SJunchao Zhang PetscFunctionBegin; 4584d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45859566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A,array)); 4586d67d9f35SJunchao Zhang } else { 4587d67d9f35SJunchao Zhang *array = NULL; 4588d67d9f35SJunchao Zhang } 45898f1ea47aSStefano Zampini PetscFunctionReturn(0); 45908f1ea47aSStefano Zampini } 45918f1ea47aSStefano Zampini 45928f1ea47aSStefano Zampini /*@C 45937ee59b9bSJunchao Zhang MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the SEQAIJ matrix 45947ee59b9bSJunchao Zhang 45957ee59b9bSJunchao Zhang Not Collective 45967ee59b9bSJunchao Zhang 45977ee59b9bSJunchao Zhang Input Parameter: 45987ee59b9bSJunchao Zhang . mat - a matrix of type MATSEQAIJ or its subclasses 45997ee59b9bSJunchao Zhang 46007ee59b9bSJunchao Zhang Output Parameters: 46017ee59b9bSJunchao Zhang + i - row map array of the matrix 46027ee59b9bSJunchao Zhang . j - column index array of the matrix 46037ee59b9bSJunchao Zhang . a - data array of the matrix 46047ee59b9bSJunchao Zhang - memtype - memory type of the arrays 46057ee59b9bSJunchao Zhang 46067ee59b9bSJunchao Zhang Notes: 46077ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 46087ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 46097ee59b9bSJunchao Zhang 46107ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 46117ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 46127ee59b9bSJunchao Zhang 46137ee59b9bSJunchao Zhang Level: Developer 46147ee59b9bSJunchao Zhang 4615db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 46167ee59b9bSJunchao Zhang @*/ 46177ee59b9bSJunchao Zhang PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat,const PetscInt **i,const PetscInt **j,PetscScalar **a,PetscMemType *mtype) 46187ee59b9bSJunchao Zhang { 46197ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 46207ee59b9bSJunchao Zhang 46217ee59b9bSJunchao Zhang PetscFunctionBegin; 46227ee59b9bSJunchao Zhang PetscCheck(mat->preallocated,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"matrix is not preallocated"); 46237ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46247ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat,i,j,a,mtype)); 46257ee59b9bSJunchao Zhang } else { 46267ee59b9bSJunchao Zhang if (i) *i = aij->i; 46277ee59b9bSJunchao Zhang if (j) *j = aij->j; 46287ee59b9bSJunchao Zhang if (a) *a = aij->a; 46297ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46307ee59b9bSJunchao Zhang } 46317ee59b9bSJunchao Zhang PetscFunctionReturn(0); 46327ee59b9bSJunchao Zhang } 46337ee59b9bSJunchao Zhang 46347ee59b9bSJunchao Zhang /*@C 463521e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 463621e72a00SBarry Smith 463721e72a00SBarry Smith Not Collective 463821e72a00SBarry Smith 463921e72a00SBarry Smith Input Parameter: 4640579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 464121e72a00SBarry Smith 464221e72a00SBarry Smith Output Parameter: 464321e72a00SBarry Smith . nz - the maximum number of nonzeros in any row 464421e72a00SBarry Smith 464521e72a00SBarry Smith Level: intermediate 464621e72a00SBarry Smith 4647db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 464821e72a00SBarry Smith @*/ 464921e72a00SBarry Smith PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz) 465021e72a00SBarry Smith { 465121e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 465221e72a00SBarry Smith 465321e72a00SBarry Smith PetscFunctionBegin; 465421e72a00SBarry Smith *nz = aij->rmax; 465521e72a00SBarry Smith PetscFunctionReturn(0); 465621e72a00SBarry Smith } 465721e72a00SBarry Smith 4658394ed5ebSJunchao Zhang PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, const PetscInt coo_i[], const PetscInt coo_j[]) 4659394ed5ebSJunchao Zhang { 4660394ed5ebSJunchao Zhang MPI_Comm comm; 4661394ed5ebSJunchao Zhang PetscInt *i,*j; 4662394ed5ebSJunchao Zhang PetscInt M,N,row; 4663394ed5ebSJunchao Zhang PetscCount k,p,q,nneg,nnz,start,end; /* Index the coo array, so use PetscCount as their type */ 4664394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4665394ed5ebSJunchao Zhang PetscInt *Aj; 4666394ed5ebSJunchao Zhang PetscScalar *Aa; 4667cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ*)(mat->data); 4668cbc6b225SStefano Zampini MatType rtype; 4669394ed5ebSJunchao Zhang PetscCount *perm,*jmap; 4670394ed5ebSJunchao Zhang 4671394ed5ebSJunchao Zhang PetscFunctionBegin; 46729566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46739566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat,&comm)); 46749566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&M,&N)); 46759566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(coo_n,&i,coo_n,&j)); 46769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(i,coo_i,coo_n)); /* Make a copy since we'll modify it */ 46779566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(j,coo_j,coo_n)); 46789566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n,&perm)); 4679394ed5ebSJunchao Zhang for (k=0; k<coo_n; k++) { /* Ignore entries with negative row or col indices */ 4680394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4681394ed5ebSJunchao Zhang perm[k] = k; 4682394ed5ebSJunchao Zhang } 4683394ed5ebSJunchao Zhang 4684394ed5ebSJunchao Zhang /* Sort by row */ 46859566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n,i,j,perm)); 4686394ed5ebSJunchao Zhang for (k=0; k<coo_n; k++) {if (i[k] >= 0) break;} /* Advance k to the first row with a non-negative index */ 4687394ed5ebSJunchao Zhang nneg = k; 46889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg+1,&jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4689394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4690394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4691394ed5ebSJunchao Zhang 46929566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M+1,&Ai)); /* CSR of A */ 46939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg,&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4694394ed5ebSJunchao Zhang 4695394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4696394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4697394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4698394ed5ebSJunchao Zhang while (k<coo_n) { 4699394ed5ebSJunchao Zhang row = i[k]; 4700394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4701394ed5ebSJunchao Zhang while (k<coo_n && i[k] == row) k++; 4702394ed5ebSJunchao Zhang end = k; 47039566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end-start,j+start,perm+start)); 4704394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4705394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4706394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4707394ed5ebSJunchao Zhang Ai[row] = 1; 4708394ed5ebSJunchao Zhang nnz++; 4709394ed5ebSJunchao Zhang 4710394ed5ebSJunchao Zhang for (p=start+1; p<end; p++) { /* Scan remaining nonzero in this row */ 4711394ed5ebSJunchao Zhang if (j[p] != j[p-1]) { /* Meet a new nonzero */ 4712394ed5ebSJunchao Zhang q++; 4713394ed5ebSJunchao Zhang jmap[q] = 1; 4714394ed5ebSJunchao Zhang Aj[q] = j[p]; 4715394ed5ebSJunchao Zhang Ai[row]++; 4716394ed5ebSJunchao Zhang nnz++; 4717394ed5ebSJunchao Zhang } else { 4718394ed5ebSJunchao Zhang jmap[q]++; 4719394ed5ebSJunchao Zhang } 4720394ed5ebSJunchao Zhang } 4721394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4722394ed5ebSJunchao Zhang } 47239566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4724394ed5ebSJunchao Zhang 4725394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4726394ed5ebSJunchao Zhang for (k=0; k<M; k++) Ai[k+1] += Ai[k]; 4727394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4728394ed5ebSJunchao Zhang jmap[0] = 0; 4729394ed5ebSJunchao Zhang for (k=0; k<nnz; k++) jmap[k+1] += jmap[k]; 4730394ed5ebSJunchao Zhang if (nnz < coo_n-nneg) { /* Realloc with actual number of unique nonzeros */ 4731394ed5ebSJunchao Zhang PetscCount *jmap_new; 4732394ed5ebSJunchao Zhang PetscInt *Aj_new; 4733394ed5ebSJunchao Zhang 47349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz+1,&jmap_new)); 47359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new,jmap,nnz+1)); 47369566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4737394ed5ebSJunchao Zhang jmap = jmap_new; 4738394ed5ebSJunchao Zhang 47399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz,&Aj_new)); 47409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new,Aj,nnz)); 47419566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4742394ed5ebSJunchao Zhang Aj = Aj_new; 4743394ed5ebSJunchao Zhang } 4744394ed5ebSJunchao Zhang 4745394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4746394ed5ebSJunchao Zhang PetscCount *perm_new; 4747cbc6b225SStefano Zampini 47489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n-nneg,&perm_new)); 47499566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new,perm+nneg,coo_n-nneg)); 47509566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4751394ed5ebSJunchao Zhang perm = perm_new; 4752394ed5ebSJunchao Zhang } 4753394ed5ebSJunchao Zhang 47549566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat,&rtype)); 47559566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz,&Aa)); /* Zero the matrix */ 47569566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF,M,N,Ai,Aj,Aa,rtype,mat)); 4757394ed5ebSJunchao Zhang 4758394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4759394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4760394ed5ebSJunchao Zhang /* Record COO fields */ 4761394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4762394ed5ebSJunchao Zhang seqaij->Atot = coo_n-nneg; /* Annz is seqaij->nz, so no need to record that again */ 4763394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4764394ed5ebSJunchao Zhang seqaij->perm = perm; 4765394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4766394ed5ebSJunchao Zhang } 4767394ed5ebSJunchao Zhang 4768394ed5ebSJunchao Zhang static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A,const PetscScalar v[],InsertMode imode) 4769394ed5ebSJunchao Zhang { 4770394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ*)A->data; 4771394ed5ebSJunchao Zhang PetscCount i,j,Annz = aseq->nz; 4772394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm,*jmap = aseq->jmap; 4773394ed5ebSJunchao Zhang PetscScalar *Aa; 4774394ed5ebSJunchao Zhang 4775394ed5ebSJunchao Zhang PetscFunctionBegin; 47769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&Aa)); 4777394ed5ebSJunchao Zhang for (i=0; i<Annz; i++) { 4778b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4779b6c38306SJunchao Zhang for (j=jmap[i]; j<jmap[i+1]; j++) sum += v[perm[j]]; 4780b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES? 0.0 : Aa[i]) + sum; 4781394ed5ebSJunchao Zhang } 47829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&Aa)); 4783394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4784394ed5ebSJunchao Zhang } 4785394ed5ebSJunchao Zhang 478634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47875063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat,MatType,MatReuse,Mat*); 478802fe1965SBarry Smith #endif 47893d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47905063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat,MatType,MatReuse,Mat*); 47913d0639e7SStefano Zampini #endif 479202fe1965SBarry Smith 47938cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4794273d9f13SBarry Smith { 4795273d9f13SBarry Smith Mat_SeqAIJ *b; 479638baddfdSBarry Smith PetscMPIInt size; 4797273d9f13SBarry Smith 4798273d9f13SBarry Smith PetscFunctionBegin; 47999566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B),&size)); 480008401ef6SPierre Jolivet PetscCheck(size <= 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4801273d9f13SBarry Smith 48029566063dSJacob Faibussowitsch PetscCall(PetscNewLog(B,&b)); 48032205254eSKarl Rupp 4804b0a32e0cSBarry Smith B->data = (void*)b; 48052205254eSKarl Rupp 48069566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps))); 4807071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48082205254eSKarl Rupp 4809f4259b30SLisandro Dalcin b->row = NULL; 4810f4259b30SLisandro Dalcin b->col = NULL; 4811f4259b30SLisandro Dalcin b->icol = NULL; 4812b810aeb4SBarry Smith b->reallocs = 0; 481336db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4814f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4815416022c9SBarry Smith b->nonew = 0; 4816f4259b30SLisandro Dalcin b->diag = NULL; 4817f4259b30SLisandro Dalcin b->solve_work = NULL; 4818f4259b30SLisandro Dalcin B->spptr = NULL; 4819f4259b30SLisandro Dalcin b->saved_values = NULL; 4820f4259b30SLisandro Dalcin b->idiag = NULL; 4821f4259b30SLisandro Dalcin b->mdiag = NULL; 4822f4259b30SLisandro Dalcin b->ssor_work = NULL; 482371f1c65dSBarry Smith b->omega = 1.0; 482471f1c65dSBarry Smith b->fshift = 0.0; 482571f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4826bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4827a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 482817ab2063SBarry Smith 48299566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 4830b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 48319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ)); 48329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ)); 4833b3866ffcSBarry Smith #endif 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ)); 48359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ)); 48369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ)); 48379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ)); 48389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ)); 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM)); 48409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL)); 48419779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL)); 4843191b95cbSRichard Tran Mills #endif 484434b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",MatProductSetFromOptions_SeqAIJ)); 484802fe1965SBarry Smith #endif 48493d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijkokkos_C",MatConvert_SeqAIJ_SeqAIJKokkos)); 48513d0639e7SStefano Zampini #endif 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL)); 4853af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental)); 4855af8000cdSHong Zhang #endif 4856d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_scalapack_C",MatConvert_AIJ_ScaLAPACK)); 4858d24d4204SJose E. Roman #endif 485963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE)); 48619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ)); 486263c07aadSStefano Zampini #endif 48639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense)); 48649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL)); 48659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS)); 48669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ)); 48679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ)); 48689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ)); 48699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ)); 48709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ)); 48729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ)); 48739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ)); 48749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJKron_C",MatSeqAIJKron_SeqAIJ)); 48769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_SeqAIJ)); 48779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_SeqAIJ)); 48789566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48799566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 48809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48813a40ed3dSBarry Smith PetscFunctionReturn(0); 488217ab2063SBarry Smith } 488317ab2063SBarry Smith 4884b24902e0SBarry Smith /* 4885b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4886b24902e0SBarry Smith */ 4887ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 488817ab2063SBarry Smith { 48892a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data,*a = (Mat_SeqAIJ*)A->data; 4890071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 489117ab2063SBarry Smith 48923a40ed3dSBarry Smith PetscFunctionBegin; 4893aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot duplicate unassembled matrix"); 4894273d9f13SBarry Smith 4895d5f3da31SBarry Smith C->factortype = A->factortype; 4896f4259b30SLisandro Dalcin c->row = NULL; 4897f4259b30SLisandro Dalcin c->col = NULL; 4898f4259b30SLisandro Dalcin c->icol = NULL; 48996ad4291fSHong Zhang c->reallocs = 0; 490017ab2063SBarry Smith 490169272f91SPierre Jolivet C->assembled = A->assembled; 490269272f91SPierre Jolivet C->preallocated = A->preallocated; 490317ab2063SBarry Smith 490469272f91SPierre Jolivet if (A->preallocated) { 49059566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap,&C->rmap)); 49069566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap,&C->cmap)); 4907eec197d1SBarry Smith 49089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->imax)); 49099566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt))); 49109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->ilen)); 49119566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt))); 49129566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt))); 491317ab2063SBarry Smith 491417ab2063SBarry Smith /* allocate the matrix space */ 4915f77e22a1SHong Zhang if (mallocmatspace) { 49169566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i)); 49179566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt))); 49182205254eSKarl Rupp 4919f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 49202205254eSKarl Rupp 49219566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i,a->i,m+1)); 492217ab2063SBarry Smith if (m > 0) { 49239566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j,a->j,a->i[m])); 4924be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49252e5835c6SStefano Zampini const PetscScalar *aa; 49262e5835c6SStefano Zampini 49279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 49289566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a,aa,a->i[m])); 49299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 4930be6bf707SBarry Smith } else { 49319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a,a->i[m])); 493217ab2063SBarry Smith } 493308480c60SBarry Smith } 4934f77e22a1SHong Zhang } 493517ab2063SBarry Smith 49366ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4937416022c9SBarry Smith c->roworiented = a->roworiented; 4938416022c9SBarry Smith c->nonew = a->nonew; 4939416022c9SBarry Smith if (a->diag) { 49409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&c->diag)); 49419566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt))); 49429566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt))); 4943071fcb05SBarry Smith } else c->diag = NULL; 49442205254eSKarl Rupp 4945f4259b30SLisandro Dalcin c->solve_work = NULL; 4946f4259b30SLisandro Dalcin c->saved_values = NULL; 4947f4259b30SLisandro Dalcin c->idiag = NULL; 4948f4259b30SLisandro Dalcin c->ssor_work = NULL; 4949a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4950e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4951e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49526ad4291fSHong Zhang 4953893ad86cSHong Zhang c->rmax = a->rmax; 4954416022c9SBarry Smith c->nz = a->nz; 49558ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4956754ec7b1SSatish Balay 49576ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49586ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4959cd6b891eSBarry Smith if (a->compressedrow.use) { 49606ad4291fSHong Zhang i = a->compressedrow.nrows; 49619566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex)); 49629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1)); 49639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i)); 496427ea64f8SHong Zhang } else { 496527ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49660298fd71SBarry Smith c->compressedrow.i = NULL; 49670298fd71SBarry Smith c->compressedrow.rindex = NULL; 49686ad4291fSHong Zhang } 4969ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4970e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49714846f1f5SKris Buschelman 49729566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C)); 497369272f91SPierre Jolivet } 49749566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist)); 49753a40ed3dSBarry Smith PetscFunctionReturn(0); 497617ab2063SBarry Smith } 497717ab2063SBarry Smith 4978b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4979b24902e0SBarry Smith { 4980b24902e0SBarry Smith PetscFunctionBegin; 49819566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 49829566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n)); 4983cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 49849566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 4985cfd3f464SBarry Smith } 49869566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 49879566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE)); 4988b24902e0SBarry Smith PetscFunctionReturn(0); 4989b24902e0SBarry Smith } 4990b24902e0SBarry Smith 4991112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4992fbdbba38SShri Abhyankar { 499352f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 499452f91c60SVaclav Hapla 499552f91c60SVaclav Hapla PetscFunctionBegin; 499652f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 499752f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4998c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49999566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 50019566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5)); 500252f91c60SVaclav Hapla if (isbinary) { 50039566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat,viewer)); 500452f91c60SVaclav Hapla } else if (ishdf5) { 500552f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50069566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat,viewer)); 500752f91c60SVaclav Hapla #else 500852f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 500952f91c60SVaclav Hapla #endif 501052f91c60SVaclav Hapla } else { 501198921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 501252f91c60SVaclav Hapla } 501352f91c60SVaclav Hapla PetscFunctionReturn(0); 501452f91c60SVaclav Hapla } 501552f91c60SVaclav Hapla 50163ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 501752f91c60SVaclav Hapla { 50183ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 50193ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 5020fbdbba38SShri Abhyankar 5021fbdbba38SShri Abhyankar PetscFunctionBegin; 50229566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5023bbead8a2SBarry Smith 50243ea6fe3dSLisandro Dalcin /* read in matrix header */ 50259566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT)); 502608401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 5027fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 502808401ef6SPierre Jolivet PetscCheck(M >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%" PetscInt_FMT ") in file is negative",M); 502908401ef6SPierre Jolivet PetscCheck(N >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%" PetscInt_FMT ") in file is negative",N); 503008401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 5031fbdbba38SShri Abhyankar 50323ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50339566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat,viewer)); 50343ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50353ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50363ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50373ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50383ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50399566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50409566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50413ea6fe3dSLisandro Dalcin 50423ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50439566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 5044aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50453ea6fe3dSLisandro Dalcin 5046fbdbba38SShri Abhyankar /* read in row lengths */ 50479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M,&rowlens)); 50489566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT)); 50493ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50503ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 505108401ef6SPierre Jolivet PetscCheck(sum == nz,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT,nz,sum); 50523ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens)); 50549566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 5055aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50563ea6fe3dSLisandro Dalcin /* store row lengths */ 50579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen,rowlens,M)); 50589566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5059fbdbba38SShri Abhyankar 50603ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50613ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 50623ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50639566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT)); 50643ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR)); 5066fbdbba38SShri Abhyankar 50679566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY)); 50689566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); 5069fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5070fbdbba38SShri Abhyankar } 5071fbdbba38SShri Abhyankar 5072ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 50737264ac53SSatish Balay { 50747264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 5075fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 5076eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5077eeffb40dSHong Zhang PetscInt k; 5078eeffb40dSHong Zhang #endif 50797264ac53SSatish Balay 50803a40ed3dSBarry Smith PetscFunctionBegin; 5081bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5082d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 5083ca44d042SBarry Smith *flg = PETSC_FALSE; 5084ca44d042SBarry Smith PetscFunctionReturn(0); 5085bcd2baecSBarry Smith } 50867264ac53SSatish Balay 50877264ac53SSatish Balay /* if the a->i are the same */ 50889566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i,b->i,A->rmap->n+1,flg)); 5089abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50907264ac53SSatish Balay 50917264ac53SSatish Balay /* if a->j are the same */ 50929566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j,b->j,a->nz,flg)); 5093abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5094bcd2baecSBarry Smith 50959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 50969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 5097bcd2baecSBarry Smith /* if a->a are the same */ 5098eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5099eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 5100fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5101eeffb40dSHong Zhang *flg = PETSC_FALSE; 51023a40ed3dSBarry Smith PetscFunctionReturn(0); 5103eeffb40dSHong Zhang } 5104eeffb40dSHong Zhang } 5105eeffb40dSHong Zhang #else 51069566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa,ba,a->nz,flg)); 5107eeffb40dSHong Zhang #endif 51089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 51099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 5110eeffb40dSHong Zhang PetscFunctionReturn(0); 51117264ac53SSatish Balay } 511236db0b34SBarry Smith 511305869f15SSatish Balay /*@ 511436db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 511536db0b34SBarry Smith provided by the user. 511636db0b34SBarry Smith 5117d083f849SBarry Smith Collective 511836db0b34SBarry Smith 511936db0b34SBarry Smith Input Parameters: 512036db0b34SBarry Smith + comm - must be an MPI communicator of size 1 512136db0b34SBarry Smith . m - number of rows 512236db0b34SBarry Smith . n - number of columns 5123483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 512436db0b34SBarry Smith . j - column indices 512536db0b34SBarry Smith - a - matrix values 512636db0b34SBarry Smith 512736db0b34SBarry Smith Output Parameter: 512836db0b34SBarry Smith . mat - the matrix 512936db0b34SBarry Smith 513036db0b34SBarry Smith Level: intermediate 513136db0b34SBarry Smith 513236db0b34SBarry Smith Notes: 51330551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5134292fb18eSBarry Smith once the matrix is destroyed and not before 513536db0b34SBarry Smith 513636db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 513736db0b34SBarry Smith 5138bfeeae90SHong Zhang The i and j indices are 0 based 513936db0b34SBarry Smith 5140a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5141a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51428eef79e4SBarry Smith as shown 5143a4552177SSatish Balay 51448eef79e4SBarry Smith $ 1 0 0 51458eef79e4SBarry Smith $ 2 0 3 51468eef79e4SBarry Smith $ 4 5 6 51478eef79e4SBarry Smith $ 51488eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51498eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51508eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5151a4552177SSatish Balay 5152db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 515336db0b34SBarry Smith 515436db0b34SBarry Smith @*/ 5155c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 515636db0b34SBarry Smith { 5157cbcfb4deSHong Zhang PetscInt ii; 515836db0b34SBarry Smith Mat_SeqAIJ *aij; 5159cbcfb4deSHong Zhang PetscInt jj; 516036db0b34SBarry Smith 516136db0b34SBarry Smith PetscFunctionBegin; 5162aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 51639566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 51649566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 51659566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51669566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 51679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,NULL)); 5168ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 51699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->imax)); 51709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->ilen)); 5171ab93d7beSBarry Smith 517236db0b34SBarry Smith aij->i = i; 517336db0b34SBarry Smith aij->j = j; 517436db0b34SBarry Smith aij->a = a; 517536db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 517636db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5177e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5178e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 517936db0b34SBarry Smith 5180cbc6b225SStefano Zampini for (ii=0,aij->nonzerorowcnt=0,aij->rmax=0; ii<m; ii++) { 518136db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 518276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5183aed4548fSBarry Smith PetscCheck(i[ii+1] - i[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT,ii,i[ii+1] - i[ii]); 51849985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 518508401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted",jj-i[ii],j[jj],ii); 518608401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry",jj-i[ii],j[jj],ii); 51879985e31cSBarry Smith } 518836db0b34SBarry Smith } 518976bd3646SJed Brown } 519076bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 519136db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 519208401ef6SPierre Jolivet PetscCheck(j[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 5193aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 519436db0b34SBarry Smith } 519576bd3646SJed Brown } 519636db0b34SBarry Smith 51979566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 51989566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 519936db0b34SBarry Smith PetscFunctionReturn(0); 520036db0b34SBarry Smith } 5201cbc6b225SStefano Zampini 5202f62e3866SBarry Smith /*@ 5203d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 52048a0b0e6bSVictor Minden provided by the user. 52058a0b0e6bSVictor Minden 5206d083f849SBarry Smith Collective 52078a0b0e6bSVictor Minden 52088a0b0e6bSVictor Minden Input Parameters: 52098a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52108a0b0e6bSVictor Minden . m - number of rows 52118a0b0e6bSVictor Minden . n - number of columns 52128a0b0e6bSVictor Minden . i - row indices 52138a0b0e6bSVictor Minden . j - column indices 52141230e6d1SVictor Minden . a - matrix values 52151230e6d1SVictor Minden . nz - number of nonzeros 5216f62e3866SBarry Smith - idx - if the i and j indices start with 1 use PETSC_TRUE otherwise use PETSC_FALSE 52178a0b0e6bSVictor Minden 52188a0b0e6bSVictor Minden Output Parameter: 52198a0b0e6bSVictor Minden . mat - the matrix 52208a0b0e6bSVictor Minden 52218a0b0e6bSVictor Minden Level: intermediate 52228a0b0e6bSVictor Minden 5223f62e3866SBarry Smith Example: 5224f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52259e99939fSJunchao Zhang .vb 52268a0b0e6bSVictor Minden 1 0 0 52278a0b0e6bSVictor Minden 2 0 3 52288a0b0e6bSVictor Minden 4 5 6 52298a0b0e6bSVictor Minden 52308a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52318a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52328a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52339e99939fSJunchao Zhang .ve 52348a0b0e6bSVictor Minden 5235db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()` 52368a0b0e6bSVictor Minden 52378a0b0e6bSVictor Minden @*/ 5238c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 52398a0b0e6bSVictor Minden { 5240d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 52418a0b0e6bSVictor Minden 52428a0b0e6bSVictor Minden PetscFunctionBegin; 52439566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m,&nnz)); 52441230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 5245c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 52461230e6d1SVictor Minden } 52479566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 52489566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 52499566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 52509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz)); 52511230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52521230e6d1SVictor Minden if (idx) { 52531230e6d1SVictor Minden row = i[ii] - 1; 52541230e6d1SVictor Minden col = j[ii] - 1; 52551230e6d1SVictor Minden } else { 52561230e6d1SVictor Minden row = i[ii]; 52571230e6d1SVictor Minden col = j[ii]; 52588a0b0e6bSVictor Minden } 52599566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES)); 52608a0b0e6bSVictor Minden } 52619566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 52629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 52639566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52648a0b0e6bSVictor Minden PetscFunctionReturn(0); 52658a0b0e6bSVictor Minden } 526636db0b34SBarry Smith 5267acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5268acf2f550SJed Brown { 5269acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 5270acf2f550SJed Brown 5271acf2f550SJed Brown PetscFunctionBegin; 5272acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5273acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52742205254eSKarl Rupp 52759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5276acf2f550SJed Brown PetscFunctionReturn(0); 5277acf2f550SJed Brown } 5278acf2f550SJed Brown 52799c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 52809c8f2541SHong Zhang { 52818761c3d6SHong Zhang PetscMPIInt size; 52829c8f2541SHong Zhang 52839c8f2541SHong Zhang PetscFunctionBegin; 52849566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm,&size)); 52857bbdc51dSHong Zhang if (size == 1) { 52867bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 52879566063dSJacob Faibussowitsch PetscCall(MatDuplicate(inmat,MAT_COPY_VALUES,outmat)); 52887bbdc51dSHong Zhang } else { 52899566063dSJacob Faibussowitsch PetscCall(MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN)); 52907bbdc51dSHong Zhang } 52918761c3d6SHong Zhang } else { 52929566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat)); 52938761c3d6SHong Zhang } 52949c8f2541SHong Zhang PetscFunctionReturn(0); 52959c8f2541SHong Zhang } 52969c8f2541SHong Zhang 529781824310SBarry Smith /* 529853dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 529953dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 530053dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 530153dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 530253dd7562SDmitry Karpeev */ 530353dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 530453dd7562SDmitry Karpeev { 530553dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 530653dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 530753dd7562SDmitry Karpeev PetscBool seqaij; 530853dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 530953dd7562SDmitry Karpeev PetscScalar v; 531053dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 531153dd7562SDmitry Karpeev 531253dd7562SDmitry Karpeev PetscFunctionBegin; 531353dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 531453dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 53159566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij)); 531628b400f6SJacob Faibussowitsch PetscCheck(seqaij,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 531753dd7562SDmitry Karpeev if (rowemb) { 53189566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb,&m)); 531908401ef6SPierre Jolivet PetscCheck(m == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT,m,B->rmap->n); 532053dd7562SDmitry Karpeev } else { 532108401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 532253dd7562SDmitry Karpeev } 532353dd7562SDmitry Karpeev if (colemb) { 53249566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb,&n)); 532508401ef6SPierre Jolivet PetscCheck(n == B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT,n,B->cmap->n); 532653dd7562SDmitry Karpeev } else { 532708401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 532853dd7562SDmitry Karpeev } 532953dd7562SDmitry Karpeev 533053dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 533153dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&nz)); 533353dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 533453dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 533553dd7562SDmitry Karpeev } 53369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C,0,nz)); 53379566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 533853dd7562SDmitry Karpeev } 533953dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 53409566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(C)); 534153dd7562SDmitry Karpeev } 534253dd7562SDmitry Karpeev count = 0; 534353dd7562SDmitry Karpeev rowindices = NULL; 534453dd7562SDmitry Karpeev colindices = NULL; 534553dd7562SDmitry Karpeev if (rowemb) { 53469566063dSJacob Faibussowitsch PetscCall(ISGetIndices(rowemb,&rowindices)); 534753dd7562SDmitry Karpeev } 534853dd7562SDmitry Karpeev if (colemb) { 53499566063dSJacob Faibussowitsch PetscCall(ISGetIndices(colemb,&colindices)); 535053dd7562SDmitry Karpeev } 535153dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 535253dd7562SDmitry Karpeev PetscInt row; 535353dd7562SDmitry Karpeev row = i; 535453dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 535553dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 535653dd7562SDmitry Karpeev PetscInt col; 535753dd7562SDmitry Karpeev col = Baij->j[count]; 535853dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 535953dd7562SDmitry Karpeev v = Baij->a[count]; 53609566063dSJacob Faibussowitsch PetscCall(MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES)); 536153dd7562SDmitry Karpeev ++count; 536253dd7562SDmitry Karpeev } 536353dd7562SDmitry Karpeev } 536453dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 536553dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 536653dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 536753dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 536853dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 536953dd7562SDmitry Karpeev PetscFunctionReturn(0); 537053dd7562SDmitry Karpeev } 537153dd7562SDmitry Karpeev 53724099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53734099cc6bSBarry Smith 53744099cc6bSBarry Smith /*@C 53754099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 53764099cc6bSBarry Smith 53774099cc6bSBarry Smith Collective on Mat 53784099cc6bSBarry Smith 53794099cc6bSBarry Smith Input Parameters: 53804099cc6bSBarry Smith + mat - the matrix object 53814099cc6bSBarry Smith - matype - matrix type 53824099cc6bSBarry Smith 53834099cc6bSBarry Smith Options Database Key: 53844099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 53854099cc6bSBarry Smith 53864099cc6bSBarry Smith Level: intermediate 53874099cc6bSBarry Smith 5388db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53894099cc6bSBarry Smith @*/ 53904099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 53914099cc6bSBarry Smith { 53924099cc6bSBarry Smith PetscBool sametype; 53935f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat,MatType,MatReuse,Mat*); 53944099cc6bSBarry Smith 53954099cc6bSBarry Smith PetscFunctionBegin; 53964099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 53979566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat,matype,&sametype)); 53984099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53994099cc6bSBarry Smith 54009566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList,matype,&r)); 54015f80ce2aSJacob Faibussowitsch PetscCheck(r,PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 54029566063dSJacob Faibussowitsch PetscCall((*r)(mat,matype,MAT_INPLACE_MATRIX,&mat)); 54034099cc6bSBarry Smith PetscFunctionReturn(0); 54044099cc6bSBarry Smith } 54054099cc6bSBarry Smith 54064099cc6bSBarry Smith /*@C 54074099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 54084099cc6bSBarry Smith 54094099cc6bSBarry Smith Not Collective 54104099cc6bSBarry Smith 54114099cc6bSBarry Smith Input Parameters: 54124099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 54134099cc6bSBarry Smith - function - routine to convert to subtype 54144099cc6bSBarry Smith 54154099cc6bSBarry Smith Notes: 54164099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 54174099cc6bSBarry Smith 54184099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54194099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54204099cc6bSBarry Smith 54214099cc6bSBarry Smith Level: advanced 54224099cc6bSBarry Smith 5423db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 54244099cc6bSBarry Smith 54254099cc6bSBarry Smith Level: advanced 54264099cc6bSBarry Smith @*/ 5427388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 54284099cc6bSBarry Smith { 54294099cc6bSBarry Smith PetscFunctionBegin; 54309566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54319566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList,sname,function)); 54324099cc6bSBarry Smith PetscFunctionReturn(0); 54334099cc6bSBarry Smith } 54344099cc6bSBarry Smith 54354099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54364099cc6bSBarry Smith 54374099cc6bSBarry Smith /*@C 54384099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 54394099cc6bSBarry Smith 54404099cc6bSBarry Smith Not Collective 54414099cc6bSBarry Smith 54424099cc6bSBarry Smith Level: advanced 54434099cc6bSBarry Smith 5444db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 54454099cc6bSBarry Smith @*/ 54464099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 54474099cc6bSBarry Smith { 54484099cc6bSBarry Smith PetscFunctionBegin; 54494099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 54504099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54514099cc6bSBarry Smith 54529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54559779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5457485f9817SRichard Tran Mills #endif 54585063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54605063d097SStefano Zampini #endif 54615063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54635063d097SStefano Zampini #endif 54644099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54664099cc6bSBarry Smith #endif 54674099cc6bSBarry Smith PetscFunctionReturn(0); 54684099cc6bSBarry Smith } 546953dd7562SDmitry Karpeev 547053dd7562SDmitry Karpeev /* 547181824310SBarry Smith Special version for direct calls from Fortran 547281824310SBarry Smith */ 5473af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 547481824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 547581824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 547681824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 547781824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 547881824310SBarry Smith #endif 547981824310SBarry Smith 548081824310SBarry Smith /* Change these macros so can be used in void function */ 548198921bdaSJacob Faibussowitsch 548298921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54839566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54849566063dSJacob Faibussowitsch #undef PetscCall 54859566063dSJacob Faibussowitsch #define PetscCall(...) do { \ 54865f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 548798921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 548898921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr_msv_mpiaij,PETSC_ERROR_REPEAT," "); \ 548998921bdaSJacob Faibussowitsch return; \ 549098921bdaSJacob Faibussowitsch } \ 549198921bdaSJacob Faibussowitsch } while (0) 549298921bdaSJacob Faibussowitsch 549398921bdaSJacob Faibussowitsch #undef SETERRQ 549498921bdaSJacob Faibussowitsch #define SETERRQ(comm,ierr,...) do { \ 549598921bdaSJacob Faibussowitsch *_ierr = PetscError(comm,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr,PETSC_ERROR_INITIAL,__VA_ARGS__); \ 549698921bdaSJacob Faibussowitsch return; \ 549798921bdaSJacob Faibussowitsch } while (0) 549881824310SBarry Smith 549919caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 550081824310SBarry Smith { 550181824310SBarry Smith Mat A = *AA; 550281824310SBarry Smith PetscInt m = *mm, n = *nn; 550381824310SBarry Smith InsertMode is = *isis; 550481824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 550581824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 550681824310SBarry Smith PetscInt *imax,*ai,*ailen; 550781824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 550854f21887SBarry Smith MatScalar *ap,value,*aa; 5509ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5510ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 551181824310SBarry Smith 551281824310SBarry Smith PetscFunctionBegin; 55134994cf47SJed Brown MatCheckPreallocated(A,1); 551481824310SBarry Smith imax = a->imax; 551581824310SBarry Smith ai = a->i; 551681824310SBarry Smith ailen = a->ilen; 551781824310SBarry Smith aj = a->j; 551881824310SBarry Smith aa = a->a; 551981824310SBarry Smith 552081824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 552181824310SBarry Smith row = im[k]; 552281824310SBarry Smith if (row < 0) continue; 55235f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 552481824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 552581824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 552681824310SBarry Smith low = 0; 552781824310SBarry Smith high = nrow; 552881824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 552981824310SBarry Smith if (in[l] < 0) continue; 55305f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 553181824310SBarry Smith col = in[l]; 55322205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 55332205254eSKarl Rupp else value = v[k + l*m]; 55342205254eSKarl Rupp 553581824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 553681824310SBarry Smith 55372205254eSKarl Rupp if (col <= lastcol) low = 0; 55382205254eSKarl Rupp else high = nrow; 553981824310SBarry Smith lastcol = col; 554081824310SBarry Smith while (high-low > 5) { 554181824310SBarry Smith t = (low+high)/2; 554281824310SBarry Smith if (rp[t] > col) high = t; 554381824310SBarry Smith else low = t; 554481824310SBarry Smith } 554581824310SBarry Smith for (i=low; i<high; i++) { 554681824310SBarry Smith if (rp[i] > col) break; 554781824310SBarry Smith if (rp[i] == col) { 554881824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 554981824310SBarry Smith else ap[i] = value; 555081824310SBarry Smith goto noinsert; 555181824310SBarry Smith } 555281824310SBarry Smith } 555381824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 555481824310SBarry Smith if (nonew == 1) goto noinsert; 55555f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 5556fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 555781824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 555881824310SBarry Smith /* shift up all the later entries in this row */ 555981824310SBarry Smith for (ii=N; ii>=i; ii--) { 556081824310SBarry Smith rp[ii+1] = rp[ii]; 556181824310SBarry Smith ap[ii+1] = ap[ii]; 556281824310SBarry Smith } 556381824310SBarry Smith rp[i] = col; 556481824310SBarry Smith ap[i] = value; 5565e56f5c9eSBarry Smith A->nonzerostate++; 556681824310SBarry Smith noinsert:; 556781824310SBarry Smith low = i + 1; 556881824310SBarry Smith } 556981824310SBarry Smith ailen[row] = nrow; 557081824310SBarry Smith } 557181824310SBarry Smith PetscFunctionReturnVoid(); 557281824310SBarry Smith } 557398921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 557498921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 557598921bdaSJacob Faibussowitsch * original definitions */ 55769566063dSJacob Faibussowitsch #undef PetscCall 557798921bdaSJacob Faibussowitsch #undef SETERRQ 5578