1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 114099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 124099cc6bSBarry Smith { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A,type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24857cbf51SRichard Tran Mills PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A,PetscInt type,PetscReal *reductions) 250716a85fSBarry Smith { 260716a85fSBarry Smith PetscInt i,m,n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&m,&n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions,n)); 320716a85fSBarry Smith if (type == NORM_2) { 330716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 34a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 350716a85fSBarry Smith } 360716a85fSBarry Smith } else if (type == NORM_1) { 370716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 38a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 
390716a85fSBarry Smith } 400716a85fSBarry Smith } else if (type == NORM_INFINITY) { 410716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 42a873a8cdSSam Reynolds reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),reductions[aij->j[i]]); 430716a85fSBarry Smith } 44857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 45a873a8cdSSam Reynolds for (i=0; i<aij->i[m]; i++) { 46857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 47a873a8cdSSam Reynolds } 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49857cbf51SRichard Tran Mills for (i=0; i<aij->i[m]; i++) { 50857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 51857cbf51SRichard Tran Mills } 52857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown reduction type"); 530716a85fSBarry Smith 540716a85fSBarry Smith if (type == NORM_2) { 55a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 56857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 57a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] /= m; 580716a85fSBarry Smith } 590716a85fSBarry Smith PetscFunctionReturn(0); 600716a85fSBarry Smith } 610716a85fSBarry Smith 623a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 633a062f41SBarry Smith { 643a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 653a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 663a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 673a062f41SBarry Smith PetscInt *rows; 683a062f41SBarry Smith 693a062f41SBarry Smith PetscFunctionBegin; 703a062f41SBarry Smith for (i=0; i<m; i++) { 713a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 723a062f41SBarry 
Smith cnt++; 733a062f41SBarry Smith } 743a062f41SBarry Smith } 759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 763a062f41SBarry Smith cnt = 0; 773a062f41SBarry Smith for (i=0; i<m; i++) { 783a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 793a062f41SBarry Smith rows[cnt] = i; 803a062f41SBarry Smith cnt++; 813a062f41SBarry Smith } 823a062f41SBarry Smith } 839566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is)); 843a062f41SBarry Smith PetscFunctionReturn(0); 853a062f41SBarry Smith } 863a062f41SBarry Smith 87f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 886ce1633cSBarry Smith { 896ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 90fff043a9SJunchao Zhang const MatScalar *aa; 916ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 92b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 936ce1633cSBarry Smith PetscInt *rows; 946ce1633cSBarry Smith 956ce1633cSBarry Smith PetscFunctionBegin; 969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 979566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 986ce1633cSBarry Smith diag = a->diag; 996ce1633cSBarry Smith for (i=0; i<m; i++) { 100b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1016ce1633cSBarry Smith cnt++; 1026ce1633cSBarry Smith } 1036ce1633cSBarry Smith } 1049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 1056ce1633cSBarry Smith cnt = 0; 1066ce1633cSBarry Smith for (i=0; i<m; i++) { 107b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1086ce1633cSBarry Smith rows[cnt++] = i; 1096ce1633cSBarry Smith } 1106ce1633cSBarry Smith } 111f1f41ecbSJed Brown *nrows = cnt; 112f1f41ecbSJed Brown *zrows = rows; 1139566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 114f1f41ecbSJed Brown PetscFunctionReturn(0); 115f1f41ecbSJed Brown } 116f1f41ecbSJed Brown 117f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 118f1f41ecbSJed Brown { 119f1f41ecbSJed Brown PetscInt nrows,*rows; 120f1f41ecbSJed Brown 121f1f41ecbSJed Brown PetscFunctionBegin; 1220298fd71SBarry Smith *zrows = NULL; 1239566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows)); 1249566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows)); 1256ce1633cSBarry Smith PetscFunctionReturn(0); 1266ce1633cSBarry Smith } 1276ce1633cSBarry Smith 128b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 129b3a44c85SBarry Smith { 130b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 131b3a44c85SBarry Smith const MatScalar *aa; 132b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 133b3a44c85SBarry Smith const PetscInt *ii; 134b3a44c85SBarry Smith PetscInt n,i,j,*rows; 135b3a44c85SBarry Smith 136b3a44c85SBarry Smith PetscFunctionBegin; 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 138f4259b30SLisandro Dalcin *keptrows = NULL; 139b3a44c85SBarry Smith ii = a->i; 140b3a44c85SBarry Smith for (i=0; i<m; i++) { 141b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 142b3a44c85SBarry Smith if (!n) { 143b3a44c85SBarry Smith cnt++; 144b3a44c85SBarry Smith goto ok1; 145b3a44c85SBarry Smith } 1462e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 147b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 148b3a44c85SBarry Smith } 149b3a44c85SBarry Smith cnt++; 150b3a44c85SBarry Smith ok1:; 151b3a44c85SBarry Smith } 1522e5835c6SStefano Zampini if (!cnt) { 1539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1542e5835c6SStefano Zampini PetscFunctionReturn(0); 1552e5835c6SStefano Zampini } 1569566063dSJacob Faibussowitsch 
PetscCall(PetscMalloc1(A->rmap->n-cnt,&rows)); 157b3a44c85SBarry Smith cnt = 0; 158b3a44c85SBarry Smith for (i=0; i<m; i++) { 159b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 160b3a44c85SBarry Smith if (!n) continue; 1612e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 162b3a44c85SBarry Smith if (aa[j] != 0.0) { 163b3a44c85SBarry Smith rows[cnt++] = i; 164b3a44c85SBarry Smith break; 165b3a44c85SBarry Smith } 166b3a44c85SBarry Smith } 167b3a44c85SBarry Smith } 1689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1699566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows)); 170b3a44c85SBarry Smith PetscFunctionReturn(0); 171b3a44c85SBarry Smith } 172b3a44c85SBarry Smith 1737087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 17479299369SBarry Smith { 17579299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17699e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17799e65526SBarry Smith const PetscInt *diag; 1782e5835c6SStefano Zampini MatScalar *aa; 17999e65526SBarry Smith const PetscScalar *v; 180ace3abfcSBarry Smith PetscBool missing; 18179299369SBarry Smith 18279299369SBarry Smith PetscFunctionBegin; 18309f38230SBarry Smith if (Y->assembled) { 1849566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y,&missing,NULL)); 18509f38230SBarry Smith if (!missing) { 18679299369SBarry Smith diag = aij->diag; 1879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D,&v)); 1889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&aa)); 18979299369SBarry Smith if (is == INSERT_VALUES) { 19079299369SBarry Smith for (i=0; i<m; i++) { 19179299369SBarry Smith aa[diag[i]] = v[i]; 19279299369SBarry Smith } 19379299369SBarry Smith } else { 19479299369SBarry Smith for (i=0; i<m; i++) { 19579299369SBarry Smith aa[diag[i]] += v[i]; 19679299369SBarry Smith } 19779299369SBarry Smith } 1989566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArray(Y,&aa)); 1999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D,&v)); 20079299369SBarry Smith PetscFunctionReturn(0); 20179299369SBarry Smith } 2029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 20309f38230SBarry Smith } 2049566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y,D,is)); 20509f38230SBarry Smith PetscFunctionReturn(0); 20609f38230SBarry Smith } 20779299369SBarry Smith 2081a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 20917ab2063SBarry Smith { 210416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21197f1f81fSBarry Smith PetscInt i,ishift; 21217ab2063SBarry Smith 2133a40ed3dSBarry Smith PetscFunctionBegin; 214f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2153a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 216bfeeae90SHong Zhang ishift = 0; 217b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2189566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja)); 219bfeeae90SHong Zhang } else if (oshift == 1) { 2201a83f524SJed Brown PetscInt *tia; 221d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2223b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&tia)); 2241a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2251a83f524SJed Brown *ia = tia; 226ecc77c7aSBarry Smith if (ja) { 2271a83f524SJed Brown PetscInt *tja; 2289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&tja)); 2291a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2301a83f524SJed Brown *ja = tja; 231ecc77c7aSBarry Smith } 2326945ee14SBarry Smith } else { 233ecc77c7aSBarry Smith *ia = a->i; 234ecc77c7aSBarry Smith if (ja) *ja 
= a->j; 235a2ce50c7SBarry Smith } 2363a40ed3dSBarry Smith PetscFunctionReturn(0); 237a2744918SBarry Smith } 238a2744918SBarry Smith 2391a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2406945ee14SBarry Smith { 2413a40ed3dSBarry Smith PetscFunctionBegin; 2423a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 243b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2449566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2459566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 246bcd2baecSBarry Smith } 2473a40ed3dSBarry Smith PetscFunctionReturn(0); 24817ab2063SBarry Smith } 24917ab2063SBarry Smith 2501a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2513b2fbd54SBarry Smith { 2523b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 253d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25497f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2553b2fbd54SBarry Smith 2563a40ed3dSBarry Smith PetscFunctionBegin; 257899cda47SBarry Smith *nn = n; 2583a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2593b2fbd54SBarry Smith if (symmetric) { 2609566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja)); 2613b2fbd54SBarry Smith } else { 2629566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 2639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 2649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 2653b2fbd54SBarry Smith jj = a->j; 2663b2fbd54SBarry Smith for (i=0; i<nz; i++) { 267bfeeae90SHong Zhang collengths[jj[i]]++; 2683b2fbd54SBarry Smith } 
2693b2fbd54SBarry Smith cia[0] = oshift; 2703b2fbd54SBarry Smith for (i=0; i<n; i++) { 2713b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2723b2fbd54SBarry Smith } 2739566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 2743b2fbd54SBarry Smith jj = a->j; 275a93ec695SBarry Smith for (row=0; row<m; row++) { 276a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 277a93ec695SBarry Smith for (i=0; i<mr; i++) { 278bfeeae90SHong Zhang col = *jj++; 2792205254eSKarl Rupp 2803b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2813b2fbd54SBarry Smith } 2823b2fbd54SBarry Smith } 2839566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2843b2fbd54SBarry Smith *ia = cia; *ja = cja; 2853b2fbd54SBarry Smith } 2863a40ed3dSBarry Smith PetscFunctionReturn(0); 2873b2fbd54SBarry Smith } 2883b2fbd54SBarry Smith 2891a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2903b2fbd54SBarry Smith { 2913a40ed3dSBarry Smith PetscFunctionBegin; 2923a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2933b2fbd54SBarry Smith 2949566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2963a40ed3dSBarry Smith PetscFunctionReturn(0); 2973b2fbd54SBarry Smith } 2983b2fbd54SBarry Smith 2997cee066cSHong Zhang /* 3007cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 302040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3037cee066cSHong Zhang */ 3047cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt 
*ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3057cee066cSHong Zhang { 3067cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3077cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 308071fcb05SBarry Smith PetscInt nz = a->i[m],row,mr,col,tmp; 3097cee066cSHong Zhang PetscInt *cspidx; 310071fcb05SBarry Smith const PetscInt *jj; 3117cee066cSHong Zhang 3127cee066cSHong Zhang PetscFunctionBegin; 3137cee066cSHong Zhang *nn = n; 3147cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 315625f6d37SHong Zhang 3169566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 3179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 3189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cspidx)); 3207cee066cSHong Zhang jj = a->j; 3217cee066cSHong Zhang for (i=0; i<nz; i++) { 3227cee066cSHong Zhang collengths[jj[i]]++; 3237cee066cSHong Zhang } 3247cee066cSHong Zhang cia[0] = oshift; 3257cee066cSHong Zhang for (i=0; i<n; i++) { 3267cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3277cee066cSHong Zhang } 3289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 3297cee066cSHong Zhang jj = a->j; 3307cee066cSHong Zhang for (row=0; row<m; row++) { 3317cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3327cee066cSHong Zhang for (i=0; i<mr; i++) { 3337cee066cSHong Zhang col = *jj++; 334071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 335071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 336071fcb05SBarry Smith cja[tmp] = row + oshift; 3377cee066cSHong Zhang } 3387cee066cSHong Zhang } 3399566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 340071fcb05SBarry Smith *ia = cia; 341071fcb05SBarry Smith *ja = cja; 3427cee066cSHong Zhang *spidx = cspidx; 3437cee066cSHong Zhang PetscFunctionReturn(0); 3447cee066cSHong Zhang } 3457cee066cSHong Zhang 3467cee066cSHong Zhang PetscErrorCode 
MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3477cee066cSHong Zhang { 3487cee066cSHong Zhang PetscFunctionBegin; 3499566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done)); 3509566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3517cee066cSHong Zhang PetscFunctionReturn(0); 3527cee066cSHong Zhang } 3537cee066cSHong Zhang 35487d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 35587d4246cSBarry Smith { 35687d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35787d4246cSBarry Smith PetscInt *ai = a->i; 358fff043a9SJunchao Zhang PetscScalar *aa; 35987d4246cSBarry Smith 36087d4246cSBarry Smith PetscFunctionBegin; 3619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 3629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa+ai[row],v,ai[row+1]-ai[row])); 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 36487d4246cSBarry Smith PetscFunctionReturn(0); 36587d4246cSBarry Smith } 36687d4246cSBarry Smith 367bd04181cSBarry Smith /* 368bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 369bd04181cSBarry Smith 370bd04181cSBarry Smith - a single row of values is set with each call 371bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 372bd04181cSBarry Smith - the values are always added to the matrix, not set 373bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 374bd04181cSBarry Smith 3751f763a69SBarry Smith This does NOT assume the global column indices are sorted 376bd04181cSBarry Smith 3771f763a69SBarry Smith */ 378bd04181cSBarry Smith 379af0996ceSBarry Smith #include 
<petsc/private/isimpl.h> 380189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 381189e4007SBarry Smith { 382189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3831f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3841f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 3851f763a69SBarry Smith PetscInt lastcol = -1; 386fff043a9SJunchao Zhang MatScalar *ap,value,*aa; 387189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 388189e4007SBarry Smith 389fff043a9SJunchao Zhang PetscFunctionBegin; 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 391f38dd0b8SBarry Smith row = ridx[im[0]]; 3921f763a69SBarry Smith rp = aj + ai[row]; 3931f763a69SBarry Smith ap = aa + ai[row]; 3941f763a69SBarry Smith nrow = ailen[row]; 395189e4007SBarry Smith low = 0; 396189e4007SBarry Smith high = nrow; 397189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 398189e4007SBarry Smith col = cidx[in[l]]; 399f38dd0b8SBarry Smith value = v[l]; 400189e4007SBarry Smith 401189e4007SBarry Smith if (col <= lastcol) low = 0; 402189e4007SBarry Smith else high = nrow; 403189e4007SBarry Smith lastcol = col; 404189e4007SBarry Smith while (high-low > 5) { 405189e4007SBarry Smith t = (low+high)/2; 406189e4007SBarry Smith if (rp[t] > col) high = t; 407189e4007SBarry Smith else low = t; 408189e4007SBarry Smith } 409189e4007SBarry Smith for (i=low; i<high; i++) { 410189e4007SBarry Smith if (rp[i] == col) { 4111f763a69SBarry Smith ap[i] += value; 412189e4007SBarry Smith low = i + 1; 4131f763a69SBarry Smith break; 414189e4007SBarry Smith } 415189e4007SBarry Smith } 416189e4007SBarry Smith } 4179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 418f38dd0b8SBarry Smith return 0; 419189e4007SBarry Smith } 420189e4007SBarry Smith 42197f1f81fSBarry Smith 
PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 42217ab2063SBarry Smith { 423416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 424e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 42597f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 426e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 427ce496241SStefano Zampini MatScalar *ap=NULL,value=0.0,*aa; 428ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 429ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 43017ab2063SBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 4329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 43317ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 434416022c9SBarry Smith row = im[k]; 4355ef9f2a5SBarry Smith if (row < 0) continue; 4366bdcaf15SBarry Smith PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 437720833daSHong Zhang rp = aj + ai[row]; 438876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 43917ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 440416022c9SBarry Smith low = 0; 441c71e6ed7SBarry Smith high = nrow; 44217ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4435ef9f2a5SBarry Smith if (in[l] < 0) continue; 4446bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 445bfeeae90SHong Zhang col = in[l]; 446071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k*n] : v[k + l*m]; 447071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 44836db0b34SBarry Smith 4492205254eSKarl Rupp if (col <= lastcol) low = 0; 4502205254eSKarl Rupp else high = nrow; 451e2ee6c50SBarry Smith lastcol = col; 452416022c9SBarry Smith while (high-low > 5) { 453416022c9SBarry Smith t = (low+high)/2; 454416022c9SBarry Smith if (rp[t] > col) high = t; 455416022c9SBarry Smith else low = t; 45617ab2063SBarry Smith } 457416022c9SBarry Smith for (i=low; i<high; i++) { 45817ab2063SBarry Smith if (rp[i] > col) break; 45917ab2063SBarry Smith if (rp[i] == col) { 460876c6284SHong Zhang if (!A->structure_only) { 4610c0d7e18SFande Kong if (is == ADD_VALUES) { 4620c0d7e18SFande Kong ap[i] += value; 4630c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4640c0d7e18SFande Kong } 46517ab2063SBarry Smith else ap[i] = value; 466720833daSHong Zhang } 467e44c0bd4SBarry Smith low = i + 1; 46817ab2063SBarry Smith goto noinsert; 46917ab2063SBarry Smith } 47017ab2063SBarry Smith } 471dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 472c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 47308401ef6SPierre Jolivet PetscCheck(nonew != -1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix",row,col); 474720833daSHong Zhang if (A->structure_only) { 475876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 476720833daSHong Zhang } else { 477fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 478720833daSHong Zhang } 479c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 480416022c9SBarry Smith /* shift up all the later entries in this row */ 4819566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp+i+1,rp+i,N-i+1)); 48217ab2063SBarry Smith rp[i] = col; 
483580bdb30SBarry Smith if (!A->structure_only) { 4849566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap+i+1,ap+i,N-i+1)); 485580bdb30SBarry Smith ap[i] = value; 486580bdb30SBarry Smith } 487416022c9SBarry Smith low = i + 1; 488e56f5c9eSBarry Smith A->nonzerostate++; 489e44c0bd4SBarry Smith noinsert:; 49017ab2063SBarry Smith } 49117ab2063SBarry Smith ailen[row] = nrow; 49217ab2063SBarry Smith } 4939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 4943a40ed3dSBarry Smith PetscFunctionReturn(0); 49517ab2063SBarry Smith } 49617ab2063SBarry Smith 49719b08ed1SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 49819b08ed1SBarry Smith { 49919b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 50019b08ed1SBarry Smith PetscInt *rp,k,row; 50119b08ed1SBarry Smith PetscInt *ai = a->i; 50219b08ed1SBarry Smith PetscInt *aj = a->j; 503fff043a9SJunchao Zhang MatScalar *aa,*ap; 50419b08ed1SBarry Smith 50519b08ed1SBarry Smith PetscFunctionBegin; 50628b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot call on assembled matrix."); 50708401ef6SPierre Jolivet PetscCheck(m*n+a->nz <= a->maxnz,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()",a->maxnz); 508fff043a9SJunchao Zhang 5099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 51019b08ed1SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 51119b08ed1SBarry Smith row = im[k]; 51219b08ed1SBarry Smith rp = aj + ai[row]; 51319b08ed1SBarry Smith ap = aa + ai[row]; 51419b08ed1SBarry Smith 5159566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 51619b08ed1SBarry Smith if (!A->structure_only) { 51719b08ed1SBarry Smith if (v) { 5189566063dSJacob 
Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 51919b08ed1SBarry Smith v += n; 52019b08ed1SBarry Smith } else { 5219566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 52219b08ed1SBarry Smith } 52319b08ed1SBarry Smith } 52419b08ed1SBarry Smith a->ilen[row] = n; 52519b08ed1SBarry Smith a->imax[row] = n; 52619b08ed1SBarry Smith a->i[row+1] = a->i[row]+n; 52719b08ed1SBarry Smith a->nz += n; 52819b08ed1SBarry Smith } 5299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 53019b08ed1SBarry Smith PetscFunctionReturn(0); 53119b08ed1SBarry Smith } 53219b08ed1SBarry Smith 53319b08ed1SBarry Smith /*@ 53419b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith Input Parameters: 53719b08ed1SBarry Smith + A - the SeqAIJ matrix 53819b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith Level: advanced 54119b08ed1SBarry Smith 54219b08ed1SBarry Smith Notes: 54319b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 54419b08ed1SBarry Smith Simply call MatSetValues() after this call to provide the matrix entries in the usual manner. This matrix may be used 54519b08ed1SBarry Smith as always with multiple matrix assemblies. 
54619b08ed1SBarry Smith 547db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 54819b08ed1SBarry Smith @*/ 54919b08ed1SBarry Smith 55019b08ed1SBarry Smith PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A,PetscInt nztotal) 55119b08ed1SBarry Smith { 55219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 55319b08ed1SBarry Smith 55419b08ed1SBarry Smith PetscFunctionBegin; 5559566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 55719b08ed1SBarry Smith a->maxnz = nztotal; 55819b08ed1SBarry Smith if (!a->imax) { 5599566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->imax)); 5609566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith if (!a->ilen) { 5639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->ilen)); 5649566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56519b08ed1SBarry Smith } else { 5669566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen,A->rmap->n*sizeof(PetscInt))); 56719b08ed1SBarry Smith } 56819b08ed1SBarry Smith 56919b08ed1SBarry Smith /* allocate the matrix space */ 57019b08ed1SBarry Smith if (A->structure_only) { 5719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal,&a->j)); 5729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&a->i)); 5739566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*sizeof(PetscInt))); 57419b08ed1SBarry Smith } else { 5759566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal,&a->a,nztotal,&a->j,A->rmap->n+1,&a->i)); 5769566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*(sizeof(PetscScalar)+sizeof(PetscInt)))); 
57719b08ed1SBarry Smith } 57819b08ed1SBarry Smith a->i[0] = 0; 57919b08ed1SBarry Smith if (A->structure_only) { 58019b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 58119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 58219b08ed1SBarry Smith } else { 58319b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 58419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 58519b08ed1SBarry Smith } 58619b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 58719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 58819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 58919b08ed1SBarry Smith PetscFunctionReturn(0); 59019b08ed1SBarry Smith } 59119b08ed1SBarry Smith 592071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 593071fcb05SBarry Smith { 594071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 595071fcb05SBarry Smith PetscInt *rp,k,row; 596071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 597071fcb05SBarry Smith PetscInt *aj = a->j; 598fff043a9SJunchao Zhang MatScalar *aa,*ap; 599071fcb05SBarry Smith 600071fcb05SBarry Smith PetscFunctionBegin; 6019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 602071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 603071fcb05SBarry Smith row = im[k]; 6046bdcaf15SBarry Smith PetscCheck(n <= a->imax[row],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Preallocation for row %" PetscInt_FMT " does not match number of columns provided",n); 605071fcb05SBarry Smith rp = aj + ai[row]; 606071fcb05SBarry Smith ap = aa + ai[row]; 607071fcb05SBarry Smith if (!A->was_assembled) { 6089566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 609071fcb05SBarry Smith } 610071fcb05SBarry Smith if (!A->structure_only) { 611071fcb05SBarry Smith if (v) { 6129566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 613071fcb05SBarry Smith v += n; 
614071fcb05SBarry Smith } else { 6159566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 616071fcb05SBarry Smith } 617071fcb05SBarry Smith } 618071fcb05SBarry Smith ailen[row] = n; 619071fcb05SBarry Smith a->nz += n; 620071fcb05SBarry Smith } 6219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 622071fcb05SBarry Smith PetscFunctionReturn(0); 623071fcb05SBarry Smith } 624071fcb05SBarry Smith 625a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 6267eb43aa7SLois Curfman McInnes { 6277eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 62897f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 62997f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 630fff043a9SJunchao Zhang MatScalar *ap,*aa; 6317eb43aa7SLois Curfman McInnes 6323a40ed3dSBarry Smith PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 6347eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 6357eb43aa7SLois Curfman McInnes row = im[k]; 63654c59aa7SJacob Faibussowitsch if (row < 0) {v += n; continue;} /* negative row */ 63754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 638bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 6397eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6407eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 64154c59aa7SJacob Faibussowitsch if (in[l] < 0) {v++; continue;} /* negative column */ 64254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 643bfeeae90SHong Zhang col = in[l]; 6447eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 
6457eb43aa7SLois Curfman McInnes while (high-low > 5) { 6467eb43aa7SLois Curfman McInnes t = (low+high)/2; 6477eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6487eb43aa7SLois Curfman McInnes else low = t; 6497eb43aa7SLois Curfman McInnes } 6507eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 6517eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6527eb43aa7SLois Curfman McInnes if (rp[i] == col) { 653b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6547eb43aa7SLois Curfman McInnes goto finished; 6557eb43aa7SLois Curfman McInnes } 6567eb43aa7SLois Curfman McInnes } 65797e567efSBarry Smith *v++ = 0.0; 6587eb43aa7SLois Curfman McInnes finished:; 6597eb43aa7SLois Curfman McInnes } 6607eb43aa7SLois Curfman McInnes } 6619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 6623a40ed3dSBarry Smith PetscFunctionReturn(0); 6637eb43aa7SLois Curfman McInnes } 6647eb43aa7SLois Curfman McInnes 6653ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 66617ab2063SBarry Smith { 6673ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 668c898d852SStefano Zampini const PetscScalar *av; 6693ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6703ea6fe3dSLisandro Dalcin PetscInt *rowlens; 67117ab2063SBarry Smith 6723a40ed3dSBarry Smith PetscFunctionBegin; 6739566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6742205254eSKarl Rupp 6753ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6763ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6773ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6783ea6fe3dSLisandro Dalcin nz = A->nz; 679416022c9SBarry Smith 6803ea6fe3dSLisandro Dalcin /* write matrix header */ 6813ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6823ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6839566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,header,4,PETSC_INT)); 684416022c9SBarry Smith 6853ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 
6869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&rowlens)); 6873ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6889566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT)); 6899566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6903ea6fe3dSLisandro Dalcin /* store column indices */ 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT)); 692416022c9SBarry Smith /* store nonzero values */ 6939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat,&av)); 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,av,nz,PETSC_SCALAR)); 6959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat,&av)); 696b37d52dbSMark F. Adams 6973ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6989566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat,viewer)); 6993a40ed3dSBarry Smith PetscFunctionReturn(0); 70017ab2063SBarry Smith } 701416022c9SBarry Smith 7027dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 7037dc0baabSHong Zhang { 7047dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7057dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 7067dc0baabSHong Zhang 7077dc0baabSHong Zhang PetscFunctionBegin; 7089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7097dc0baabSHong Zhang for (i=0; i<m; i++) { 7109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 7117dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 7129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ") ",a->j[k])); 7137dc0baabSHong Zhang } 7149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 7157dc0baabSHong Zhang } 7169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 7177dc0baabSHong 
Zhang PetscFunctionReturn(0); 7187dc0baabSHong Zhang } 7197dc0baabSHong Zhang 72009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 721cd155464SBarry Smith 722dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 723416022c9SBarry Smith { 724416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 725c898d852SStefano Zampini const PetscScalar *av; 72660e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 727e060cb09SBarry Smith const char *name; 728f3ef73ceSBarry Smith PetscViewerFormat format; 72917ab2063SBarry Smith 7303a40ed3dSBarry Smith PetscFunctionBegin; 7317dc0baabSHong Zhang if (A->structure_only) { 7329566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A,viewer)); 7337dc0baabSHong Zhang PetscFunctionReturn(0); 7347dc0baabSHong Zhang } 73543e49210SHong Zhang 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 7372e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7382e5835c6SStefano Zampini 739c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 7419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 74271c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 74397f1f81fSBarry Smith PetscInt nofinalvalue = 0; 74460e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 745c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 746d00d2cf4SBarry Smith nofinalvalue = 1; 747d00d2cf4SBarry Smith } 7489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n",m,A->cmap->n)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %" PetscInt_FMT " \n",a->nz)); 751fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",4);\n",a->nz+nofinalvalue)); 753fbfe6fa7SJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",3);\n",a->nz+nofinalvalue)); 755fbfe6fa7SJed Brown #endif 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = [\n")); 75717ab2063SBarry Smith 75817ab2063SBarry Smith for (i=0; i<m; i++) { 75960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 760aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 76217ab2063SBarry Smith #else 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",i+1,a->j[j]+1,(double)a->a[j])); 76417ab2063SBarry Smith #endif 76517ab2063SBarry Smith } 76617ab2063SBarry Smith } 767d00d2cf4SBarry Smith if (nofinalvalue) { 768c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",m,A->cmap->n,0.,0.)); 770c337ccceSJed Brown #else 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",m,A->cmap->n,0.0)); 772c337ccceSJed Brown #endif 
773d00d2cf4SBarry Smith } 7749566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A,&name)); 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name)); 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 777fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 77944cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 78160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 78536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 78736db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 7896831982aSBarry Smith } 79044cd7ae7SLois Curfman McInnes #else 7919566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 79244cd7ae7SLois Curfman McInnes #endif 79344cd7ae7SLois Curfman McInnes } 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 79544cd7ae7SLois Curfman McInnes } 7969566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 797fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 79897f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&sptr)); 801496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 802496be53dSLois Curfman McInnes sptr[i] = nzd+1; 80360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 804496be53dSLois Curfman McInnes if (a->j[j] >= i) { 805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 807496be53dSLois Curfman McInnes #else 808496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 809496be53dSLois Curfman McInnes #endif 810496be53dSLois Curfman McInnes } 811496be53dSLois Curfman McInnes } 812496be53dSLois Curfman McInnes } 8132e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 8149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n\n",m,nzd)); 8152e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 8162205254eSKarl Rupp if (i+4<m) { 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5])); 8182205254eSKarl Rupp } else if (i+3<m) { 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4])); 8202205254eSKarl Rupp } else if (i+2<m) { 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3])); 8222205254eSKarl Rupp } 
else if (i+1<m) { 8239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2])); 8242205254eSKarl Rupp } else if (i<m) { 8259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1])); 8262205254eSKarl Rupp } else { 8279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT "\n",sptr[i])); 8282205254eSKarl Rupp } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 8319566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 832496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 83360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8349566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " ",a->j[j]+fshift)); 835496be53dSLois Curfman McInnes } 8369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 837496be53dSLois Curfman McInnes } 8389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 839496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 84060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 841496be53dSLois Curfman McInnes if (a->j[j] >= i) { 842aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 8449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 8456831982aSBarry Smith } 846496be53dSLois Curfman McInnes #else 8479566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j])); 848496be53dSLois Curfman McInnes #endif 849496be53dSLois Curfman McInnes } 850496be53dSLois Curfman McInnes } 8519566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 852496be53dSLois Curfman McInnes } 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 854fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 85597f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 85687828ca2SBarry Smith PetscScalar value; 85768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 85968f1ed48SBarry Smith 86068f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 86168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 86268f1ed48SBarry Smith realonly = PETSC_FALSE; 86368f1ed48SBarry Smith break; 86468f1ed48SBarry Smith } 86568f1ed48SBarry Smith } 86668f1ed48SBarry Smith #endif 86702594712SBarry Smith 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 86902594712SBarry Smith for (i=0; i<m; i++) { 87002594712SBarry Smith jcnt = 0; 871d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 872e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 87302594712SBarry Smith value = a->a[cnt++]; 874e24b481bSBarry Smith jcnt++; 87502594712SBarry Smith } else { 87602594712SBarry Smith value = 0.0; 87702594712SBarry Smith } 878aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 87968f1ed48SBarry Smith if (realonly) { 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value))); 88168f1ed48SBarry Smith } else { 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value))); 88368f1ed48SBarry Smith } 88402594712SBarry Smith #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value)); 88602594712SBarry Smith #endif 88702594712SBarry Smith } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 88902594712SBarry Smith } 8909566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 8913c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 892150b93efSMatthew G. Knepley PetscInt fshift=1; 8939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8943c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n")); 8963c215bfdSMatthew Knepley #else 8979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n")); 8983c215bfdSMatthew Knepley #endif 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 9003c215bfdSMatthew Knepley for (i=0; i<m; i++) { 90160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 9023c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 9043c215bfdSMatthew Knepley #else 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j])); 9063c215bfdSMatthew Knepley #endif 9073c215bfdSMatthew Knepley } 9083c215bfdSMatthew Knepley } 9099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 9103a40ed3dSBarry Smith } else { 9119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 912d5f3da31SBarry Smith if (A->factortype) { 91316cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 91516cd7e1dSShri Abhyankar /* L part */ 91660e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) 
{ 91716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 92016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 92216cd7e1dSShri Abhyankar } else { 9239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 92416cd7e1dSShri Abhyankar } 92516cd7e1dSShri Abhyankar #else 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 92716cd7e1dSShri Abhyankar #endif 92816cd7e1dSShri Abhyankar } 92916cd7e1dSShri Abhyankar /* diagonal */ 93016cd7e1dSShri Abhyankar j = a->diag[i]; 93116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 93216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]))); 93416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])))); 93616cd7e1dSShri Abhyankar } else { 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]))); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar #else 9409566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)(1.0/a->a[j]))); 94116cd7e1dSShri Abhyankar #endif 94216cd7e1dSShri Abhyankar 94316cd7e1dSShri Abhyankar /* U part */ 94460e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 94516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 94616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 94816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 95016cd7e1dSShri Abhyankar } else { 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 95216cd7e1dSShri Abhyankar } 95316cd7e1dSShri Abhyankar #else 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 95516cd7e1dSShri Abhyankar #endif 95616cd7e1dSShri Abhyankar } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 95816cd7e1dSShri Abhyankar } 95916cd7e1dSShri Abhyankar } else { 96017ab2063SBarry Smith for (i=0; i<m; i++) { 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 96260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 963aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 96436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 96636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) 
< 0.0) { 9679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 9683a40ed3dSBarry Smith } else { 9699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 97017ab2063SBarry Smith } 97117ab2063SBarry Smith #else 9729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 97317ab2063SBarry Smith #endif 97417ab2063SBarry Smith } 9759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 97617ab2063SBarry Smith } 97716cd7e1dSShri Abhyankar } 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 97917ab2063SBarry Smith } 9809566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9813a40ed3dSBarry Smith PetscFunctionReturn(0); 982416022c9SBarry Smith } 983416022c9SBarry Smith 9849804daf3SBarry Smith #include <petscdraw.h> 985dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 986416022c9SBarry Smith { 987480ef9eaSBarry Smith Mat A = (Mat) Aa; 988416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 989383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 990383922c3SLisandro Dalcin int color; 991b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 992b0a32e0cSBarry Smith PetscViewer viewer; 993f3ef73ceSBarry Smith PetscViewerFormat format; 994fff043a9SJunchao Zhang const PetscScalar *aa; 995cddf8d76SBarry Smith 9963a40ed3dSBarry Smith PetscFunctionBegin; 9979566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer)); 9989566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 9999566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr)); 1000383922c3SLisandro Dalcin 
1001416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 10029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1003fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1004d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10050513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 1006b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1007416022c9SBarry Smith for (i=0; i<m; i++) { 1008cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1009bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1010bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1011fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 10129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1013cddf8d76SBarry Smith } 1014cddf8d76SBarry Smith } 1015b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 1016cddf8d76SBarry Smith for (i=0; i<m; i++) { 1017cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1018bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1019bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1020fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10219566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1022cddf8d76SBarry Smith } 1023cddf8d76SBarry Smith } 1024b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1025cddf8d76SBarry Smith for (i=0; i<m; i++) { 1026cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1027bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1028bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1029fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) 
continue; 10309566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1031416022c9SBarry Smith } 1032416022c9SBarry Smith } 1033d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10340513a670SBarry Smith } else { 10350513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10360513a670SBarry Smith /* first determine max of all nonzero values */ 1037b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1038383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1039b0a32e0cSBarry Smith PetscDraw popup; 10400513a670SBarry Smith 10410513a670SBarry Smith for (i=0; i<nz; i++) { 1042fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10430513a670SBarry Smith } 1044383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10459566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw,&popup)); 10469566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup,minv,maxv)); 1047383922c3SLisandro Dalcin 1048d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10490513a670SBarry Smith for (i=0; i<m; i++) { 1050383922c3SLisandro Dalcin y_l = m - i - 1.0; 1051383922c3SLisandro Dalcin y_r = y_l + 1.0; 1052bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1053383922c3SLisandro Dalcin x_l = a->j[j]; 1054383922c3SLisandro Dalcin x_r = x_l + 1.0; 1055fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]),minv,maxv); 10569566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 10570513a670SBarry Smith count++; 10580513a670SBarry Smith } 10590513a670SBarry Smith } 1060d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10610513a670SBarry Smith } 10629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1063480ef9eaSBarry Smith PetscFunctionReturn(0); 1064480ef9eaSBarry Smith } 1065cddf8d76SBarry Smith 10669804daf3SBarry Smith #include <petscdraw.h> 
1067dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 1068480ef9eaSBarry Smith { 1069b0a32e0cSBarry Smith PetscDraw draw; 107036db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1071ace3abfcSBarry Smith PetscBool isnull; 1072480ef9eaSBarry Smith 1073480ef9eaSBarry Smith PetscFunctionBegin; 10749566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer,0,&draw)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw,&isnull)); 1076480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1077480ef9eaSBarry Smith 1078d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1079480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 10809566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw,xl,yl,xr,yr)); 10819566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer)); 10829566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A)); 10839566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL)); 10849566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 1086416022c9SBarry Smith } 1087416022c9SBarry Smith 1088dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1089416022c9SBarry Smith { 1090ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1091416022c9SBarry Smith 10923a40ed3dSBarry Smith PetscFunctionBegin; 10939566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii)); 10949566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw)); 10961baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A,viewer)); 10971baa6e33SBarry Smith else if (isbinary) 
PetscCall(MatView_SeqAIJ_Binary(A,viewer)); 10981baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A,viewer)); 10999566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A,viewer)); 11003a40ed3dSBarry Smith PetscFunctionReturn(0); 110117ab2063SBarry Smith } 110219bcc07fSBarry Smith 1103dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 110417ab2063SBarry Smith { 1105416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1106580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1107d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 110854f21887SBarry Smith MatScalar *aa = a->a,*ap; 11093447b6efSHong Zhang PetscReal ratio = 0.6; 111017ab2063SBarry Smith 11113a40ed3dSBarry Smith PetscFunctionBegin; 11123a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 11139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1114b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1115b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11169566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 1117b215bc84SStefano Zampini PetscFunctionReturn(0); 1118b215bc84SStefano Zampini } 111917ab2063SBarry Smith 112043ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 112117ab2063SBarry Smith for (i=1; i<m; i++) { 1122416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 112317ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 112494a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 112517ab2063SBarry Smith if (fshift) { 1126bfeeae90SHong Zhang ip = aj + ai[i]; 1127bfeeae90SHong Zhang ap = aa + ai[i]; 112817ab2063SBarry Smith N = ailen[i]; 11299566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip-fshift,ip,N)); 1130580bdb30SBarry 
Smith if (!A->structure_only) { 11319566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap-fshift,ap,N)); 113217ab2063SBarry Smith } 113317ab2063SBarry Smith } 113417ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 113517ab2063SBarry Smith } 113617ab2063SBarry Smith if (m) { 113717ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 113817ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 113917ab2063SBarry Smith } 11407b083b7cSBarry Smith 114117ab2063SBarry Smith /* reset ilen and imax for each row */ 11427b083b7cSBarry Smith a->nonzerorowcnt = 0; 1143396832f4SHong Zhang if (A->structure_only) { 11449566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11459566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1146396832f4SHong Zhang } else { /* !A->structure_only */ 114717ab2063SBarry Smith for (i=0; i<m; i++) { 114817ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 11497b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 115017ab2063SBarry Smith } 1151396832f4SHong Zhang } 1152bfeeae90SHong Zhang a->nz = ai[m]; 1153aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1,PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 115417ab2063SBarry Smith 11559566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11569566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n",m,A->cmap->n,fshift,a->nz)); 11579566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n",a->reallocs)); 11589566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Maximum nonzeros in any row is %" PetscInt_FMT "\n",rmax)); 11592205254eSKarl Rupp 11608e58a170SBarry Smith A->info.mallocs += a->reallocs; 1161dd5f02e7SSatish Balay a->reallocs = 0; 11626712e2f1SBarry Smith 
A->info.nz_unneeded = (PetscReal)fshift; 116336db0b34SBarry Smith a->rmax = rmax; 11644e220ebcSLois Curfman McInnes 1165396832f4SHong Zhang if (!A->structure_only) { 11669566063dSJacob Faibussowitsch PetscCall(MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio)); 1167396832f4SHong Zhang } 11689566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 11693a40ed3dSBarry Smith PetscFunctionReturn(0); 117017ab2063SBarry Smith } 117117ab2063SBarry Smith 117299cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 117399cafbc1SBarry Smith { 117499cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 117599cafbc1SBarry Smith PetscInt i,nz = a->nz; 11762e5835c6SStefano Zampini MatScalar *aa; 117799cafbc1SBarry Smith 117899cafbc1SBarry Smith PetscFunctionBegin; 11799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 118099cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 11819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 11829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 118399cafbc1SBarry Smith PetscFunctionReturn(0); 118499cafbc1SBarry Smith } 118599cafbc1SBarry Smith 118699cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 118799cafbc1SBarry Smith { 118899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 118999cafbc1SBarry Smith PetscInt i,nz = a->nz; 11902e5835c6SStefano Zampini MatScalar *aa; 119199cafbc1SBarry Smith 119299cafbc1SBarry Smith PetscFunctionBegin; 11939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 119499cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 11969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 119799cafbc1SBarry Smith PetscFunctionReturn(0); 119899cafbc1SBarry Smith } 119999cafbc1SBarry Smith 1200dfbe8321SBarry Smith PetscErrorCode 
MatZeroEntries_SeqAIJ(Mat A) 120117ab2063SBarry Smith { 1202fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1203fff043a9SJunchao Zhang MatScalar *aa; 12043a40ed3dSBarry Smith 12053a40ed3dSBarry Smith PetscFunctionBegin; 12069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A,&aa)); 12079566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa,a->i[A->rmap->n])); 12089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A,&aa)); 12099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12103a40ed3dSBarry Smith PetscFunctionReturn(0); 121117ab2063SBarry Smith } 1212416022c9SBarry Smith 1213cbc6b225SStefano Zampini PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1214cbc6b225SStefano Zampini { 1215cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1216cbc6b225SStefano Zampini 1217cbc6b225SStefano Zampini PetscFunctionBegin; 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1220cbc6b225SStefano Zampini PetscFunctionReturn(0); 1221cbc6b225SStefano Zampini } 1222cbc6b225SStefano Zampini 1223dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 122417ab2063SBarry Smith { 1225416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1226d5d45c9bSBarry Smith 12273a40ed3dSBarry Smith PetscFunctionBegin; 1228aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1229c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A,"Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT,A->rmap->n,A->cmap->n,a->nz); 123017ab2063SBarry Smith #endif 12319566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i)); 12329566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12339566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12349566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12359566063dSJacob Faibussowitsch 
PetscCall(PetscFree(a->diag)); 12369566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12379566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12389566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12399566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12409566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag,a->mdiag,a->ssor_work)); 12419566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12429566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12439566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12449566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i,a->compressedrow.rindex)); 12459566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12469566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1247901853e0SKris Buschelman 12486718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12496718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12506718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 12516718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12526718818eSStefano Zampini due to different matrix sizes */ 12539566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL)); 12546718818eSStefano Zampini 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A,NULL)); 12562e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEnginePut_C",NULL)); 12572e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"PetscMatlabEngineGet_C",NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL)); 12609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL)); 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL)); 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL)); 12642e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijsell_C",NULL)); 12652e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12662e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijmkl_C",NULL)); 12672e956fe4SStefano Zampini #endif 12684222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL)); 12709566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",NULL)); 12724222ddf1SHong Zhang #endif 12733d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijkokkos_C",NULL)); 12753d0639e7SStefano Zampini #endif 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL)); 1277af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL)); 1279af8000cdSHong Zhang #endif 1280d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_scalapack_C",NULL)); 1282d24d4204SJose E. 
Roman #endif 128363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL)); 128663c07aadSStefano Zampini #endif 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL)); 12912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsHermitianTranspose_C",NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJKron_C",NULL)); 
13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL)); 13022e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverType_C",NULL)); 13032e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13042e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijsell_seqaij_C",NULL)); 13052e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaijperm_seqaij_C",NULL)); 13062e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijviennacl_C",NULL)); 13072e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqdense_C",NULL)); 13082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijviennacl_seqaij_C",NULL)); 13093a40ed3dSBarry Smith PetscFunctionReturn(0); 131017ab2063SBarry Smith } 131117ab2063SBarry Smith 1312ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 131317ab2063SBarry Smith { 1314416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 13153a40ed3dSBarry Smith 13163a40ed3dSBarry Smith PetscFunctionBegin; 1317a65d3064SKris Buschelman switch (op) { 1318a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 13194e0d8c25SBarry Smith a->roworiented = flg; 1320a65d3064SKris Buschelman break; 1321a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1322a9817697SBarry Smith a->keepnonzeropattern = flg; 1323a65d3064SKris Buschelman break; 1324512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1325512a5fc5SBarry Smith a->nonew = (flg ? 
0 : 1); 1326a65d3064SKris Buschelman break; 1327a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13284e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1329a65d3064SKris Buschelman break; 1330a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 13314e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1332a65d3064SKris Buschelman break; 133328b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 133428b2fa4aSMatthew Knepley a->nounused = (flg ? -1 : 0); 133528b2fa4aSMatthew Knepley break; 1336a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 13374e0d8c25SBarry Smith a->ignorezeroentries = flg; 13380df259c2SBarry Smith break; 13393d472b54SHong Zhang case MAT_SPD: 1340b1646e73SJed Brown case MAT_SYMMETRIC: 1341b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1342b1646e73SJed Brown case MAT_HERMITIAN: 1343b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1344957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1345b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1346b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1347b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13485021d80fSJed Brown break; 13498c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1350a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1351a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 13529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Option %s ignored\n",MatOptions[op])); 1353a65d3064SKris Buschelman break; 1354b87ac2d8SJed Brown case MAT_USE_INODES: 13559566063dSJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A,MAT_USE_INODES,flg)); 1356b87ac2d8SJed Brown break; 1357c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1358c10200c1SHong Zhang A->submat_singleis = flg; 1359c10200c1SHong Zhang break; 1360071fcb05SBarry Smith case MAT_SORTED_FULL: 1361071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1362071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 
1363071fcb05SBarry Smith break; 13641a2c6b5cSJunchao Zhang case MAT_FORM_EXPLICIT_TRANSPOSE: 13651a2c6b5cSJunchao Zhang A->form_explicit_transpose = flg; 13661a2c6b5cSJunchao Zhang break; 1367a65d3064SKris Buschelman default: 136898921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1369a65d3064SKris Buschelman } 13703a40ed3dSBarry Smith PetscFunctionReturn(0); 137117ab2063SBarry Smith } 137217ab2063SBarry Smith 1373dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 137417ab2063SBarry Smith { 1375416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1376fdc842d1SBarry Smith PetscInt i,j,n,*ai=a->i,*aj=a->j; 1377c898d852SStefano Zampini PetscScalar *x; 1378c898d852SStefano Zampini const PetscScalar *aa; 137917ab2063SBarry Smith 13803a40ed3dSBarry Smith PetscFunctionBegin; 13819566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 138208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 13839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1384d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1385d3e70bfaSHong Zhang PetscInt *diag=a->diag; 13869566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 13872c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 13889566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 13899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 139035e7444dSHong Zhang PetscFunctionReturn(0); 139135e7444dSHong Zhang } 139235e7444dSHong Zhang 13939566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 139435e7444dSHong Zhang for (i=0; i<n; i++) { 1395fdc842d1SBarry Smith x[i] = 0.0; 139635e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 139735e7444dSHong Zhang if (aj[j] == i) { 139835e7444dSHong Zhang x[i] = aa[j]; 139917ab2063SBarry Smith break; 140017ab2063SBarry Smith } 
140117ab2063SBarry Smith } 140217ab2063SBarry Smith } 14039566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 14049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14053a40ed3dSBarry Smith PetscFunctionReturn(0); 140617ab2063SBarry Smith } 140717ab2063SBarry Smith 1408c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1409dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 141017ab2063SBarry Smith { 1411416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 14125f22a7b3SSebastian Grimberg const MatScalar *aa; 1413d9ca1df4SBarry Smith PetscScalar *y; 1414d9ca1df4SBarry Smith const PetscScalar *x; 1415d0f46423SBarry Smith PetscInt m = A->rmap->n; 14165c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14175f22a7b3SSebastian Grimberg const MatScalar *v; 1418a77337e4SBarry Smith PetscScalar alpha; 1419d9ca1df4SBarry Smith PetscInt n,i,j; 1420d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 14213447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1422ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14235c897100SBarry Smith #endif 142417ab2063SBarry Smith 14253a40ed3dSBarry Smith PetscFunctionBegin; 14269566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz,yy)); 14279566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14289566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 14299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 14305c897100SBarry Smith 14315c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1432fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,aa,y); 14335c897100SBarry Smith #else 14343447b6efSHong Zhang if (usecprow) { 14353447b6efSHong Zhang m = cprow.nrows; 14363447b6efSHong Zhang ii = cprow.i; 14377b2bb3b9SHong Zhang ridx = cprow.rindex; 14383447b6efSHong Zhang } else { 14393447b6efSHong Zhang ii = a->i; 
14403447b6efSHong Zhang } 144117ab2063SBarry Smith for (i=0; i<m; i++) { 14423447b6efSHong Zhang idx = a->j + ii[i]; 1443fff043a9SJunchao Zhang v = aa + ii[i]; 14443447b6efSHong Zhang n = ii[i+1] - ii[i]; 14453447b6efSHong Zhang if (usecprow) { 14467b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14473447b6efSHong Zhang } else { 144817ab2063SBarry Smith alpha = x[i]; 14493447b6efSHong Zhang } 145004fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 145117ab2063SBarry Smith } 14525c897100SBarry Smith #endif 14539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 14549566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 14559566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 14569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14573a40ed3dSBarry Smith PetscFunctionReturn(0); 145817ab2063SBarry Smith } 145917ab2063SBarry Smith 1460dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 14615c897100SBarry Smith { 14625c897100SBarry Smith PetscFunctionBegin; 14639566063dSJacob Faibussowitsch PetscCall(VecSet(yy,0.0)); 14649566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy)); 14655c897100SBarry Smith PetscFunctionReturn(0); 14665c897100SBarry Smith } 14675c897100SBarry Smith 1468c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146978b84d54SShri Abhyankar 1470dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 147117ab2063SBarry Smith { 1472416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1473d9fead3dSBarry Smith PetscScalar *y; 147454f21887SBarry Smith const PetscScalar *x; 1475fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1476003131ecSBarry Smith PetscInt m=A->rmap->n; 14770298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 14787b083b7cSBarry Smith PetscInt n,i; 1479362ced78SSatish Balay PetscScalar sum; 1480ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 
148117ab2063SBarry Smith 1482b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 148397952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1484fee21e36SBarry Smith #endif 1485fee21e36SBarry Smith 14863a40ed3dSBarry Smith PetscFunctionBegin; 1487b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14889566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A,xx,yy)); 1489b215bc84SStefano Zampini PetscFunctionReturn(0); 1490b215bc84SStefano Zampini } 14919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 14929566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14939566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1494416022c9SBarry Smith ii = a->i; 14954eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y,m)); 149797952fefSHong Zhang m = a->compressedrow.nrows; 149897952fefSHong Zhang ii = a->compressedrow.i; 149997952fefSHong Zhang ridx = a->compressedrow.rindex; 150097952fefSHong Zhang for (i=0; i<m; i++) { 150197952fefSHong Zhang n = ii[i+1] - ii[i]; 150297952fefSHong Zhang aj = a->j + ii[i]; 1503fff043a9SJunchao Zhang aa = a_a + ii[i]; 150497952fefSHong Zhang sum = 0.0; 1505003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1506003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150797952fefSHong Zhang y[*ridx++] = sum; 150897952fefSHong Zhang } 150997952fefSHong Zhang } else { /* do not use compressed row format */ 1510b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15113d3eaba7SBarry Smith aj = a->j; 1512fff043a9SJunchao Zhang aa = a_a; 1513b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1514b05257ddSBarry Smith #else 151517ab2063SBarry Smith for (i=0; i<m; i++) { 1516003131ecSBarry Smith n = ii[i+1] - ii[i]; 1517003131ecSBarry Smith aj = a->j + ii[i]; 1518fff043a9SJunchao Zhang aa = a_a + ii[i]; 151917ab2063SBarry Smith sum = 0.0; 1520003131ecSBarry Smith 
PetscSparseDensePlusDot(sum,x,aa,aj,n); 152117ab2063SBarry Smith y[i] = sum; 152217ab2063SBarry Smith } 15238d195f9aSBarry Smith #endif 1524b05257ddSBarry Smith } 15259566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - a->nonzerorowcnt)); 15269566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15279566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 15293a40ed3dSBarry Smith PetscFunctionReturn(0); 153017ab2063SBarry Smith } 153117ab2063SBarry Smith 1532b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1533b434eb95SMatthew G. Knepley { 1534b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1535b434eb95SMatthew G. Knepley PetscScalar *y; 1536b434eb95SMatthew G. Knepley const PetscScalar *x; 1537fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1538b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1539b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1540b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1541b434eb95SMatthew G. Knepley PetscScalar sum; 1542b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1543b434eb95SMatthew G. Knepley 1544b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1545b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1546b434eb95SMatthew G. Knepley #endif 1547b434eb95SMatthew G. Knepley 1548b434eb95SMatthew G. Knepley PetscFunctionBegin; 15499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15509566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15519566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1552b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1553b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1554b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1555b434eb95SMatthew G. 
Knepley ridx = a->compressedrow.rindex; 1556b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1557b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1558b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1559fff043a9SJunchao Zhang aa = a_a + ii[i]; 1560b434eb95SMatthew G. Knepley sum = 0.0; 1561b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1562b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1563b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1564b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1565b434eb95SMatthew G. Knepley } 1566b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15673d3eaba7SBarry Smith ii = a->i; 1568b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1569b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1570b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1571fff043a9SJunchao Zhang aa = a_a + ii[i]; 1572b434eb95SMatthew G. Knepley sum = 0.0; 1573b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1574b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1575b434eb95SMatthew G. Knepley y[i] = sum; 1576b434eb95SMatthew G. Knepley } 1577b434eb95SMatthew G. Knepley } 15789566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - nonzerorow)); 15799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15809566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1582b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1583b434eb95SMatthew G. Knepley } 1584b434eb95SMatthew G. Knepley 1585b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1586b434eb95SMatthew G. Knepley { 1587b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1588b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1589b434eb95SMatthew G. Knepley const PetscScalar *x; 1590fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1591b434eb95SMatthew G. 
Knepley PetscInt m = A->rmap->n,*aj,*ii; 1592b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1593b434eb95SMatthew G. Knepley PetscScalar sum; 1594b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1595b434eb95SMatthew G. Knepley 1596b434eb95SMatthew G. Knepley PetscFunctionBegin; 15979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15989566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15999566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 1600b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1601b434eb95SMatthew G. Knepley if (zz != yy) { 16029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 1603b434eb95SMatthew G. Knepley } 1604b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1605b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1606b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1607b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1608b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1609b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1610fff043a9SJunchao Zhang aa = a_a + ii[i]; 1611b434eb95SMatthew G. Knepley sum = y[*ridx]; 1612b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1613b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1614b434eb95SMatthew G. Knepley } 1615b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16163d3eaba7SBarry Smith ii = a->i; 1617b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1618b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1619b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1620fff043a9SJunchao Zhang aa = a_a + ii[i]; 1621b434eb95SMatthew G. Knepley sum = y[i]; 1622b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1623b434eb95SMatthew G. Knepley z[i] = sum; 1624b434eb95SMatthew G. Knepley } 1625b434eb95SMatthew G. 
Knepley } 16269566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1630b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1631b434eb95SMatthew G. Knepley } 1632b434eb95SMatthew G. Knepley 1633c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1634dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 163517ab2063SBarry Smith { 1636416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1637f15663dcSBarry Smith PetscScalar *y,*z; 1638f15663dcSBarry Smith const PetscScalar *x; 1639fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1640d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1641d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1642362ced78SSatish Balay PetscScalar sum; 1643ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 16449ea0dfa2SSatish Balay 16453a40ed3dSBarry Smith PetscFunctionBegin; 1646b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16479566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A,xx,yy,zz)); 1648b215bc84SStefano Zampini PetscFunctionReturn(0); 1649b215bc84SStefano Zampini } 16509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16519566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16529566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 16534eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 16544eb6d288SHong Zhang if (zz != yy) { 16559566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 16564eb6d288SHong Zhang } 165797952fefSHong Zhang m = a->compressedrow.nrows; 165897952fefSHong Zhang ii = a->compressedrow.i; 165997952fefSHong Zhang ridx = a->compressedrow.rindex; 166097952fefSHong Zhang for (i=0; i<m; i++) { 
166197952fefSHong Zhang n = ii[i+1] - ii[i]; 166297952fefSHong Zhang aj = a->j + ii[i]; 1663fff043a9SJunchao Zhang aa = a_a + ii[i]; 166497952fefSHong Zhang sum = y[*ridx]; 1665f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 166697952fefSHong Zhang z[*ridx++] = sum; 166797952fefSHong Zhang } 166897952fefSHong Zhang } else { /* do not use compressed row format */ 16693d3eaba7SBarry Smith ii = a->i; 1670f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16713d3eaba7SBarry Smith aj = a->j; 1672fff043a9SJunchao Zhang aa = a_a; 1673f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1674f15663dcSBarry Smith #else 167517ab2063SBarry Smith for (i=0; i<m; i++) { 1676f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1677f15663dcSBarry Smith aj = a->j + ii[i]; 1678fff043a9SJunchao Zhang aa = a_a + ii[i]; 167917ab2063SBarry Smith sum = y[i]; 1680f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 168117ab2063SBarry Smith z[i] = sum; 168217ab2063SBarry Smith } 168302ab625aSSatish Balay #endif 1684f15663dcSBarry Smith } 16859566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16869566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 16893a40ed3dSBarry Smith PetscFunctionReturn(0); 169017ab2063SBarry Smith } 169117ab2063SBarry Smith 169217ab2063SBarry Smith /* 169317ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
169417ab2063SBarry Smith */ 1695dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 169617ab2063SBarry Smith { 1697416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1698d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 1699c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 170017ab2063SBarry Smith 17013a40ed3dSBarry Smith PetscFunctionBegin; 170209f38230SBarry Smith if (!a->diag) { 17039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&a->diag)); 17049566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt))); 1705c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 170609f38230SBarry Smith } 1707d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1708c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1709c0c07093SJunchao Zhang if (alreadySet) { 1710c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1711c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i+1] && a->j[pos] == i) continue; 1712c0c07093SJunchao Zhang } 1713c0c07093SJunchao Zhang 171409f38230SBarry Smith a->diag[i] = a->i[i+1]; 1715bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1716bfeeae90SHong Zhang if (a->j[j] == i) { 171709f38230SBarry Smith a->diag[i] = j; 171817ab2063SBarry Smith break; 171917ab2063SBarry Smith } 172017ab2063SBarry Smith } 172117ab2063SBarry Smith } 17223a40ed3dSBarry Smith PetscFunctionReturn(0); 172317ab2063SBarry Smith } 172417ab2063SBarry Smith 172561ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 172661ecd0c6SBarry Smith { 172761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 172861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 172961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 173061ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 173161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 173261ecd0c6SBarry Smith 
173361ecd0c6SBarry Smith PetscFunctionBegin; 173461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A,1,NULL)); 17369566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 173761ecd0c6SBarry Smith PetscFunctionReturn(0); 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith 174061ecd0c6SBarry Smith if (a->diagonaldense) { 174161ecd0c6SBarry Smith cnt = 0; 174261ecd0c6SBarry Smith } else { 17439566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&mdiag)); 174461ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 1745349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i+1]) { /* 'out of range' rows never have diagonals */ 174661ecd0c6SBarry Smith cnt++; 174761ecd0c6SBarry Smith mdiag[i] = 1; 174861ecd0c6SBarry Smith } 174961ecd0c6SBarry Smith } 175061ecd0c6SBarry Smith } 175161ecd0c6SBarry Smith if (!cnt) { 17529566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 175361ecd0c6SBarry Smith } else { 1754b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1755b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 175661ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 175761ecd0c6SBarry Smith 175861ecd0c6SBarry Smith a->a = NULL; 175961ecd0c6SBarry Smith a->j = NULL; 176061ecd0c6SBarry Smith a->i = NULL; 176161ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1762349d3b71SJunchao Zhang for (i=0; i<PetscMin(A->rmap->n,A->cmap->n); i++) { 176361ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 176461ecd0c6SBarry Smith } 17659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax)); 176661ecd0c6SBarry Smith 176761ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176861ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 
17699566063dSJacob Faibussowitsch PetscCall(MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES)); 1770447d62f5SStefano Zampini if (i < A->cmap->n) { 17719566063dSJacob Faibussowitsch PetscCall(MatSetValue(A,i,i,v,ADD_VALUES)); 177261ecd0c6SBarry Smith } 1773447d62f5SStefano Zampini } 17749566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY)); 17759566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY)); 177661ecd0c6SBarry Smith if (singlemalloc) { 17779566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda,oldj,oldi)); 177861ecd0c6SBarry Smith } else { 17799566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17809566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17819566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 178261ecd0c6SBarry Smith } 178361ecd0c6SBarry Smith } 17849566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 178561ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 178661ecd0c6SBarry Smith PetscFunctionReturn(0); 178761ecd0c6SBarry Smith } 178861ecd0c6SBarry Smith 1789be5855fcSBarry Smith /* 1790be5855fcSBarry Smith Checks for missing diagonals 1791be5855fcSBarry Smith */ 1792ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1793be5855fcSBarry Smith { 1794be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17957734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1796be5855fcSBarry Smith 1797be5855fcSBarry Smith PetscFunctionBegin; 179809f38230SBarry Smith *missing = PETSC_FALSE; 17997734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 180009f38230SBarry Smith *missing = PETSC_TRUE; 180109f38230SBarry Smith if (d) *d = 0; 18029566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n")); 180309f38230SBarry Smith } else { 180401445905SHong Zhang PetscInt n; 180501445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1806f1e2ffcdSBarry Smith diag = a->diag; 180701445905SHong Zhang for (i=0; i<n; i++) { 18087734d3b5SMatthew G. Knepley if (diag[i] >= ii[i+1]) { 180909f38230SBarry Smith *missing = PETSC_TRUE; 181009f38230SBarry Smith if (d) *d = i; 18119566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix is missing diagonal number %" PetscInt_FMT "\n",i)); 1812358d2f5dSShri Abhyankar break; 181309f38230SBarry Smith } 1814be5855fcSBarry Smith } 1815be5855fcSBarry Smith } 1816be5855fcSBarry Smith PetscFunctionReturn(0); 1817be5855fcSBarry Smith } 1818be5855fcSBarry Smith 18190da83c2eSBarry Smith #include <petscblaslapack.h> 18200da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18210da83c2eSBarry Smith 18220da83c2eSBarry Smith /* 18230da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18240da83c2eSBarry Smith */ 18250da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 18260da83c2eSBarry Smith { 18270da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 18280da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 18290da83c2eSBarry Smith const PetscReal shift = 0.0; 18300da83c2eSBarry Smith PetscInt ipvt[5]; 18310da83c2eSBarry Smith PetscScalar work[25],*v_work; 18320da83c2eSBarry Smith 18330da83c2eSBarry Smith PetscFunctionBegin; 18340da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18350da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 183608401ef6SPierre Jolivet 
PetscCheck(ncnt == n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT,ncnt,n); 18370da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18380da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 18390da83c2eSBarry Smith } 18409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax,&indx)); 18410da83c2eSBarry Smith if (bsizemax > 7) { 18429566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots)); 18430da83c2eSBarry Smith } 18440da83c2eSBarry Smith ncnt = 0; 18450da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18460da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 18479566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag)); 18480da83c2eSBarry Smith switch (bsizes[i]) { 18490da83c2eSBarry Smith case 1: 18500da83c2eSBarry Smith *diag = 1.0/(*diag); 18510da83c2eSBarry Smith break; 18520da83c2eSBarry Smith case 2: 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 18540da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18560da83c2eSBarry Smith break; 18570da83c2eSBarry Smith case 3: 18589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 18590da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18610da83c2eSBarry Smith break; 18620da83c2eSBarry Smith case 4: 18639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 18640da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18659566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18660da83c2eSBarry Smith break; 18670da83c2eSBarry Smith case 5: 18689566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 18690da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18710da83c2eSBarry Smith break; 18720da83c2eSBarry Smith case 6: 18739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 18740da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18759566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18760da83c2eSBarry Smith break; 18770da83c2eSBarry Smith case 7: 18789566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 18790da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18810da83c2eSBarry Smith break; 18820da83c2eSBarry Smith default: 18839566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 18840da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bsizes[i])); 18860da83c2eSBarry Smith } 18870da83c2eSBarry Smith ncnt += bsizes[i]; 18880da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 18890da83c2eSBarry Smith } 18900da83c2eSBarry Smith if (bsizemax > 7) { 18919566063dSJacob Faibussowitsch PetscCall(PetscFree2(v_work,v_pivots)); 18920da83c2eSBarry Smith } 18939566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18940da83c2eSBarry Smith PetscFunctionReturn(0); 
18950da83c2eSBarry Smith } 18960da83c2eSBarry Smith 1897422a814eSBarry Smith /* 1898422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1899422a814eSBarry Smith */ 19007087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 190171f1c65dSBarry Smith { 190271f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 1903d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 19042e5835c6SStefano Zampini const MatScalar *v; 190554f21887SBarry Smith PetscScalar *idiag,*mdiag; 190671f1c65dSBarry Smith 190771f1c65dSBarry Smith PetscFunctionBegin; 190871f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 19099566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 191071f1c65dSBarry Smith diag = a->diag; 191171f1c65dSBarry Smith if (!a->idiag) { 19129566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work)); 19139566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,3*m*sizeof(PetscScalar))); 191471f1c65dSBarry Smith } 19152e5835c6SStefano Zampini 191671f1c65dSBarry Smith mdiag = a->mdiag; 191771f1c65dSBarry Smith idiag = a->idiag; 19189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 1919422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 192071f1c65dSBarry Smith for (i=0; i<m; i++) { 192171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1922899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1923899639b0SHong Zhang if (PetscRealPart(fshift)) { 19249566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero diagonal on row %" PetscInt_FMT "\n",i)); 19257b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19267b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19277b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 192898921bdaSJacob Faibussowitsch } else 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %" PetscInt_FMT,i); 1929899639b0SHong Zhang } 193071f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 193171f1c65dSBarry Smith } 19329566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 193371f1c65dSBarry Smith } else { 193471f1c65dSBarry Smith for (i=0; i<m; i++) { 193571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 193671f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 193771f1c65dSBarry Smith } 19389566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*m)); 193971f1c65dSBarry Smith } 194071f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 194271f1c65dSBarry Smith PetscFunctionReturn(0); 194371f1c65dSBarry Smith } 194471f1c65dSBarry Smith 1945c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 194641f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 194717ab2063SBarry Smith { 1948416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1949e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 19502e5835c6SStefano Zampini const MatScalar *v,*idiag=NULL,*mdiag,*aa; 195154f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 19523d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 195397f1f81fSBarry Smith const PetscInt *idx,*diag; 195417ab2063SBarry Smith 19553a40ed3dSBarry Smith PetscFunctionBegin; 1956b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19579566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A,bb,omega,flag,fshift,its,lits,xx)); 1958b215bc84SStefano Zampini PetscFunctionReturn(0); 1959b215bc84SStefano Zampini } 1960b965ef7fSBarry Smith its = its*lits; 196191723122SBarry Smith 196271f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19639566063dSJacob 
Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A,omega,fshift)); 196471f1c65dSBarry Smith a->fshift = fshift; 196571f1c65dSBarry Smith a->omega = omega; 1966ed480e8bSBarry Smith 196771f1c65dSBarry Smith diag = a->diag; 196871f1c65dSBarry Smith t = a->ssor_work; 1969ed480e8bSBarry Smith idiag = a->idiag; 197071f1c65dSBarry Smith mdiag = a->mdiag; 1971ed480e8bSBarry Smith 19729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 19739566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx,&x)); 19749566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb,&b)); 1975ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 197617ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 197717ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1978ed480e8bSBarry Smith bs = b; 197917ab2063SBarry Smith for (i=0; i<m; i++) { 198071f1c65dSBarry Smith d = fshift + mdiag[i]; 1981416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1982ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19832e5835c6SStefano Zampini v = aa + diag[i] + 1; 198417ab2063SBarry Smith sum = b[i]*d/omega; 1985003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 198617ab2063SBarry Smith x[i] = sum; 198717ab2063SBarry Smith } 19889566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 19899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 19909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 19919566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19923a40ed3dSBarry Smith PetscFunctionReturn(0); 199317ab2063SBarry Smith } 1994c783ea89SBarry Smith 199508401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER,PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 1996f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19974c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 
1998887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 199917ab2063SBarry Smith 200017ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 200117ab2063SBarry Smith 2002887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 200317ab2063SBarry Smith */ 200417ab2063SBarry Smith scale = (2.0/omega) - 1.0; 200517ab2063SBarry Smith 200617ab2063SBarry Smith /* x = (E + U)^{-1} b */ 200717ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2008416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2009ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20102e5835c6SStefano Zampini v = aa + diag[i] + 1; 201117ab2063SBarry Smith sum = b[i]; 2012e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2013ed480e8bSBarry Smith x[i] = sum*idiag[i]; 201417ab2063SBarry Smith } 201517ab2063SBarry Smith 201617ab2063SBarry Smith /* t = b - (2*E - D)x */ 20172e5835c6SStefano Zampini v = aa; 20182205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 201917ab2063SBarry Smith 202017ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2021ed480e8bSBarry Smith ts = t; 2022416022c9SBarry Smith diag = a->diag; 202317ab2063SBarry Smith for (i=0; i<m; i++) { 2024416022c9SBarry Smith n = diag[i] - a->i[i]; 2025ed480e8bSBarry Smith idx = a->j + a->i[i]; 20262e5835c6SStefano Zampini v = aa + a->i[i]; 202717ab2063SBarry Smith sum = t[i]; 2028003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 2029ed480e8bSBarry Smith t[i] = sum*idiag[i]; 2030733d66baSBarry Smith /* x = x + t */ 2031733d66baSBarry Smith x[i] += t[i]; 203217ab2063SBarry Smith } 203317ab2063SBarry Smith 20349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0*m-1 + 2.0*a->nz)); 20359566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 20369566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 20373a40ed3dSBarry Smith PetscFunctionReturn(0); 203817ab2063SBarry Smith } 203917ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 204017ab2063SBarry Smith if 
(flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204117ab2063SBarry Smith for (i=0; i<m; i++) { 2042416022c9SBarry Smith n = diag[i] - a->i[i]; 2043ed480e8bSBarry Smith idx = a->j + a->i[i]; 20442e5835c6SStefano Zampini v = aa + a->i[i]; 204517ab2063SBarry Smith sum = b[i]; 2046e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20475c99c7daSBarry Smith t[i] = sum; 2048ed480e8bSBarry Smith x[i] = sum*idiag[i]; 204917ab2063SBarry Smith } 20505c99c7daSBarry Smith xb = t; 20519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20523a40ed3dSBarry Smith } else xb = b; 205317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205417ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2055416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2056ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20572e5835c6SStefano Zampini v = aa + diag[i] + 1; 205817ab2063SBarry Smith sum = xb[i]; 2059e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20605c99c7daSBarry Smith if (xb == b) { 2061ed480e8bSBarry Smith x[i] = sum*idiag[i]; 20625c99c7daSBarry Smith } else { 2063b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 206417ab2063SBarry Smith } 20655c99c7daSBarry Smith } 20669566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 206717ab2063SBarry Smith } 206817ab2063SBarry Smith its--; 206917ab2063SBarry Smith } 207017ab2063SBarry Smith while (its--) { 207117ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 207217ab2063SBarry Smith for (i=0; i<m; i++) { 2073b19a5dc2SMark Adams /* lower */ 2074b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2075ed480e8bSBarry Smith idx = a->j + a->i[i]; 20762e5835c6SStefano Zampini v = aa + a->i[i]; 207717ab2063SBarry Smith sum = b[i]; 2078e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2079b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 
2080b19a5dc2SMark Adams /* upper */ 2081b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2082b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20832e5835c6SStefano Zampini v = aa + diag[i] + 1; 2084b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2085b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 208617ab2063SBarry Smith } 2087b19a5dc2SMark Adams xb = t; 20889566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2089b19a5dc2SMark Adams } else xb = b; 209017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 209117ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2092b19a5dc2SMark Adams sum = xb[i]; 2093b19a5dc2SMark Adams if (xb == b) { 2094b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2095416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 2096ed480e8bSBarry Smith idx = a->j + a->i[i]; 20972e5835c6SStefano Zampini v = aa + a->i[i]; 2098e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2099ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 2100b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2101b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2102b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 21032e5835c6SStefano Zampini v = aa + diag[i] + 1; 2104b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2105b19a5dc2SMark Adams x[i] = (1. 
- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 210617ab2063SBarry Smith } 2107b19a5dc2SMark Adams } 2108b19a5dc2SMark Adams if (xb == b) { 21099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2110b19a5dc2SMark Adams } else { 21119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2112b19a5dc2SMark Adams } 211317ab2063SBarry Smith } 211417ab2063SBarry Smith } 21159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 21169566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 21179566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 2118365a8a9eSBarry Smith PetscFunctionReturn(0); 211917ab2063SBarry Smith } 212017ab2063SBarry Smith 2121dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 212217ab2063SBarry Smith { 2123416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21244e220ebcSLois Curfman McInnes 21253a40ed3dSBarry Smith PetscFunctionBegin; 21264e220ebcSLois Curfman McInnes info->block_size = 1.0; 21273966268fSBarry Smith info->nz_allocated = a->maxnz; 21283966268fSBarry Smith info->nz_used = a->nz; 21293966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21303966268fSBarry Smith info->assemblies = A->num_ass; 21313966268fSBarry Smith info->mallocs = A->info.mallocs; 21327adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2133d5f3da31SBarry Smith if (A->factortype) { 21344e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21354e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21364e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21374e220ebcSLois Curfman McInnes } else { 21384e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21394e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21404e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21414e220ebcSLois Curfman McInnes } 21423a40ed3dSBarry 
Smith PetscFunctionReturn(0); 214317ab2063SBarry Smith } 214417ab2063SBarry Smith 21452b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 214617ab2063SBarry Smith { 2147416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2148c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 214997b48c8fSBarry Smith const PetscScalar *xx; 21502e5835c6SStefano Zampini PetscScalar *bb,*aa; 2151c7da8527SEric Chamberland PetscInt d = 0; 215217ab2063SBarry Smith 21533a40ed3dSBarry Smith PetscFunctionBegin; 215497b48c8fSBarry Smith if (x && b) { 21559566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 21569566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 215797b48c8fSBarry Smith for (i=0; i<N; i++) { 2158aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2159447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216097b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 216197b48c8fSBarry Smith } 21629566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 21639566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 216497b48c8fSBarry Smith } 216597b48c8fSBarry Smith 21669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 2167a9817697SBarry Smith if (a->keepnonzeropattern) { 2168f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2169aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21709566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 2171f1e2ffcdSBarry Smith } 2172f4df32b1SMatthew Knepley if (diag != 0.0) { 2173c7da8527SEric Chamberland for (i=0; i<N; i++) { 2174c7da8527SEric Chamberland d = rows[i]; 2175447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 217608401ef6SPierre Jolivet 
PetscCheck(a->diag[d] < a->i[d+1],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT,d); 2177c7da8527SEric Chamberland } 2178f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2179447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21802e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2181f1e2ffcdSBarry Smith } 2182f1e2ffcdSBarry Smith } 2183f1e2ffcdSBarry Smith } else { 2184f4df32b1SMatthew Knepley if (diag != 0.0) { 218517ab2063SBarry Smith for (i=0; i<N; i++) { 2186aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21877ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2188447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2189447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2190447d62f5SStefano Zampini } else { 2191416022c9SBarry Smith a->ilen[rows[i]] = 1; 21922e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2193bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2194447d62f5SStefano Zampini } 2195447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21969566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 219717ab2063SBarry Smith } 219817ab2063SBarry Smith } 21993a40ed3dSBarry Smith } else { 220017ab2063SBarry Smith for (i=0; i<N; i++) { 2201aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2202416022c9SBarry Smith a->ilen[rows[i]] = 0; 220317ab2063SBarry Smith } 220417ab2063SBarry Smith } 2205e56f5c9eSBarry Smith A->nonzerostate++; 2206f1e2ffcdSBarry Smith } 22079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 2208*dbbe0bcdSBarry Smith PetscUseTypeMethod(A,assemblyend ,MAT_FINAL_ASSEMBLY); 22093a40ed3dSBarry Smith PetscFunctionReturn(0); 221017ab2063SBarry Smith } 
221117ab2063SBarry Smith 22126e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 22136e169961SBarry Smith { 22146e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22156e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 22162b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 22176e169961SBarry Smith const PetscScalar *xx; 22182e5835c6SStefano Zampini PetscScalar *bb,*aa; 22196e169961SBarry Smith 22206e169961SBarry Smith PetscFunctionBegin; 22212e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 22229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 22236e169961SBarry Smith if (x && b) { 22249566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 22259566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 22262b40b63fSBarry Smith vecs = PETSC_TRUE; 22276e169961SBarry Smith } 22289566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&zeroed)); 22296e169961SBarry Smith for (i=0; i<N; i++) { 2230aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 22319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 22322205254eSKarl Rupp 22336e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22346e169961SBarry Smith } 22356e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 22366e169961SBarry Smith if (!zeroed[i]) { 22376e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 22384cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22392e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j]*xx[a->j[j]]; 22402e5835c6SStefano Zampini aa[j] = 0.0; 22416e169961SBarry Smith } 22426e169961SBarry Smith } 22434cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 22446e169961SBarry Smith } 22456e169961SBarry Smith if (x && b) { 22469566063dSJacob Faibussowitsch 
PetscCall(VecRestoreArrayRead(x,&xx)); 22479566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 22486e169961SBarry Smith } 22499566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22506e169961SBarry Smith if (diag != 0.0) { 22519566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A,&missing,&d)); 22521d5a398dSstefano_zampini if (missing) { 22531d5a398dSstefano_zampini for (i=0; i<N; i++) { 22544cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2255aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")",d,rows[i]); 22569566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 22571d5a398dSstefano_zampini } 22581d5a398dSstefano_zampini } else { 22596e169961SBarry Smith for (i=0; i<N; i++) { 22602e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 22616e169961SBarry Smith } 22626e169961SBarry Smith } 22631d5a398dSstefano_zampini } 22649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 2265*dbbe0bcdSBarry Smith PetscUseTypeMethod(A,assemblyend ,MAT_FINAL_ASSEMBLY); 22666e169961SBarry Smith PetscFunctionReturn(0); 22676e169961SBarry Smith } 22686e169961SBarry Smith 2269a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 227017ab2063SBarry Smith { 2271fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2272fff043a9SJunchao Zhang const PetscScalar *aa; 2273fff043a9SJunchao Zhang PetscInt *itmp; 227417ab2063SBarry Smith 22753a40ed3dSBarry Smith PetscFunctionBegin; 22769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 2277416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 22782e5835c6SStefano Zampini if (v) *v = (PetscScalar*)(aa + a->i[row]); 227917ab2063SBarry Smith if (idx) { 2280bfeeae90SHong Zhang itmp = a->j + a->i[row]; 228126fbe8dcSKarl Rupp 
if (*nz) *idx = itmp; 2282f4259b30SLisandro Dalcin else *idx = NULL; 228317ab2063SBarry Smith } 22849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 22853a40ed3dSBarry Smith PetscFunctionReturn(0); 228617ab2063SBarry Smith } 228717ab2063SBarry Smith 2288a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 228917ab2063SBarry Smith { 22903a40ed3dSBarry Smith PetscFunctionBegin; 2291cb4a9cd9SHong Zhang if (nz) *nz = 0; 22922e5835c6SStefano Zampini if (idx) *idx = NULL; 22932e5835c6SStefano Zampini if (v) *v = NULL; 22943a40ed3dSBarry Smith PetscFunctionReturn(0); 229517ab2063SBarry Smith } 229617ab2063SBarry Smith 2297dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 229817ab2063SBarry Smith { 2299416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 23002e5835c6SStefano Zampini const MatScalar *v; 230136db0b34SBarry Smith PetscReal sum = 0.0; 230297f1f81fSBarry Smith PetscInt i,j; 230317ab2063SBarry Smith 23043a40ed3dSBarry Smith PetscFunctionBegin; 23059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 230617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2307570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2308570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 2309792fecdfSBarry Smith PetscCallBLAS("BLASnrm2",*nrm = BLASnrm2_(&nz,v,&one)); 2310570b7f6dSBarry Smith #else 2311416022c9SBarry Smith for (i=0; i<a->nz; i++) { 231236db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 231317ab2063SBarry Smith } 23148f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2315570b7f6dSBarry Smith #endif 23169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 23173a40ed3dSBarry Smith } else if (type == NORM_1) { 231836db0b34SBarry Smith PetscReal *tmp; 231997f1f81fSBarry Smith PetscInt *jj = a->j; 23209566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n+1,&tmp)); 2321064f8208SBarry 
Smith *nrm = 0.0; 2322416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2323bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 232417ab2063SBarry Smith } 2325d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2326064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 232717ab2063SBarry Smith } 23289566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 23303a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2331064f8208SBarry Smith *nrm = 0.0; 2332d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 23332e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 233417ab2063SBarry Smith sum = 0.0; 2335416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 23362e5835c6SStefano Zampini sum += PetscAbsScalar(*v2); v2++; 233717ab2063SBarry Smith } 2338064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 233917ab2063SBarry Smith } 23409566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 2341f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 23429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 23433a40ed3dSBarry Smith PetscFunctionReturn(0); 234417ab2063SBarry Smith } 234517ab2063SBarry Smith 23467087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2347cd0d46ebSvictorle { 23483d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 234954f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 23502e5835c6SStefano Zampini const MatScalar *va,*vb; 235197f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2352cd0d46ebSvictorle 2353cd0d46ebSvictorle PetscFunctionBegin; 23549566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 23559566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 23565485867bSBarry Smith if (ma!=nb || na!=mb) { 23575485867bSBarry Smith *f = PETSC_FALSE; 23585485867bSBarry Smith 
PetscFunctionReturn(0); 23595485867bSBarry Smith } 23609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&va)); 23619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&vb)); 2362cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2363cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 23649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 23659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 2366cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2367cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2368cd0d46ebSvictorle 2369cd0d46ebSvictorle *f = PETSC_TRUE; 2370cd0d46ebSvictorle for (i=0; i<ma; i++) { 2371cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 237297f1f81fSBarry Smith PetscInt idc,idr; 23735485867bSBarry Smith PetscScalar vc,vr; 2374cd0d46ebSvictorle /* column/row index/value */ 23755485867bSBarry Smith idc = adx[aptr[i]]; 23765485867bSBarry Smith idr = bdx[bptr[idc]]; 23775485867bSBarry Smith vc = va[aptr[i]]; 23785485867bSBarry Smith vr = vb[bptr[idc]]; 23795485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 23805485867bSBarry Smith *f = PETSC_FALSE; 23815485867bSBarry Smith goto done; 2382cd0d46ebSvictorle } else { 23835485867bSBarry Smith aptr[i]++; 23845485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2385cd0d46ebSvictorle } 2386cd0d46ebSvictorle } 2387cd0d46ebSvictorle } 2388cd0d46ebSvictorle done: 23899566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23909566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&va)); 23929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&vb)); 2393cd0d46ebSvictorle PetscFunctionReturn(0); 2394cd0d46ebSvictorle } 2395cd0d46ebSvictorle 23967087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 23971cbb95d3SBarry Smith { 23983d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = 
(Mat_SeqAIJ*) B->data; 239954f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 240054f21887SBarry Smith MatScalar *va,*vb; 24011cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 24021cbb95d3SBarry Smith 24031cbb95d3SBarry Smith PetscFunctionBegin; 24049566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24059566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24061cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 24071cbb95d3SBarry Smith *f = PETSC_FALSE; 24081cbb95d3SBarry Smith PetscFunctionReturn(0); 24091cbb95d3SBarry Smith } 24101cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 24111cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 24121cbb95d3SBarry Smith va = aij->a; vb = bij->a; 24139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 24151cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 24161cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 24171cbb95d3SBarry Smith 24181cbb95d3SBarry Smith *f = PETSC_TRUE; 24191cbb95d3SBarry Smith for (i=0; i<ma; i++) { 24201cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 24211cbb95d3SBarry Smith PetscInt idc,idr; 24221cbb95d3SBarry Smith PetscScalar vc,vr; 24231cbb95d3SBarry Smith /* column/row index/value */ 24241cbb95d3SBarry Smith idc = adx[aptr[i]]; 24251cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24261cbb95d3SBarry Smith vc = va[aptr[i]]; 24271cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24281cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 24291cbb95d3SBarry Smith *f = PETSC_FALSE; 24301cbb95d3SBarry Smith goto done; 24311cbb95d3SBarry Smith } else { 24321cbb95d3SBarry Smith aptr[i]++; 24331cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 24341cbb95d3SBarry Smith } 24351cbb95d3SBarry Smith } 24361cbb95d3SBarry Smith } 24371cbb95d3SBarry Smith done: 24389566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24399566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
24401cbb95d3SBarry Smith PetscFunctionReturn(0); 24411cbb95d3SBarry Smith } 24421cbb95d3SBarry Smith 2443ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24449e29f15eSvictorle { 24459e29f15eSvictorle PetscFunctionBegin; 24469566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A,A,tol,f)); 24479e29f15eSvictorle PetscFunctionReturn(0); 24489e29f15eSvictorle } 24499e29f15eSvictorle 2450ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24511cbb95d3SBarry Smith { 24521cbb95d3SBarry Smith PetscFunctionBegin; 24539566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A,A,tol,f)); 24541cbb95d3SBarry Smith PetscFunctionReturn(0); 24551cbb95d3SBarry Smith } 24561cbb95d3SBarry Smith 2457dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 245817ab2063SBarry Smith { 2459416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2460fff8e43fSBarry Smith const PetscScalar *l,*r; 2461fff8e43fSBarry Smith PetscScalar x; 246254f21887SBarry Smith MatScalar *v; 2463fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2464fff8e43fSBarry Smith const PetscInt *jj; 246517ab2063SBarry Smith 24663a40ed3dSBarry Smith PetscFunctionBegin; 246717ab2063SBarry Smith if (ll) { 24683ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24693ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24709566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll,&m)); 247108401ef6SPierre Jolivet PetscCheck(m == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 24729566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll,&l)); 24739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 247417ab2063SBarry Smith for (i=0; i<m; i++) { 247517ab2063SBarry Smith x = l[i]; 2476416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 24772205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= 
x; 247817ab2063SBarry Smith } 24799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll,&l)); 24809566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 248217ab2063SBarry Smith } 248317ab2063SBarry Smith if (rr) { 24849566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr,&n)); 248508401ef6SPierre Jolivet PetscCheck(n == A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 24869566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr,&r)); 24879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 24882e5835c6SStefano Zampini jj = a->j; 24892205254eSKarl Rupp for (i=0; i<nz; i++) (*v++) *= r[*jj++]; 24909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 24919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr,&r)); 24929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 249317ab2063SBarry Smith } 24949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24953a40ed3dSBarry Smith PetscFunctionReturn(0); 249617ab2063SBarry Smith } 249717ab2063SBarry Smith 24987dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 249917ab2063SBarry Smith { 2500db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 2501d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 250297f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 25035d0c19d7SBarry Smith const PetscInt *irow,*icol; 25042e5835c6SStefano Zampini const PetscScalar *aa; 25055d0c19d7SBarry Smith PetscInt nrows,ncols; 250697f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 250754f21887SBarry Smith MatScalar *a_new,*mat_a; 2508416022c9SBarry Smith Mat C; 2509cdc6f3adSToby Isaac PetscBool stride; 251017ab2063SBarry Smith 25113a40ed3dSBarry Smith 
PetscFunctionBegin; 25129566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow,&irow)); 25139566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow,&nrows)); 25149566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol,&ncols)); 251517ab2063SBarry Smith 25169566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride)); 2517ff718158SBarry Smith if (stride) { 25189566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol,&first,&step)); 2519ff718158SBarry Smith } else { 2520ff718158SBarry Smith first = 0; 2521ff718158SBarry Smith step = 0; 2522ff718158SBarry Smith } 2523fee21e36SBarry Smith if (stride && step == 1) { 252402834360SBarry Smith /* special case of contiguous rows */ 25259566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows,&lens,nrows,&starts)); 252602834360SBarry Smith /* loop over new rows determining lens and starting points */ 252702834360SBarry Smith for (i=0; i<nrows; i++) { 2528bfeeae90SHong Zhang kstart = ai[irow[i]]; 2529a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2530a91a9bebSLisandro Dalcin starts[i] = kstart; 253102834360SBarry Smith for (k=kstart; k<kend; k++) { 2532bfeeae90SHong Zhang if (aj[k] >= first) { 253302834360SBarry Smith starts[i] = k; 253402834360SBarry Smith break; 253502834360SBarry Smith } 253602834360SBarry Smith } 2537a2744918SBarry Smith sum = 0; 253802834360SBarry Smith while (k < kend) { 2539bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2540a2744918SBarry Smith sum++; 254102834360SBarry Smith } 2542a2744918SBarry Smith lens[i] = sum; 254302834360SBarry Smith } 254402834360SBarry Smith /* create submatrix */ 2545cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 254697f1f81fSBarry Smith PetscInt n_cols,n_rows; 25479566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B,&n_rows,&n_cols)); 2548aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 25499566063dSJacob 
Faibussowitsch PetscCall(MatZeroEntries(*B)); 255008480c60SBarry Smith C = *B; 25513a40ed3dSBarry Smith } else { 25523bef6203SJed Brown PetscInt rbs,cbs; 25539566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 25549566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 25559566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 25569566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 25579566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 25589566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 25599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 256008480c60SBarry Smith } 2561db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2562db02288aSLois Curfman McInnes 256302834360SBarry Smith /* loop over rows inserting into submatrix */ 2564db02288aSLois Curfman McInnes a_new = c->a; 2565db02288aSLois Curfman McInnes j_new = c->j; 2566db02288aSLois Curfman McInnes i_new = c->i; 25679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 256802834360SBarry Smith for (i=0; i<nrows; i++) { 2569a2744918SBarry Smith ii = starts[i]; 2570a2744918SBarry Smith lensi = lens[i]; 2571a2744918SBarry Smith for (k=0; k<lensi; k++) { 2572a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 257302834360SBarry Smith } 25749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new,aa + starts[i],lensi)); 2575a2744918SBarry Smith a_new += lensi; 2576a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2577a2744918SBarry Smith c->ilen[i] = lensi; 257802834360SBarry Smith } 25799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 25809566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens,starts)); 25813a40ed3dSBarry Smith } else { 25829566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol,&icol)); 25839566063dSJacob Faibussowitsch 
PetscCall(PetscCalloc1(oldcols,&smap)); 25849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1+nrows,&lens)); 25854dcab191SBarry Smith for (i=0; i<ncols; i++) { 25866bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT,i,icol[i],oldcols); 25874dcab191SBarry Smith smap[icol[i]] = i+1; 25884dcab191SBarry Smith } 25894dcab191SBarry Smith 259002834360SBarry Smith /* determine lens of each row */ 259102834360SBarry Smith for (i=0; i<nrows; i++) { 2592bfeeae90SHong Zhang kstart = ai[irow[i]]; 259302834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 259402834360SBarry Smith lens[i] = 0; 259502834360SBarry Smith for (k=kstart; k<kend; k++) { 2596bfeeae90SHong Zhang if (smap[aj[k]]) { 259702834360SBarry Smith lens[i]++; 259802834360SBarry Smith } 259902834360SBarry Smith } 260002834360SBarry Smith } 260117ab2063SBarry Smith /* Create and fill new matrix */ 2602a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2603ace3abfcSBarry Smith PetscBool equal; 26040f5bd95cSBarry Smith 260599141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2606aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 26079566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal)); 260828b400f6SJacob Faibussowitsch PetscCheck(equal,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. 
wrong no of nonzeros"); 26099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen,(*B)->rmap->n)); 261008480c60SBarry Smith C = *B; 26113a40ed3dSBarry Smith } else { 26123bef6203SJed Brown PetscInt rbs,cbs; 26139566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26149566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26159566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26169566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26179566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26189566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 262008480c60SBarry Smith } 26219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 262299141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 262317ab2063SBarry Smith for (i=0; i<nrows; i++) { 262499141d43SSatish Balay row = irow[i]; 2625bfeeae90SHong Zhang kstart = ai[row]; 262699141d43SSatish Balay kend = kstart + a->ilen[row]; 2627bfeeae90SHong Zhang mat_i = c->i[i]; 262899141d43SSatish Balay mat_j = c->j + mat_i; 262999141d43SSatish Balay mat_a = c->a + mat_i; 263099141d43SSatish Balay mat_ilen = c->ilen + i; 263117ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2632bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2633ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26342e5835c6SStefano Zampini *mat_a++ = aa[k]; 263599141d43SSatish Balay (*mat_ilen)++; 263699141d43SSatish Balay 263717ab2063SBarry Smith } 263817ab2063SBarry Smith } 263917ab2063SBarry Smith } 26409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 264102834360SBarry Smith /* Free work space */ 26429566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol,&icol)); 26439566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26449566063dSJacob Faibussowitsch 
PetscCall(PetscFree(lens)); 2645cdc6f3adSToby Isaac /* sort */ 2646cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2647cdc6f3adSToby Isaac PetscInt ilen; 2648cdc6f3adSToby Isaac 2649cdc6f3adSToby Isaac mat_i = c->i[i]; 2650cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2651cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2652cdc6f3adSToby Isaac ilen = c->ilen[i]; 26539566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen,mat_j,mat_a)); 2654cdc6f3adSToby Isaac } 265502834360SBarry Smith } 26568c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26579566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C,A->boundtocpu)); 2658305c6ccfSStefano Zampini #endif 26599566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY)); 26609566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY)); 266117ab2063SBarry Smith 26629566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow,&irow)); 2663416022c9SBarry Smith *B = C; 26643a40ed3dSBarry Smith PetscFunctionReturn(0); 266517ab2063SBarry Smith } 266617ab2063SBarry Smith 2667fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 266882d44351SHong Zhang { 266982d44351SHong Zhang Mat B; 267082d44351SHong Zhang 267182d44351SHong Zhang PetscFunctionBegin; 2672c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26739566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm,&B)); 26749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n)); 26759566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B,mat,mat)); 26769566063dSJacob Faibussowitsch PetscCall(MatSetType(B,MATSEQAIJ)); 26779566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE)); 267882d44351SHong Zhang *subMat = B; 2679c2d650bdSHong Zhang } else { 26809566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN)); 
2681c2d650bdSHong Zhang } 268282d44351SHong Zhang PetscFunctionReturn(0); 268382d44351SHong Zhang } 268482d44351SHong Zhang 26859a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2686a871dcd8SBarry Smith { 268763b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 268863b91edcSBarry Smith Mat outA; 2689ace3abfcSBarry Smith PetscBool row_identity,col_identity; 269063b91edcSBarry Smith 26913a40ed3dSBarry Smith PetscFunctionBegin; 269208401ef6SPierre Jolivet PetscCheck(info->levels == 0,PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 26931df811f5SHong Zhang 26949566063dSJacob Faibussowitsch PetscCall(ISIdentity(row,&row_identity)); 26959566063dSJacob Faibussowitsch PetscCall(ISIdentity(col,&col_identity)); 2696a871dcd8SBarry Smith 269763b91edcSBarry Smith outA = inA; 2698d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26999566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 27009566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype)); 27012205254eSKarl Rupp 27029566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 27039566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 27042205254eSKarl Rupp 2705c3122656SLisandro Dalcin a->row = row; 27062205254eSKarl Rupp 27079566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 27089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 27092205254eSKarl Rupp 2710c3122656SLisandro Dalcin a->col = col; 271163b91edcSBarry Smith 271236db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 27139566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27149566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col,PETSC_DECIDE,&a->icol)); 27159566063dSJacob Faibussowitsch PetscCall(PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol)); 2716f0ec6fceSSatish Balay 
271794a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n+1,&a->solve_work)); 27199566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar))); 272094a9d846SBarry Smith } 272163b91edcSBarry Smith 27229566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2723137fb511SHong Zhang if (row_identity && col_identity) { 27249566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info)); 2725137fb511SHong Zhang } else { 27269566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info)); 2727137fb511SHong Zhang } 27283a40ed3dSBarry Smith PetscFunctionReturn(0); 2729a871dcd8SBarry Smith } 2730a871dcd8SBarry Smith 2731f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2732f0b747eeSBarry Smith { 2733f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2734dfa0f9e5SStefano Zampini PetscScalar *v; 2735c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 27363a40ed3dSBarry Smith 27373a40ed3dSBarry Smith PetscFunctionBegin; 27389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA,&v)); 27399566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz,&bnz)); 2740792fecdfSBarry Smith PetscCallBLAS("BLASscal",BLASscal_(&bnz,&alpha,v,&one)); 27419566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA,&v)); 27439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27443a40ed3dSBarry Smith PetscFunctionReturn(0); 2745f0b747eeSBarry Smith } 2746f0b747eeSBarry Smith 2747f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 274816b64355SHong Zhang { 274916b64355SHong Zhang PetscInt i; 275016b64355SHong Zhang 275116b64355SHong Zhang PetscFunctionBegin; 275216b64355SHong Zhang if 
(!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27539566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr)); 275416b64355SHong Zhang 275516b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 27569566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->sbuf2[i])); 275716b64355SHong Zhang } 27589566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1)); 275916b64355SHong Zhang 276016b64355SHong Zhang if (submatj->rbuf1) { 27619566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27629566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 276316b64355SHong Zhang } 276416b64355SHong Zhang 276516b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 27669566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf3[i])); 276716b64355SHong Zhang } 27689566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3)); 27699566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 277016b64355SHong Zhang } 277116b64355SHong Zhang 277216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27739566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->rmap)); 27749566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27759566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 277616b64355SHong Zhang #else 27779566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 277816b64355SHong Zhang #endif 277916b64355SHong Zhang 278016b64355SHong Zhang if (!submatj->allcolumns) { 278116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27829566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->cmap)); 278316b64355SHong Zhang #else 27849566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 278516b64355SHong Zhang #endif 278616b64355SHong Zhang } 27879566063dSJacob 
Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 278816b64355SHong Zhang 27899566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 279016b64355SHong Zhang PetscFunctionReturn(0); 279116b64355SHong Zhang } 279216b64355SHong Zhang 27930fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 279416b64355SHong Zhang { 279516b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 27965c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 279716b64355SHong Zhang 279816b64355SHong Zhang PetscFunctionBegin; 27999566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28009566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 280116b64355SHong Zhang PetscFunctionReturn(0); 280216b64355SHong Zhang } 280316b64355SHong Zhang 280489a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 28052d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 28062d033e1fSHong Zhang { 28072d033e1fSHong Zhang PetscInt i; 28080fb991dcSHong Zhang Mat C; 28090fb991dcSHong Zhang Mat_SeqAIJ *c; 28100fb991dcSHong Zhang Mat_SubSppt *submatj; 28112d033e1fSHong Zhang 28122d033e1fSHong Zhang PetscFunctionBegin; 28132d033e1fSHong Zhang for (i=0; i<n; i++) { 28140fb991dcSHong Zhang C = (*mat)[i]; 28150fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 28160fb991dcSHong Zhang submatj = c->submatis1; 28172d033e1fSHong Zhang if (submatj) { 2818682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 281926cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 28209566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28219566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28229566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28239566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28249566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28259566063dSJacob Faibussowitsch 
PetscCall(PetscHeaderDestroy(&C)); 2826682e4c99SStefano Zampini } 28272d033e1fSHong Zhang } else { 28289566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28292d033e1fSHong Zhang } 28302d033e1fSHong Zhang } 283186e85357SHong Zhang 283263a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28339566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n,mat)); 283463a75b2aSHong Zhang 28359566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28362d033e1fSHong Zhang PetscFunctionReturn(0); 28372d033e1fSHong Zhang } 28382d033e1fSHong Zhang 28397dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2840cddf8d76SBarry Smith { 284197f1f81fSBarry Smith PetscInt i; 2842cddf8d76SBarry Smith 28433a40ed3dSBarry Smith PetscFunctionBegin; 2844cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 28459566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n+1,B)); 2846cddf8d76SBarry Smith } 2847cddf8d76SBarry Smith 2848cddf8d76SBarry Smith for (i=0; i<n; i++) { 28499566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i])); 2850cddf8d76SBarry Smith } 28513a40ed3dSBarry Smith PetscFunctionReturn(0); 2852cddf8d76SBarry Smith } 2853cddf8d76SBarry Smith 285497f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 28554dcbc457SBarry Smith { 2856e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28575d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 28585d0c19d7SBarry Smith const PetscInt *idx; 285997f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2860f1af5d2fSBarry Smith PetscBT table; 2861bbd702dbSSatish Balay 28623a40ed3dSBarry Smith PetscFunctionBegin; 2863d0f46423SBarry Smith m = A->rmap->n; 2864e4d965acSSatish Balay ai = a->i; 2865bfeeae90SHong Zhang aj = a->j; 28668a047759SSatish Balay 286708401ef6SPierre Jolivet PetscCheck(ov >= 
0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 286806763907SSatish Balay 28699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&nidx)); 28709566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m,&table)); 287106763907SSatish Balay 2872e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2873b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2874e4d965acSSatish Balay isz = 0; 28759566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m,table)); 2876e4d965acSSatish Balay 2877e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28789566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i],&idx)); 28799566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i],&n)); 2880e4d965acSSatish Balay 2881dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2882e4d965acSSatish Balay for (j=0; j<n; ++j) { 28832205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 28844dcbc457SBarry Smith } 28859566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i],&idx)); 28869566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2887e4d965acSSatish Balay 288804a348a9SBarry Smith k = 0; 288904a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 289004a348a9SBarry Smith n = isz; 289106763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2892e4d965acSSatish Balay row = nidx[k]; 2893e4d965acSSatish Balay start = ai[row]; 2894e4d965acSSatish Balay end = ai[row+1]; 289504a348a9SBarry Smith for (l = start; l<end; l++) { 2896efb16452SHong Zhang val = aj[l]; 28972205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2898e4d965acSSatish Balay } 2899e4d965acSSatish Balay } 2900e4d965acSSatish Balay } 29019566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i))); 2902e4d965acSSatish Balay } 
29039566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29049566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29053a40ed3dSBarry Smith PetscFunctionReturn(0); 29064dcbc457SBarry Smith } 290717ab2063SBarry Smith 29080513a670SBarry Smith /* -------------------------------------------------------------- */ 2909dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 29100513a670SBarry Smith { 29110513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29123b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 29135d0c19d7SBarry Smith const PetscInt *row,*col; 29145d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 291556cd22aeSBarry Smith IS icolp,irowp; 29160298fd71SBarry Smith PetscInt *cwork = NULL; 29170298fd71SBarry Smith PetscScalar *vwork = NULL; 29180513a670SBarry Smith 29193a40ed3dSBarry Smith PetscFunctionBegin; 29209566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp,PETSC_DECIDE,&irowp)); 29219566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp,&row)); 29229566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp,PETSC_DECIDE,&icolp)); 29239566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp,&col)); 29240513a670SBarry Smith 29250513a670SBarry Smith /* determine lengths of permuted rows */ 29269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&lens)); 29272205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 29289566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 29299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,m,n,m,n)); 29309566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 29319566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 29329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens)); 29339566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29340513a670SBarry Smith 29359566063dSJacob Faibussowitsch 
PetscCall(PetscMalloc1(n,&cnew)); 29360513a670SBarry Smith for (i=0; i<m; i++) { 29379566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29382205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 29399566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES)); 29409566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29410513a670SBarry Smith } 29429566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29432205254eSKarl Rupp 29443c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29452205254eSKarl Rupp 29468c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29479566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B,A->boundtocpu)); 29489fe5e383SStefano Zampini #endif 29499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 29509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 29519566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp,&row)); 29529566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp,&col)); 29539566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29549566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 29556768869dSprj- if (rowp == colp) { 29569566063dSJacob Faibussowitsch PetscCall(MatPropagateSymmetryOptions(A,*B)); 29576768869dSprj- } 29583a40ed3dSBarry Smith PetscFunctionReturn(0); 29590513a670SBarry Smith } 29600513a670SBarry Smith 2961dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2962cb5b572fSBarry Smith { 2963cb5b572fSBarry Smith PetscFunctionBegin; 296433f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 296533f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2966be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2967be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 29682e5835c6SStefano Zampini const PetscScalar *aa; 2969be6bf707SBarry Smith 29709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 297108401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n],PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT,a->i[A->rmap->n],b->i[B->rmap->n]); 29729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a,aa,a->i[A->rmap->n])); 29739566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 2975cb5b572fSBarry Smith } else { 29769566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A,B,str)); 2977cb5b572fSBarry Smith } 2978cb5b572fSBarry Smith PetscFunctionReturn(0); 2979cb5b572fSBarry Smith } 2980cb5b572fSBarry Smith 29814994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2982273d9f13SBarry Smith { 2983273d9f13SBarry Smith PetscFunctionBegin; 29849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,NULL)); 2985273d9f13SBarry Smith PetscFunctionReturn(0); 2986273d9f13SBarry Smith } 2987273d9f13SBarry Smith 2988f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 29896c0721eeSBarry Smith { 29906c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29916e111a19SKarl Rupp 29926c0721eeSBarry Smith PetscFunctionBegin; 29936c0721eeSBarry Smith *array = a->a; 29946c0721eeSBarry Smith PetscFunctionReturn(0); 29956c0721eeSBarry Smith } 29966c0721eeSBarry Smith 2997f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 29986c0721eeSBarry Smith { 
29996c0721eeSBarry Smith PetscFunctionBegin; 3000f38c1e66SStefano Zampini *array = NULL; 30016c0721eeSBarry Smith PetscFunctionReturn(0); 30026c0721eeSBarry Smith } 3003273d9f13SBarry Smith 30048229c054SShri Abhyankar /* 30058229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 30068229c054SShri Abhyankar have different nonzero structure. 30078229c054SShri Abhyankar */ 3008b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 3009ec7775f6SShri Abhyankar { 3010b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 3011ec7775f6SShri Abhyankar 3012ec7775f6SShri Abhyankar PetscFunctionBegin; 3013ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3014ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 3015b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 3016b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 3017b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 30188af7cee1SJed Brown nnz[i] = 0; 30198af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 3020b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3021b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 30228af7cee1SJed Brown nnz[i]++; 30238af7cee1SJed Brown } 30248af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 3025ec7775f6SShri Abhyankar } 3026ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3027ec7775f6SShri Abhyankar } 3028ec7775f6SShri Abhyankar 3029b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 3030b264fe52SHong Zhang { 3031b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3032b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 3033b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 3034b264fe52SHong Zhang 3035b264fe52SHong Zhang PetscFunctionBegin; 3036b264fe52SHong Zhang /* Set the number of nonzeros in the new 
matrix */ 30379566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz)); 3038b264fe52SHong Zhang PetscFunctionReturn(0); 3039b264fe52SHong Zhang } 3040b264fe52SHong Zhang 3041f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 3042ac90fabeSBarry Smith { 3043ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 3044ac90fabeSBarry Smith 3045ac90fabeSBarry Smith PetscFunctionBegin; 3046134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3047134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3048134adf20SPierre Jolivet if (e) { 30499566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i,y->i,Y->rmap->n+1,&e)); 305081fa06acSBarry Smith if (e) { 30519566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j,y->j,y->nz,&e)); 3052134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 305381fa06acSBarry Smith } 305481fa06acSBarry Smith } 305554c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"MatStructure is not SAME_NONZERO_PATTERN"); 305681fa06acSBarry Smith } 3057ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30582e5835c6SStefano Zampini const PetscScalar *xa; 30592e5835c6SStefano Zampini PetscScalar *ya,alpha = a; 306081fa06acSBarry Smith PetscBLASInt one = 1,bnz; 306181fa06acSBarry Smith 30629566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz,&bnz)); 30639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&ya)); 30649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X,&xa)); 3065792fecdfSBarry Smith PetscCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,xa,&one,ya,&one)); 30669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X,&xa)); 30679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&ya)); 30689566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(2.0*bnz)); 30699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30709566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3071ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30729566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y,a,X,str)); 3073ac90fabeSBarry Smith } else { 30748229c054SShri Abhyankar Mat B; 30758229c054SShri Abhyankar PetscInt *nnz; 30769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N,&nnz)); 30779566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y),&B)); 30789566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name)); 30799566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B,Y->rmap,Y->cmap)); 30809566063dSJacob Faibussowitsch PetscCall(MatSetType(B,((PetscObject)Y)->type_name)); 30819566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz)); 30829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B,0,nnz)); 30839566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 30849566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y,&B)); 30859bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30869566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3087ac90fabeSBarry Smith } 3088ac90fabeSBarry Smith PetscFunctionReturn(0); 3089ac90fabeSBarry Smith } 3090ac90fabeSBarry Smith 30912726fb6dSPierre Jolivet PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3092354c94deSBarry Smith { 3093354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3094354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3095354c94deSBarry Smith PetscInt i,nz; 3096354c94deSBarry Smith PetscScalar *a; 3097354c94deSBarry Smith 3098354c94deSBarry Smith PetscFunctionBegin; 3099354c94deSBarry Smith nz = aij->nz; 31009566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArray(mat,&a)); 31012205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 31029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat,&a)); 3103354c94deSBarry Smith #else 3104354c94deSBarry Smith PetscFunctionBegin; 3105354c94deSBarry Smith #endif 3106354c94deSBarry Smith PetscFunctionReturn(0); 3107354c94deSBarry Smith } 3108354c94deSBarry Smith 3109985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3110e34fafa9SBarry Smith { 3111e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3112d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3113e34fafa9SBarry Smith PetscReal atmp; 3114985db425SBarry Smith PetscScalar *x; 3115ce496241SStefano Zampini const MatScalar *aa,*av; 3116e34fafa9SBarry Smith 3117e34fafa9SBarry Smith PetscFunctionBegin; 311828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3120ce496241SStefano Zampini aa = av; 3121e34fafa9SBarry Smith ai = a->i; 3122e34fafa9SBarry Smith aj = a->j; 3123e34fafa9SBarry Smith 31249566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31259566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31269566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 312708401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3128e34fafa9SBarry Smith for (i=0; i<m; i++) { 3129e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 3130e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3131985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3132985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3133985db425SBarry Smith aa++; aj++; 3134985db425SBarry Smith } 3135985db425SBarry Smith } 31369566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 31379566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3138985db425SBarry Smith PetscFunctionReturn(0); 3139985db425SBarry Smith } 3140985db425SBarry Smith 3141985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3142985db425SBarry Smith { 3143985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3144d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3145985db425SBarry Smith PetscScalar *x; 3146ce496241SStefano Zampini const MatScalar *aa,*av; 3147985db425SBarry Smith 3148985db425SBarry Smith PetscFunctionBegin; 314928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3151ce496241SStefano Zampini aa = av; 3152985db425SBarry Smith ai = a->i; 3153985db425SBarry Smith aj = a->j; 3154985db425SBarry Smith 31559566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31569566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31579566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 315808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3159985db425SBarry Smith for (i=0; i<m; i++) { 3160985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3161d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3162985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3163985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3164985db425SBarry Smith x[i] = 0.0; 3165985db425SBarry Smith if (idx) { 3166985db425SBarry Smith for (j=0; j<ncols; j++) { /* find first implicit 0.0 in the row */ 3167985db425SBarry Smith if (aj[j] > j) { 3168985db425SBarry Smith idx[i] = j; 3169985db425SBarry Smith break; 3170985db425SBarry Smith } 3171985db425SBarry Smith } 31721a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 
31731a254869SHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3174985db425SBarry Smith } 3175985db425SBarry Smith } 3176985db425SBarry Smith for (j=0; j<ncols; j++) { 3177985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3178985db425SBarry Smith aa++; aj++; 3179985db425SBarry Smith } 3180985db425SBarry Smith } 31819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 31829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3183985db425SBarry Smith PetscFunctionReturn(0); 3184985db425SBarry Smith } 3185985db425SBarry Smith 3186c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3187c87e5d42SMatthew Knepley { 3188c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3189c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3190ce496241SStefano Zampini PetscScalar *x; 3191ce496241SStefano Zampini const MatScalar *aa,*av; 3192c87e5d42SMatthew Knepley 3193c87e5d42SMatthew Knepley PetscFunctionBegin; 31949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3195ce496241SStefano Zampini aa = av; 3196c87e5d42SMatthew Knepley ai = a->i; 3197c87e5d42SMatthew Knepley aj = a->j; 3198c87e5d42SMatthew Knepley 31999566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32009566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32019566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 320208401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3203c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3204c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3205f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 3206f07e67edSHong Zhang x[i] = *aa; if (idx) idx[i] = 0; 3207f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3208f07e67edSHong Zhang x[i] = 0.0; 3209f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3210289a08f5SMatthew Knepley for (j=0; j<ncols; j++) { 3211f07e67edSHong Zhang if (aj[j] > j) { 3212f07e67edSHong Zhang idx[i] = j; 32132205254eSKarl Rupp break; 32142205254eSKarl Rupp } 3215289a08f5SMatthew Knepley } 3216f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3217f07e67edSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3218f07e67edSHong Zhang } 3219289a08f5SMatthew Knepley } 3220c87e5d42SMatthew Knepley for (j=0; j<ncols; j++) { 3221f07e67edSHong Zhang if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3222c87e5d42SMatthew Knepley aa++; aj++; 3223c87e5d42SMatthew Knepley } 3224c87e5d42SMatthew Knepley } 32259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3227c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3228c87e5d42SMatthew Knepley } 3229c87e5d42SMatthew Knepley 3230985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3231985db425SBarry Smith { 3232985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3233d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3234d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3235985db425SBarry Smith PetscScalar *x; 3236ce496241SStefano Zampini const MatScalar *aa,*av; 3237985db425SBarry Smith 3238985db425SBarry Smith PetscFunctionBegin; 323928b400f6SJacob Faibussowitsch 
PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 32409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3241ce496241SStefano Zampini aa = av; 3242985db425SBarry Smith ai = a->i; 3243985db425SBarry Smith aj = a->j; 3244985db425SBarry Smith 32459566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32469566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32479566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 324808401ef6SPierre Jolivet PetscCheck(n == m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3249985db425SBarry Smith for (i=0; i<m; i++) { 3250985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3251d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3252985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3253985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3254985db425SBarry Smith x[i] = 0.0; 3255985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3256985db425SBarry Smith for (j=0; j<ncols; j++) { 3257985db425SBarry Smith if (aj[j] > j) { 3258985db425SBarry Smith idx[i] = j; 3259985db425SBarry Smith break; 3260985db425SBarry Smith } 3261985db425SBarry Smith } 3262fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3263fa213d2fSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3264985db425SBarry Smith } 3265985db425SBarry Smith } 3266985db425SBarry Smith for (j=0; j<ncols; j++) { 3267985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3268985db425SBarry Smith aa++; aj++; 3269e34fafa9SBarry Smith } 3270e34fafa9SBarry Smith } 32719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3273e34fafa9SBarry Smith PetscFunctionReturn(0); 3274e34fafa9SBarry Smith } 3275bbead8a2SBarry Smith 
3276713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3277bbead8a2SBarry Smith { 3278bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 327933d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3280bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 32810da83c2eSBarry Smith const PetscReal shift = 0.0; 32821a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3283bbead8a2SBarry Smith 3284bbead8a2SBarry Smith PetscFunctionBegin; 3285a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32864a0d0026SBarry Smith if (a->ibdiagvalid) { 32874a0d0026SBarry Smith if (values) *values = a->ibdiag; 32884a0d0026SBarry Smith PetscFunctionReturn(0); 32894a0d0026SBarry Smith } 32909566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 3291bbead8a2SBarry Smith if (!a->ibdiag) { 32929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2*mbs,&a->ibdiag)); 32939566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar))); 3294bbead8a2SBarry Smith } 3295bbead8a2SBarry Smith diag = a->ibdiag; 3296bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3297bbead8a2SBarry Smith /* factor and invert each block */ 3298bbead8a2SBarry Smith switch (bs) { 3299bbead8a2SBarry Smith case 1: 3300bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 33019566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,1,&i,1,&i,diag+i)); 3302ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3303ec1892c8SHong Zhang if (allowzeropivot) { 33047b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33057b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33067b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33079566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance 
%g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON)); 330898921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3309ec1892c8SHong Zhang } 3310bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3311bbead8a2SBarry Smith } 3312bbead8a2SBarry Smith break; 3313bbead8a2SBarry Smith case 2: 3314bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3315bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 33169566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,2,ij,2,ij,diag)); 33179566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 33187b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33199566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3320bbead8a2SBarry Smith diag += 4; 3321bbead8a2SBarry Smith } 3322bbead8a2SBarry Smith break; 3323bbead8a2SBarry Smith case 3: 3324bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3325bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 33269566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,3,ij,3,ij,diag)); 33279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 33287b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3330bbead8a2SBarry Smith diag += 9; 3331bbead8a2SBarry Smith } 3332bbead8a2SBarry Smith break; 3333bbead8a2SBarry Smith case 4: 3334bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3335bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 33369566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,4,ij,4,ij,diag)); 33379566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 33387b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3340bbead8a2SBarry Smith diag += 16; 3341bbead8a2SBarry Smith } 3342bbead8a2SBarry Smith break; 3343bbead8a2SBarry Smith case 5: 3344bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3345bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 33469566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,5,ij,5,ij,diag)); 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 33487b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3350bbead8a2SBarry Smith diag += 25; 3351bbead8a2SBarry Smith } 3352bbead8a2SBarry Smith break; 3353bbead8a2SBarry Smith case 6: 3354bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3355bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 33569566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,6,ij,6,ij,diag)); 33579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 33587b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3360bbead8a2SBarry Smith diag += 36; 3361bbead8a2SBarry Smith } 3362bbead8a2SBarry Smith break; 3363bbead8a2SBarry Smith case 7: 3364bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3365bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 33669566063dSJacob Faibussowitsch 
PetscCall(MatGetValues(A,7,ij,7,ij,diag)); 33679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 33687b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33699566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3370bbead8a2SBarry Smith diag += 49; 3371bbead8a2SBarry Smith } 3372bbead8a2SBarry Smith break; 3373bbead8a2SBarry Smith default: 33749566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ)); 3375bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3376bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3377bbead8a2SBarry Smith IJ[j] = bs*i + j; 3378bbead8a2SBarry Smith } 33799566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bs,IJ,bs,IJ,diag)); 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 33817b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bs)); 3383bbead8a2SBarry Smith diag += bs2; 3384bbead8a2SBarry Smith } 33859566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work,v_pivots,IJ)); 3386bbead8a2SBarry Smith } 3387bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3388bbead8a2SBarry Smith PetscFunctionReturn(0); 3389bbead8a2SBarry Smith } 3390bbead8a2SBarry Smith 339173a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 339273a71a0fSBarry Smith { 339373a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3394fff043a9SJunchao Zhang PetscScalar a,*aa; 339573a71a0fSBarry Smith PetscInt m,n,i,j,col; 339673a71a0fSBarry Smith 339773a71a0fSBarry Smith PetscFunctionBegin; 339873a71a0fSBarry Smith if (!x->assembled) { 33999566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 340073a71a0fSBarry Smith for (i=0; i<m; i++) { 340173a71a0fSBarry Smith for 
(j=0; j<aij->imax[i]; j++) { 34029566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 340373a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 34049566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 340573a71a0fSBarry Smith } 340673a71a0fSBarry Smith } 3407e2ce353bSJunchao Zhang } else { 34089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x,&aa)); 34099566063dSJacob Faibussowitsch for (i=0; i<aij->nz; i++) PetscCall(PetscRandomGetValue(rctx,aa+i)); 34109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x,&aa)); 3411e2ce353bSJunchao Zhang } 34129566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34139566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 341473a71a0fSBarry Smith PetscFunctionReturn(0); 341573a71a0fSBarry Smith } 341673a71a0fSBarry Smith 3417679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3418679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3419679944adSJunchao Zhang { 3420679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3421679944adSJunchao Zhang PetscScalar a; 3422679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3423679944adSJunchao Zhang 3424679944adSJunchao Zhang PetscFunctionBegin; 3425679944adSJunchao Zhang nskip = high - low; 34269566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 3427679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3428679944adSJunchao Zhang for (i=0; i<m; i++) { 3429679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 34309566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 3431679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3432679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34339566063dSJacob 
Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 3434679944adSJunchao Zhang } 3435e2ce353bSJunchao Zhang } 34369566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34379566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 3438679944adSJunchao Zhang PetscFunctionReturn(0); 3439679944adSJunchao Zhang } 3440679944adSJunchao Zhang 3441682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34420a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3443cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3444cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3445cb5b572fSBarry Smith MatMult_SeqAIJ, 344697304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34477c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34487c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3449f4259b30SLisandro Dalcin NULL, 3450f4259b30SLisandro Dalcin NULL, 3451f4259b30SLisandro Dalcin NULL, 3452f4259b30SLisandro Dalcin /* 10*/ NULL, 3453cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3454f4259b30SLisandro Dalcin NULL, 345541f059aeSBarry Smith MatSOR_SeqAIJ, 345691e9d3e2SHong Zhang MatTranspose_SeqAIJ, 345797304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3458cb5b572fSBarry Smith MatEqual_SeqAIJ, 3459cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3460cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3461cb5b572fSBarry Smith MatNorm_SeqAIJ, 3462f4259b30SLisandro Dalcin /* 20*/ NULL, 3463cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3464cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3465cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3466d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3467f4259b30SLisandro Dalcin NULL, 3468f4259b30SLisandro Dalcin NULL, 3469f4259b30SLisandro Dalcin NULL, 3470f4259b30SLisandro Dalcin NULL, 34714994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3472f4259b30SLisandro Dalcin NULL, 3473f4259b30SLisandro Dalcin NULL, 3474f4259b30SLisandro Dalcin NULL, 3475f4259b30SLisandro Dalcin NULL, 
3476d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3477f4259b30SLisandro Dalcin NULL, 3478f4259b30SLisandro Dalcin NULL, 3479cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3480f4259b30SLisandro Dalcin NULL, 3481d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 34827dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3483cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3484cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3485cb5b572fSBarry Smith MatCopy_SeqAIJ, 3486d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3487cb5b572fSBarry Smith MatScale_SeqAIJ, 34887d68702bSBarry Smith MatShift_SeqAIJ, 348979299369SBarry Smith MatDiagonalSet_SeqAIJ, 34906e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 349173a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 34923b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 34933b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 34943b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3495a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 349693dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3497f4259b30SLisandro Dalcin NULL, 3498f4259b30SLisandro Dalcin NULL, 3499cda55fadSBarry Smith MatPermute_SeqAIJ, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin /* 59*/ NULL, 3502b9b97703SBarry Smith MatDestroy_SeqAIJ, 3503b9b97703SBarry Smith MatView_SeqAIJ, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 3506f4259b30SLisandro Dalcin /* 64*/ NULL, 3507321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3512c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 3516f4259b30SLisandro Dalcin /* 74*/ NULL, 35173acb8795SBarry Smith MatFDColoringApply_AIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520f4259b30SLisandro Dalcin NULL, 
35216ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523f4259b30SLisandro Dalcin NULL, 3524f4259b30SLisandro Dalcin NULL, 3525bc011b1eSHong Zhang MatLoad_SeqAIJ, 3526d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35271cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3528f4259b30SLisandro Dalcin NULL, 3529f4259b30SLisandro Dalcin NULL, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin /* 89*/ NULL, 3532f4259b30SLisandro Dalcin NULL, 353326be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 35368fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3537f4259b30SLisandro Dalcin NULL, 3538f4259b30SLisandro Dalcin NULL, 35396fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3540f4259b30SLisandro Dalcin NULL, 35414222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3542f4259b30SLisandro Dalcin NULL, 3543f4259b30SLisandro Dalcin NULL, 354487d4246cSBarry Smith MatConjugate_SeqAIJ, 3545f4259b30SLisandro Dalcin NULL, 3546d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 354799cafbc1SBarry Smith MatRealPart_SeqAIJ, 3548f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3552f4259b30SLisandro Dalcin NULL, 35532af78befSBarry Smith MatGetRowMin_SeqAIJ, 3554f4259b30SLisandro Dalcin NULL, 3555599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3556f4259b30SLisandro Dalcin /*114*/ NULL, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin /*119*/ NULL, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 3565b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35660716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3567a873a8cdSSam Reynolds 
MatGetColumnReductions_SeqAIJ, 356837868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35690da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3570f4259b30SLisandro Dalcin NULL, 3571f4259b30SLisandro Dalcin /*129*/ NULL, 3572f4259b30SLisandro Dalcin NULL, 3573f4259b30SLisandro Dalcin NULL, 357475648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3575b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3576b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35772b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3578f4259b30SLisandro Dalcin NULL, 3579f4259b30SLisandro Dalcin NULL, 35803964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3581f4259b30SLisandro Dalcin /*139*/NULL, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 35843a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 35859c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 35864222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35874222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 358972833a62Smarkadams4 NULL, 359072833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 35917fb60732SBarry Smith MatFilter_AIJ, 35927fb60732SBarry Smith /*150*/MatTransposeSymbolic_SeqAIJ 35939e29f15eSvictorle }; 359417ab2063SBarry Smith 35957087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3596bef8e0ddSBarry Smith { 3597bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 359897f1f81fSBarry Smith PetscInt i,nz,n; 3599bef8e0ddSBarry Smith 3600bef8e0ddSBarry Smith PetscFunctionBegin; 3601bef8e0ddSBarry Smith nz = aij->maxnz; 3602d0f46423SBarry Smith n = mat->rmap->n; 3603bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3604bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3605bef8e0ddSBarry Smith } 3606bef8e0ddSBarry Smith aij->nz = nz; 3607bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3608bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3609bef8e0ddSBarry Smith } 
3610bef8e0ddSBarry Smith PetscFunctionReturn(0); 3611bef8e0ddSBarry Smith } 3612bef8e0ddSBarry Smith 3613a3bb6f32SFande Kong /* 3614ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3615ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3616ddea5d60SJunchao Zhang */ 3617a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3618a3bb6f32SFande Kong { 3619a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3620a3bb6f32SFande Kong PetscTable gid1_lid1; 3621a3bb6f32SFande Kong PetscTablePosition tpos; 362225b670f0SStefano Zampini PetscInt gid,lid,i,ec,nz = aij->nz; 362325b670f0SStefano Zampini PetscInt *garray,*jj = aij->j; 3624a3bb6f32SFande Kong 3625a3bb6f32SFande Kong PetscFunctionBegin; 3626a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3627a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3628a3bb6f32SFande Kong /* use a table */ 36299566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1)); 3630a3bb6f32SFande Kong ec = 0; 363125b670f0SStefano Zampini for (i=0; i<nz; i++) { 363225b670f0SStefano Zampini PetscInt data,gid1 = jj[i] + 1; 36339566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&data)); 3634a3bb6f32SFande Kong if (!data) { 3635a3bb6f32SFande Kong /* one based table */ 36369566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES)); 3637a3bb6f32SFande Kong } 3638a3bb6f32SFande Kong } 3639a3bb6f32SFande Kong /* form array of columns we need */ 36409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec,&garray)); 36419566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1,&tpos)); 3642a3bb6f32SFande Kong while (tpos) { 36439566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid)); 
3644a3bb6f32SFande Kong gid--; 3645a3bb6f32SFande Kong lid--; 3646a3bb6f32SFande Kong garray[lid] = gid; 3647a3bb6f32SFande Kong } 36489566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec,garray)); /* sort, and rebuild */ 36499566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 3650a3bb6f32SFande Kong for (i=0; i<ec; i++) { 36519566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES)); 3652a3bb6f32SFande Kong } 3653a3bb6f32SFande Kong /* compact out the extra columns in B */ 365425b670f0SStefano Zampini for (i=0; i<nz; i++) { 365525b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36569566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&lid)); 3657a3bb6f32SFande Kong lid--; 365825b670f0SStefano Zampini jj[i] = lid; 3659a3bb6f32SFande Kong } 36609566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36619566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36629566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap)); 36639566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping)); 36649566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH)); 3665a3bb6f32SFande Kong PetscFunctionReturn(0); 3666a3bb6f32SFande Kong } 3667a3bb6f32SFande Kong 3668bef8e0ddSBarry Smith /*@ 3669bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3670bef8e0ddSBarry Smith in the matrix. 
3671bef8e0ddSBarry Smith 3672bef8e0ddSBarry Smith Input Parameters: 3673bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3674bef8e0ddSBarry Smith - indices - the column indices 3675bef8e0ddSBarry Smith 367615091d37SBarry Smith Level: advanced 367715091d37SBarry Smith 3678bef8e0ddSBarry Smith Notes: 3679bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3680bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3681bef8e0ddSBarry Smith of the MatSetValues() operation. 3682bef8e0ddSBarry Smith 3683bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3684d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3685bef8e0ddSBarry Smith 3686bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3687bef8e0ddSBarry Smith 3688b9617806SBarry Smith The indices should start with zero, not one. 3689b9617806SBarry Smith 3690bef8e0ddSBarry Smith @*/ 36917087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3692bef8e0ddSBarry Smith { 3693bef8e0ddSBarry Smith PetscFunctionBegin; 36940700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3695dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices,2); 3696cac4c232SBarry Smith PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices)); 3697bef8e0ddSBarry Smith PetscFunctionReturn(0); 3698bef8e0ddSBarry Smith } 3699bef8e0ddSBarry Smith 3700be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3701be6bf707SBarry Smith 37027087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3703be6bf707SBarry Smith { 3704be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3705d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3706be6bf707SBarry Smith 3707be6bf707SBarry Smith PetscFunctionBegin; 370828b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3709be6bf707SBarry Smith 3710be6bf707SBarry Smith /* allocate space for values if not already there */ 3711be6bf707SBarry Smith if (!aij->saved_values) { 37129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&aij->saved_values)); 37139566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar))); 3714be6bf707SBarry Smith } 3715be6bf707SBarry Smith 3716be6bf707SBarry Smith /* copy values over */ 37179566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values,aij->a,nz)); 3718be6bf707SBarry Smith PetscFunctionReturn(0); 3719be6bf707SBarry Smith } 3720be6bf707SBarry Smith 3721be6bf707SBarry Smith /*@ 3722be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3723be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3724be6bf707SBarry Smith nonlinear portion. 3725be6bf707SBarry Smith 3726be6bf707SBarry Smith Collect on Mat 3727be6bf707SBarry Smith 3728be6bf707SBarry Smith Input Parameters: 37290e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3730be6bf707SBarry Smith 373115091d37SBarry Smith Level: advanced 373215091d37SBarry Smith 3733be6bf707SBarry Smith Common Usage, with SNESSolve(): 3734be6bf707SBarry Smith $ Create Jacobian matrix 3735be6bf707SBarry Smith $ Set linear terms into matrix 3736be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3737be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3738be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure) 3739512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3740be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3741be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3742be6bf707SBarry Smith $ In your Jacobian routine 3743be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3744be6bf707SBarry Smith $ Set nonlinear terms in matrix 3745be6bf707SBarry Smith 3746be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle the nonlinear solve yourself: 3747be6bf707SBarry Smith $ // build linear portion of Jacobian 3748512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3749be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3750be6bf707SBarry Smith $ loop over nonlinear iterations 3751be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3752be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3753be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3754be6bf707SBarry Smith $ Solve linear system with Jacobian 3755be6bf707SBarry Smith $ endloop 3756be6bf707SBarry Smith 3757be6bf707SBarry Smith Notes: 3758be6bf707SBarry Smith Matrix must already be assembled before calling this routine 3759512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3760be6bf707SBarry Smith calling this routine. 37610c468ba9SBarry Smith 37620c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37630c468ba9SBarry Smith and does not allocate additional space. 
37640c468ba9SBarry Smith 3765db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3766be6bf707SBarry Smith 3767be6bf707SBarry Smith @*/ 37687087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3769be6bf707SBarry Smith { 3770be6bf707SBarry Smith PetscFunctionBegin; 37710700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 377228b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 377328b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3774cac4c232SBarry Smith PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat)); 3775be6bf707SBarry Smith PetscFunctionReturn(0); 3776be6bf707SBarry Smith } 3777be6bf707SBarry Smith 37787087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3779be6bf707SBarry Smith { 3780be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3781d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3782be6bf707SBarry Smith 3783be6bf707SBarry Smith PetscFunctionBegin; 378428b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 378528b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3786be6bf707SBarry Smith /* copy values over */ 37879566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a,aij->saved_values,nz)); 3788be6bf707SBarry Smith PetscFunctionReturn(0); 3789be6bf707SBarry Smith } 3790be6bf707SBarry Smith 3791be6bf707SBarry Smith /*@ 3792be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3793be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3794be6bf707SBarry Smith nonlinear portion. 
3795be6bf707SBarry Smith 3796be6bf707SBarry Smith Collect on Mat 3797be6bf707SBarry Smith 3798be6bf707SBarry Smith Input Parameters: 3799386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3800be6bf707SBarry Smith 380115091d37SBarry Smith Level: advanced 380215091d37SBarry Smith 3803db781477SPatrick Sanan .seealso: `MatStoreValues()` 3804be6bf707SBarry Smith 3805be6bf707SBarry Smith @*/ 38067087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3807be6bf707SBarry Smith { 3808be6bf707SBarry Smith PetscFunctionBegin; 38090700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 381028b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 381128b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3812cac4c232SBarry Smith PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat)); 3813be6bf707SBarry Smith PetscFunctionReturn(0); 3814be6bf707SBarry Smith } 3815be6bf707SBarry Smith 3816be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 381717ab2063SBarry Smith /*@C 3818682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 38190d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38206e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 382151c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38222bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 382317ab2063SBarry Smith 3824d083f849SBarry Smith Collective 3825db81eaa0SLois Curfman McInnes 382617ab2063SBarry Smith Input Parameters: 3827db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 382817ab2063SBarry Smith . 
m - number of rows 382917ab2063SBarry Smith . n - number of columns 383017ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 383151c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38320298fd71SBarry Smith (possibly different for each row) or NULL 383317ab2063SBarry Smith 383417ab2063SBarry Smith Output Parameter: 3835416022c9SBarry Smith . A - the matrix 383617ab2063SBarry Smith 3837175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3838f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3839175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3840175b88e8SBarry Smith 3841b259b22eSLois Curfman McInnes Notes: 384249a6f317SBarry Smith If nnz is given then nz is ignored 384349a6f317SBarry Smith 384417ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 384517ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 38460002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 384744cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 384817ab2063SBarry Smith 384917ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38500298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 38513d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38526da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 385317ab2063SBarry Smith 3854682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38554fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3856682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38576c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38586c7ebb05SLois Curfman McInnes 38596c7ebb05SLois Curfman McInnes Options Database Keys: 3860698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38619db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 386217ab2063SBarry Smith 3863027ccd11SLois Curfman McInnes Level: intermediate 3864027ccd11SLois Curfman McInnes 3865db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 386636db0b34SBarry Smith 386717ab2063SBarry Smith @*/ 38687087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 386917ab2063SBarry Smith { 38703a40ed3dSBarry Smith PetscFunctionBegin; 38719566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,A)); 38729566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A,m,n,m,n)); 38739566063dSJacob Faibussowitsch PetscCall(MatSetType(*A,MATSEQAIJ)); 38749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz)); 3875273d9f13SBarry Smith PetscFunctionReturn(0); 3876273d9f13SBarry Smith } 3877273d9f13SBarry Smith 3878273d9f13SBarry Smith /*@C 3879273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3880273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3881273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3882273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3883273d9f13SBarry Smith 3884d083f849SBarry Smith Collective 3885273d9f13SBarry Smith 3886273d9f13SBarry Smith Input Parameters: 38871c4f3114SJed Brown + B - The matrix 3888273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3889273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38900298fd71SBarry Smith (possibly different for each row) or NULL 3891273d9f13SBarry Smith 3892273d9f13SBarry Smith Notes: 389349a6f317SBarry Smith If nnz is given then nz is ignored 389449a6f317SBarry Smith 3895273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3896273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3897273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3898273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3899273d9f13SBarry Smith 3900273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 39010298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3902273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3903273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3904273d9f13SBarry Smith 3905aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3906aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3907aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3908aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3909aa95bbe8SBarry Smith 3910a96a251dSBarry Smith Developers: Pass nz = MAT_SKIP_ALLOCATION to skip allocating any space for the matrix 3911a96a251dSBarry Smith entries or column indices 3912a96a251dSBarry Smith 3913273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3914273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves.
We 3915273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3916273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3917273d9f13SBarry Smith 3918273d9f13SBarry Smith Options Database Keys: 3919698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 392047b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3921273d9f13SBarry Smith 3922273d9f13SBarry Smith Level: intermediate 3923273d9f13SBarry Smith 3924db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3925db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3926273d9f13SBarry Smith 3927273d9f13SBarry Smith @*/ 39287087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3929273d9f13SBarry Smith { 3930a23d5eceSKris Buschelman PetscFunctionBegin; 39316ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 39326ba663aaSJed Brown PetscValidType(B,1); 3933cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz)); 3934a23d5eceSKris Buschelman PetscFunctionReturn(0); 3935a23d5eceSKris Buschelman } 3936a23d5eceSKris Buschelman 39377087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3938a23d5eceSKris Buschelman { 3939273d9f13SBarry Smith Mat_SeqAIJ *b; 39402576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 394197f1f81fSBarry Smith PetscInt i; 3942273d9f13SBarry Smith 3943273d9f13SBarry Smith PetscFunctionBegin; 39442576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3945a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3946c461c341SBarry Smith skipallocation = PETSC_TRUE; 3947c461c341SBarry Smith nz = 0; 3948c461c341SBarry Smith } 39499566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 
39509566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3951899cda47SBarry Smith 3952435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 395308401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %" PetscInt_FMT,nz); 3954cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3955d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 395608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT,i,nnz[i]); 395708401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT,i,nnz[i],B->cmap->n); 3958b73539f3SBarry Smith } 3959b73539f3SBarry Smith } 3960b73539f3SBarry Smith 3961273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39622205254eSKarl Rupp 3963273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3964273d9f13SBarry Smith 3965ab93d7beSBarry Smith if (!skipallocation) { 39662ee49352SLisandro Dalcin if (!b->imax) { 39679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->imax)); 39689566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 3969071fcb05SBarry Smith } 3970071fcb05SBarry Smith if (!b->ilen) { 3971071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39729566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n,&b->ilen)); 39739566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 3974071fcb05SBarry Smith } else { 39759566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt))); 39762ee49352SLisandro Dalcin } 3977846b4da1SFande Kong if (!b->ipre) { 39789566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->ipre)); 39799566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 3980846b4da1SFande Kong } 3981273d9f13SBarry Smith if (!nnz) { 3982435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3983c62bd62aSJed Brown else if (nz < 0) nz = 1; 39845d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 3985d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3986d0f46423SBarry Smith nz = nz*B->rmap->n; 3987273d9f13SBarry Smith } else { 3988c73702f5SBarry Smith PetscInt64 nz64 = 0; 3989c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 39909566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64,&nz)); 3991273d9f13SBarry Smith } 3992ab93d7beSBarry Smith 3993273d9f13SBarry Smith /* allocate the matrix space */ 399453dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39959566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i)); 3996396832f4SHong Zhang if (B->structure_only) { 39979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&b->j)); 39989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n+1,&b->i)); 39999566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt))); 4000396832f4SHong Zhang } else { 40019566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i)); 40029566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)))); 4003396832f4SHong Zhang } 4004bfeeae90SHong Zhang b->i[0] = 0; 4005d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 40065da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 40075da197adSKris Buschelman } 4008396832f4SHong Zhang if (B->structure_only) { 4009396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4010396832f4SHong Zhang b->free_a = PETSC_FALSE; 4011396832f4SHong Zhang } else { 4012273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4013e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4014396832f4SHong Zhang } 4015e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4016c461c341SBarry Smith } else { 4017e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4018e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4019c461c341SBarry Smith } 4020273d9f13SBarry Smith 4021846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4022846b4da1SFande Kong /* reserve user-requested sparsity */ 40239566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre,b->imax,B->rmap->n)); 4024846b4da1SFande Kong } 4025846b4da1SFande Kong 4026273d9f13SBarry Smith b->nz = 0; 4027273d9f13SBarry Smith b->maxnz = nz; 4028273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40291baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE)); 
4030cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4031cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40325519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40335519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40345519a089SJose E. Roman */ 40355519a089SJose E. Roman B->nonzerostate++; 4036273d9f13SBarry Smith PetscFunctionReturn(0); 4037273d9f13SBarry Smith } 4038273d9f13SBarry Smith 4039846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4040846b4da1SFande Kong { 4041846b4da1SFande Kong Mat_SeqAIJ *a; 4042a5bbaf83SFande Kong PetscInt i; 4043846b4da1SFande Kong 4044846b4da1SFande Kong PetscFunctionBegin; 4045846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 404614d0e64fSAlex Lindsay 404714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 404814d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 404914d0e64fSAlex Lindsay 4050846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 40512c814fdeSFande Kong /* if no saved info, we error out */ 405228b400f6SJacob Faibussowitsch PetscCheck(a->ipre,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info "); 40532c814fdeSFande Kong 4054aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation "); 40552c814fdeSFande Kong 40569566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax,a->ipre,A->rmap->n)); 40579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen,A->rmap->n)); 4058846b4da1SFande Kong a->i[0] = 0; 4059846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4060846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4061846b4da1SFande Kong } 4062846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4063846b4da1SFande Kong a->nz = 0; 4064846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4065846b4da1SFande Kong A->info.nz_unneeded = 
(double)a->maxnz; 4066846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4067846b4da1SFande Kong A->assembled = PETSC_FALSE; 4068846b4da1SFande Kong PetscFunctionReturn(0); 4069846b4da1SFande Kong } 4070846b4da1SFande Kong 407158d36128SBarry Smith /*@ 4072a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4073a1661176SMatthew Knepley 4074a1661176SMatthew Knepley Input Parameters: 4075a1661176SMatthew Knepley + B - the matrix 4076a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4077a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4078a1661176SMatthew Knepley - v - optional values in the matrix 4079a1661176SMatthew Knepley 4080a1661176SMatthew Knepley Level: developer 4081a1661176SMatthew Knepley 40826a9b8d82SBarry Smith Notes: 408358d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 408458d36128SBarry Smith 40856a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40866a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40876a9b8d82SBarry Smith 40886a9b8d82SBarry Smith Developer Notes: 40896a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 40906a9b8d82SBarry Smith then just copies the v values directly with PetscMemcpy(). 40916a9b8d82SBarry Smith 40926a9b8d82SBarry Smith This routine could also take a PetscCopyMode argument to allow sharing the values instead of always copying them. 
40936a9b8d82SBarry Smith 4094db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4095a1661176SMatthew Knepley @*/ 4096a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4097a1661176SMatthew Knepley { 4098a1661176SMatthew Knepley PetscFunctionBegin; 40990700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 41006ba663aaSJed Brown PetscValidType(B,1); 4101cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v)); 4102a1661176SMatthew Knepley PetscFunctionReturn(0); 4103a1661176SMatthew Knepley } 4104a1661176SMatthew Knepley 41057087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4106a1661176SMatthew Knepley { 4107a1661176SMatthew Knepley PetscInt i; 4108a1661176SMatthew Knepley PetscInt m,n; 4109a1661176SMatthew Knepley PetscInt nz; 41106a9b8d82SBarry Smith PetscInt *nnz; 4111a1661176SMatthew Knepley 4112a1661176SMatthew Knepley PetscFunctionBegin; 4113aed4548fSBarry Smith PetscCheck(Ii[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4114779a8d59SSatish Balay 41159566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41169566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4117779a8d59SSatish Balay 41189566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1, &nnz)); 4120a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4121b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 412208401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 
4123a1661176SMatthew Knepley nnz[i] = nz; 4124a1661176SMatthew Knepley } 41259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41269566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4127a1661176SMatthew Knepley 4128a1661176SMatthew Knepley for (i = 0; i < m; i++) { 41299566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4130a1661176SMatthew Knepley } 4131a1661176SMatthew Knepley 41329566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 41339566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 4134a1661176SMatthew Knepley 41359566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE)); 4136a1661176SMatthew Knepley PetscFunctionReturn(0); 4137a1661176SMatthew Knepley } 4138a1661176SMatthew Knepley 4139ad7e164aSPierre Jolivet /*@ 4140ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4141ad7e164aSPierre Jolivet 4142ad7e164aSPierre Jolivet Input Parameters: 4143ad7e164aSPierre Jolivet + A - left-hand side matrix 4144ad7e164aSPierre Jolivet . B - right-hand side matrix 4145ad7e164aSPierre Jolivet - reuse - either MAT_INITIAL_MATRIX or MAT_REUSE_MATRIX 4146ad7e164aSPierre Jolivet 4147ad7e164aSPierre Jolivet Output Parameter: 4148ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4149ad7e164aSPierre Jolivet 4150ad7e164aSPierre Jolivet Level: intermediate 4151ad7e164aSPierre Jolivet 4152ad7e164aSPierre Jolivet Notes: 4153ad7e164aSPierre Jolivet MAT_REUSE_MATRIX can only be used when the nonzero structure of the product matrix has not changed from that last call to MatSeqAIJKron(). 
4154ad7e164aSPierre Jolivet 4155db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4156ad7e164aSPierre Jolivet @*/ 4157ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron(Mat A,Mat B,MatReuse reuse,Mat *C) 4158ad7e164aSPierre Jolivet { 4159ad7e164aSPierre Jolivet PetscFunctionBegin; 4160ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A,MAT_CLASSID,1); 4161ad7e164aSPierre Jolivet PetscValidType(A,1); 4162ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B,MAT_CLASSID,2); 4163ad7e164aSPierre Jolivet PetscValidType(B,2); 4164ad7e164aSPierre Jolivet PetscValidPointer(C,4); 4165ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4166ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C,MAT_CLASSID,4); 4167ad7e164aSPierre Jolivet PetscValidType(*C,4); 4168ad7e164aSPierre Jolivet } 4169cac4c232SBarry Smith PetscTryMethod(A,"MatSeqAIJKron_C",(Mat,Mat,MatReuse,Mat*),(A,B,reuse,C)); 4170ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4171ad7e164aSPierre Jolivet } 4172ad7e164aSPierre Jolivet 4173ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A,Mat B,MatReuse reuse,Mat *C) 4174ad7e164aSPierre Jolivet { 4175ad7e164aSPierre Jolivet Mat newmat; 4176ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4177ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 4178ad7e164aSPierre Jolivet PetscScalar *v; 4179fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 4180ad7e164aSPierre Jolivet PetscInt *i,*j,m,n,p,q,nnz = 0,am = A->rmap->n,bm = B->rmap->n,an = A->cmap->n, bn = B->cmap->n; 4181ad7e164aSPierre Jolivet PetscBool flg; 4182ad7e164aSPierre Jolivet 4183ad7e164aSPierre Jolivet PetscFunctionBegin; 418428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 418528b400f6SJacob Faibussowitsch PetscCheck(A->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 418628b400f6SJacob Faibussowitsch 
PetscCheck(!B->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 418728b400f6SJacob Faibussowitsch PetscCheck(B->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 41889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&flg)); 418928b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatType %s",((PetscObject)B)->type_name); 4190aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatReuse %d",(int)reuse); 4191ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41929566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am*bm+1,&i,a->i[am]*b->i[bm],&j)); 41939566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF,&newmat)); 41949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat,am*bm,an*bn,am*bm,an*bn)); 41959566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat,MATAIJ)); 4196ad7e164aSPierre Jolivet i[0] = 0; 4197ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4198ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4199ad7e164aSPierre Jolivet i[m*bm + p + 1] = i[m*bm + p] + (a->i[m+1] - a->i[m]) * (b->i[p+1] - b->i[p]); 4200ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4201ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4202ad7e164aSPierre Jolivet j[nnz++] = a->j[n]*bn + b->j[q]; 4203ad7e164aSPierre Jolivet } 4204ad7e164aSPierre Jolivet } 4205ad7e164aSPierre Jolivet } 4206ad7e164aSPierre Jolivet } 42079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat,i,j,NULL)); 4208ad7e164aSPierre Jolivet *C = newmat; 42099566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4210ad7e164aSPierre Jolivet nnz = 0; 4211ad7e164aSPierre Jolivet } 42129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C,&v)); 42139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 42149566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 4215ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4216ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4217ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4218ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4219fff043a9SJunchao Zhang v[nnz++] = aa[n] * ba[q]; 4220ad7e164aSPierre Jolivet } 4221ad7e164aSPierre Jolivet } 4222ad7e164aSPierre Jolivet } 4223ad7e164aSPierre Jolivet } 42249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C,&v)); 42259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 42269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 4227ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4228ad7e164aSPierre Jolivet } 4229ad7e164aSPierre Jolivet 4230c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4231af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4232170fe5c8SBarry Smith 4233170fe5c8SBarry Smith /* 4234170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4235170fe5c8SBarry Smith 4236170fe5c8SBarry Smith n p p 42372da392ccSBarry Smith [ ] [ ] [ ] 42382da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42392da392ccSBarry Smith [ ] [ ] [ ] 4240170fe5c8SBarry Smith 4241170fe5c8SBarry Smith */ 4242170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4243170fe5c8SBarry Smith { 4244170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4245170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4246170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 424786214ceeSStefano Zampini PetscInt i,j,n,m,q,p; 4248170fe5c8SBarry Smith const PetscInt *ii,*idx; 4249170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4250170fe5c8SBarry Smith PetscScalar *c,*c_q; 425186214ceeSStefano Zampini PetscInt clda = sub_c->lda; 425286214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4253170fe5c8SBarry 
Smith 4254170fe5c8SBarry Smith PetscFunctionBegin; 4255d0f46423SBarry Smith m = A->rmap->n; 4256d0f46423SBarry Smith n = A->cmap->n; 4257d0f46423SBarry Smith p = B->cmap->n; 4258170fe5c8SBarry Smith a = sub_a->v; 4259170fe5c8SBarry Smith b = sub_b->a; 4260170fe5c8SBarry Smith c = sub_c->v; 426186214ceeSStefano Zampini if (clda == m) { 42629566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c,m*p)); 426386214ceeSStefano Zampini } else { 426486214ceeSStefano Zampini for (j=0;j<p;j++) 426586214ceeSStefano Zampini for (i=0;i<m;i++) 426686214ceeSStefano Zampini c[j*clda + i] = 0.0; 426786214ceeSStefano Zampini } 4268170fe5c8SBarry Smith ii = sub_b->i; 4269170fe5c8SBarry Smith idx = sub_b->j; 4270170fe5c8SBarry Smith for (i=0; i<n; i++) { 4271170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4272170fe5c8SBarry Smith while (q-->0) { 427386214ceeSStefano Zampini c_q = c + clda*(*idx); 427486214ceeSStefano Zampini a_q = a + alda*i; 4275854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4276170fe5c8SBarry Smith idx++; 4277170fe5c8SBarry Smith b++; 4278170fe5c8SBarry Smith } 4279170fe5c8SBarry Smith } 4280170fe5c8SBarry Smith PetscFunctionReturn(0); 4281170fe5c8SBarry Smith } 4282170fe5c8SBarry Smith 42834222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4284170fe5c8SBarry Smith { 4285d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 428686214ceeSStefano Zampini PetscBool cisdense; 4287170fe5c8SBarry Smith 4288170fe5c8SBarry Smith PetscFunctionBegin; 428908401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT,A->cmap->n,B->rmap->n); 42909566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,m,n,m,n)); 42919566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C,A,B)); 42929566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"")); 429386214ceeSStefano 
Zampini if (!cisdense) { 42949566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATDENSE)); 429586214ceeSStefano Zampini } 42969566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4297d73949e8SHong Zhang 42984222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4299170fe5c8SBarry Smith PetscFunctionReturn(0); 4300170fe5c8SBarry Smith } 4301170fe5c8SBarry Smith 4302170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 43030bad9183SKris Buschelman /*MC 4304fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43050bad9183SKris Buschelman based on compressed sparse row format. 43060bad9183SKris Buschelman 43070bad9183SKris Buschelman Options Database Keys: 43080bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43090bad9183SKris Buschelman 43100bad9183SKris Buschelman Level: beginner 43110bad9183SKris Buschelman 43120cd7f59aSBarry Smith Notes: 43130cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 43140cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43150cd7f59aSBarry Smith in the matrix 43160cd7f59aSBarry Smith 43170cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. 
    In this case no
    space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored

   Developer Notes:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to MATSEQAIJ when constructed with a single process communicator,
   and MATMPIAIJ otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions()

  Developer Notes:
    Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, and MATAIJCRL. The type also automatically switches over to using inodes when
   enough exist.
4341ccd284c7SBarry Smith 4342ccd284c7SBarry Smith Level: beginner 4343ccd284c7SBarry Smith 4344db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4345ccd284c7SBarry Smith M*/ 4346ccd284c7SBarry Smith 4347ccd284c7SBarry Smith /*MC 4348ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4349ccd284c7SBarry Smith 4350ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4351ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4352ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4353ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4354ccd284c7SBarry Smith the above preallocation routines for simplicity. 4355ccd284c7SBarry Smith 4356ccd284c7SBarry Smith Options Database Keys: 4357ccd284c7SBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4358ccd284c7SBarry Smith 4359ccd284c7SBarry Smith Level: beginner 4360ccd284c7SBarry Smith 4361c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4362ccd284c7SBarry Smith M*/ 4363ccd284c7SBarry Smith 43647906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 43657906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43667906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 43677906f579SHong Zhang #endif 4368d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4369d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*); 4370d24d4204SJose E. 
Roman #endif 43717906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43727906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 43737906f579SHong Zhang #endif 43747906f579SHong Zhang 4375d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4376c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 43774222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43787906f579SHong Zhang 43798c778c55SBarry Smith /*@C 43808f1ea47aSStefano Zampini MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored 43818c778c55SBarry Smith 43828c778c55SBarry Smith Not Collective 43838c778c55SBarry Smith 43848c778c55SBarry Smith Input Parameter: 4385579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 43868c778c55SBarry Smith 43878c778c55SBarry Smith Output Parameter: 43888c778c55SBarry Smith . array - pointer to the data 43898c778c55SBarry Smith 43908c778c55SBarry Smith Level: intermediate 43918c778c55SBarry Smith 4392db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43938c778c55SBarry Smith @*/ 43948c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 43958c778c55SBarry Smith { 4396d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 43978c778c55SBarry Smith 43988c778c55SBarry Smith PetscFunctionBegin; 4399d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44009566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A,array)); 4401d67d9f35SJunchao Zhang } else { 4402d67d9f35SJunchao Zhang *array = aij->a; 4403d67d9f35SJunchao Zhang } 4404d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4405d67d9f35SJunchao Zhang } 4406d67d9f35SJunchao Zhang 4407d67d9f35SJunchao Zhang /*@C 4408d67d9f35SJunchao Zhang MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by 
MatSeqAIJGetArray() 4409d67d9f35SJunchao Zhang 4410d67d9f35SJunchao Zhang Not Collective 4411d67d9f35SJunchao Zhang 4412d67d9f35SJunchao Zhang Input Parameters: 4413d67d9f35SJunchao Zhang + mat - a MATSEQAIJ matrix 4414d67d9f35SJunchao Zhang - array - pointer to the data 4415d67d9f35SJunchao Zhang 4416d67d9f35SJunchao Zhang Level: intermediate 4417d67d9f35SJunchao Zhang 4418db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4419d67d9f35SJunchao Zhang @*/ 4420d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 4421d67d9f35SJunchao Zhang { 4422d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4423d67d9f35SJunchao Zhang 4424d67d9f35SJunchao Zhang PetscFunctionBegin; 4425d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44269566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A,array)); 4427d67d9f35SJunchao Zhang } else { 4428d67d9f35SJunchao Zhang *array = NULL; 4429d67d9f35SJunchao Zhang } 44309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44319566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44328c778c55SBarry Smith PetscFunctionReturn(0); 44338c778c55SBarry Smith } 44348c778c55SBarry Smith 443521e72a00SBarry Smith /*@C 44368f1ea47aSStefano Zampini MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored 44378f1ea47aSStefano Zampini 44388f1ea47aSStefano Zampini Not Collective 44398f1ea47aSStefano Zampini 44408f1ea47aSStefano Zampini Input Parameter: 44418f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44428f1ea47aSStefano Zampini 44438f1ea47aSStefano Zampini Output Parameter: 44448f1ea47aSStefano Zampini . 
array - pointer to the data 44458f1ea47aSStefano Zampini 44468f1ea47aSStefano Zampini Level: intermediate 44478f1ea47aSStefano Zampini 4448db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44498f1ea47aSStefano Zampini @*/ 44508f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 44518f1ea47aSStefano Zampini { 4452d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44538f1ea47aSStefano Zampini 44548f1ea47aSStefano Zampini PetscFunctionBegin; 4455d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44569566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A,array)); 4457d67d9f35SJunchao Zhang } else { 4458d67d9f35SJunchao Zhang *array = aij->a; 4459d67d9f35SJunchao Zhang } 44608f1ea47aSStefano Zampini PetscFunctionReturn(0); 44618f1ea47aSStefano Zampini } 44628f1ea47aSStefano Zampini 44638f1ea47aSStefano Zampini /*@C 44648f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 44658f1ea47aSStefano Zampini 44668f1ea47aSStefano Zampini Not Collective 44678f1ea47aSStefano Zampini 44688f1ea47aSStefano Zampini Input Parameter: 44698f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44708f1ea47aSStefano Zampini 44718f1ea47aSStefano Zampini Output Parameter: 44728f1ea47aSStefano Zampini . 
array - pointer to the data 44738f1ea47aSStefano Zampini 44748f1ea47aSStefano Zampini Level: intermediate 44758f1ea47aSStefano Zampini 4476db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44778f1ea47aSStefano Zampini @*/ 44788f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 44798f1ea47aSStefano Zampini { 4480d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44818f1ea47aSStefano Zampini 44828f1ea47aSStefano Zampini PetscFunctionBegin; 4483d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44849566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A,array)); 4485d67d9f35SJunchao Zhang } else { 4486d67d9f35SJunchao Zhang *array = NULL; 4487d67d9f35SJunchao Zhang } 4488d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4489d67d9f35SJunchao Zhang } 4490d67d9f35SJunchao Zhang 4491d67d9f35SJunchao Zhang /*@C 4492d67d9f35SJunchao Zhang MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a MATSEQAIJ matrix is stored 4493d67d9f35SJunchao Zhang 4494d67d9f35SJunchao Zhang Not Collective 4495d67d9f35SJunchao Zhang 4496d67d9f35SJunchao Zhang Input Parameter: 4497d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4498d67d9f35SJunchao Zhang 4499d67d9f35SJunchao Zhang Output Parameter: 4500d67d9f35SJunchao Zhang . 
array - pointer to the data 4501d67d9f35SJunchao Zhang 4502d67d9f35SJunchao Zhang Level: intermediate 4503d67d9f35SJunchao Zhang 4504db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4505d67d9f35SJunchao Zhang @*/ 4506d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJGetArrayWrite(Mat A,PetscScalar **array) 4507d67d9f35SJunchao Zhang { 4508d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4509d67d9f35SJunchao Zhang 4510d67d9f35SJunchao Zhang PetscFunctionBegin; 4511d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45129566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A,array)); 4513d67d9f35SJunchao Zhang } else { 4514d67d9f35SJunchao Zhang *array = aij->a; 4515d67d9f35SJunchao Zhang } 45169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45179566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4518d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4519d67d9f35SJunchao Zhang } 4520d67d9f35SJunchao Zhang 4521d67d9f35SJunchao Zhang /*@C 4522d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4523d67d9f35SJunchao Zhang 4524d67d9f35SJunchao Zhang Not Collective 4525d67d9f35SJunchao Zhang 4526d67d9f35SJunchao Zhang Input Parameter: 4527d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4528d67d9f35SJunchao Zhang 4529d67d9f35SJunchao Zhang Output Parameter: 4530d67d9f35SJunchao Zhang . 
array - pointer to the data 4531d67d9f35SJunchao Zhang 4532d67d9f35SJunchao Zhang Level: intermediate 4533d67d9f35SJunchao Zhang 4534db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4535d67d9f35SJunchao Zhang @*/ 4536d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A,PetscScalar **array) 4537d67d9f35SJunchao Zhang { 4538d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4539d67d9f35SJunchao Zhang 4540d67d9f35SJunchao Zhang PetscFunctionBegin; 4541d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45429566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A,array)); 4543d67d9f35SJunchao Zhang } else { 4544d67d9f35SJunchao Zhang *array = NULL; 4545d67d9f35SJunchao Zhang } 45468f1ea47aSStefano Zampini PetscFunctionReturn(0); 45478f1ea47aSStefano Zampini } 45488f1ea47aSStefano Zampini 45498f1ea47aSStefano Zampini /*@C 45507ee59b9bSJunchao Zhang MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the SEQAIJ matrix 45517ee59b9bSJunchao Zhang 45527ee59b9bSJunchao Zhang Not Collective 45537ee59b9bSJunchao Zhang 45547ee59b9bSJunchao Zhang Input Parameter: 45557ee59b9bSJunchao Zhang . mat - a matrix of type MATSEQAIJ or its subclasses 45567ee59b9bSJunchao Zhang 45577ee59b9bSJunchao Zhang Output Parameters: 45587ee59b9bSJunchao Zhang + i - row map array of the matrix 45597ee59b9bSJunchao Zhang . j - column index array of the matrix 45607ee59b9bSJunchao Zhang . a - data array of the matrix 45617ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45627ee59b9bSJunchao Zhang 45637ee59b9bSJunchao Zhang Notes: 45647ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45657ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45667ee59b9bSJunchao Zhang 45677ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45687ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45697ee59b9bSJunchao Zhang 45707ee59b9bSJunchao Zhang Level: Developer 45717ee59b9bSJunchao Zhang 4572db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45737ee59b9bSJunchao Zhang @*/ 45747ee59b9bSJunchao Zhang PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat,const PetscInt **i,const PetscInt **j,PetscScalar **a,PetscMemType *mtype) 45757ee59b9bSJunchao Zhang { 45767ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 45777ee59b9bSJunchao Zhang 45787ee59b9bSJunchao Zhang PetscFunctionBegin; 45797ee59b9bSJunchao Zhang PetscCheck(mat->preallocated,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"matrix is not preallocated"); 45807ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45817ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat,i,j,a,mtype)); 45827ee59b9bSJunchao Zhang } else { 45837ee59b9bSJunchao Zhang if (i) *i = aij->i; 45847ee59b9bSJunchao Zhang if (j) *j = aij->j; 45857ee59b9bSJunchao Zhang if (a) *a = aij->a; 45867ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45877ee59b9bSJunchao Zhang } 45887ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45897ee59b9bSJunchao Zhang } 45907ee59b9bSJunchao Zhang 45917ee59b9bSJunchao Zhang /*@C 459221e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 459321e72a00SBarry Smith 459421e72a00SBarry Smith Not Collective 459521e72a00SBarry Smith 459621e72a00SBarry Smith Input Parameter: 4597579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 459821e72a00SBarry Smith 459921e72a00SBarry Smith Output Parameter: 460021e72a00SBarry Smith . 
/*
  MatSetPreallocationCOO_SeqAIJ - builds the CSR nonzero pattern of mat from coo_n (row,column) index
  pairs and records on the Mat_SeqAIJ struct the mapping needed to later scatter COO values into it.

  Input Parameters:
+ mat   - the matrix whose pattern is (re)built
. coo_n - number of (row,column) pairs
. coo_i - row indices, modified in place (see Notes)
- coo_j - column indices, modified in place (see Notes)

  Notes:
  coo_i[] and coo_j[] are overwritten: an entry with a negative column gets its row set to -1, then the
  arrays are sorted. Entries whose row is negative after that step are skipped.

  Repeated (row,column) pairs collapse into one nonzero. On return
    perm[] (length coo_n-nneg) lists the original positions of the kept entries in sorted order, and
    jmap[] (length nnz+1) is CSR-like: entries perm[jmap[q]] .. perm[jmap[q+1]-1] all feed unique nonzero q.
  The value array is allocated zeroed.

  NOTE(review): row indices are not checked against M before being used to index Ai[]; presumably the
  caller guarantees they are in range - confirm.
*/
PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
{
  MPI_Comm    comm;
  PetscInt    *i,*j;
  PetscInt    M,N,row;
  PetscCount  k,p,q,nneg,nnz,start,end; /* Index the coo array, so use PetscCount as their type */
  PetscInt    *Ai; /* Change to PetscCount once we use it for row pointers */
  PetscInt    *Aj;
  PetscScalar *Aa;
  Mat_SeqAIJ  *seqaij = (Mat_SeqAIJ*)(mat->data);
  MatType     rtype;
  PetscCount  *perm,*jmap;

  PetscFunctionBegin;
  PetscCall(MatResetPreallocationCOO_SeqAIJ(mat));
  PetscCall(PetscObjectGetComm((PetscObject)mat,&comm)); /* comm is fetched but not used further in this routine */
  PetscCall(MatGetSize(mat,&M,&N));
  i = coo_i;
  j = coo_j;
  PetscCall(PetscMalloc1(coo_n,&perm));
  for (k=0; k<coo_n; k++) { /* Ignore entries with negative row or col indices */
    if (j[k] < 0) i[k] = -1; /* a negative column is folded into a negative row so one test covers both */
    perm[k] = k;             /* identity permutation; the sorts below carry it along */
  }

  /* Sort by row */
  PetscCall(PetscSortIntWithIntCountArrayPair(coo_n,i,j,perm));
  for (k=0; k<coo_n; k++) {if (i[k] >= 0) break;} /* Advance k to the first row with a non-negative index */
  nneg = k; /* number of leading entries to ignore */
  PetscCall(PetscMalloc1(coo_n-nneg+1,&jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
  nnz  = 0; /* Total number of unique nonzeros to be counted */
  jmap++; /* Inc jmap by 1 for convenience: counts are written one slot ahead so the prefix sum below yields offsets */

  PetscCall(PetscCalloc1(M+1,&Ai)); /* CSR of A */
  PetscCall(PetscMalloc1(coo_n-nneg,&Aj)); /* We have at most coo_n-nneg unique nonzeros */

  /* In each row, sort by column, then unique column indices to get row length */
  Ai++; /* Inc by 1 for convenience: Ai[row] now addresses slot row+1 of the allocation */
  q = 0; /* q-th unique nonzero, with q starting from 0 */
  while (k<coo_n) {
    row   = i[k];
    start = k; /* [start,end) indices for this row */
    while (k<coo_n && i[k] == row) k++;
    end   = k;
    PetscCall(PetscSortIntWithCountArray(end-start,j+start,perm+start));
    /* Find number of unique col entries in this row */
    Aj[q]   = j[start]; /* Log the first nonzero in this row */
    jmap[q] = 1; /* Number of repeats of this nonzero entry */
    Ai[row] = 1;
    nnz++;

    for (p=start+1; p<end; p++) { /* Scan remaining nonzero in this row */
      if (j[p] != j[p-1]) { /* Meet a new nonzero */
        q++;
        jmap[q] = 1;
        Aj[q]   = j[p];
        Ai[row]++;
        nnz++;
      } else {
        jmap[q]++;
      }
    }
    q++; /* Move to next row and thus next unique nonzero */
  }

  Ai--; /* Back to the beginning of Ai[] */
  for (k=0; k<M; k++) Ai[k+1] += Ai[k]; /* prefix sum: per-row counts -> row pointers */
  jmap--; /* Back to the beginning of jmap[] */
  jmap[0] = 0;
  for (k=0; k<nnz; k++) jmap[k+1] += jmap[k]; /* prefix sum: repeat counts -> offsets into perm[] */
  if (nnz < coo_n-nneg) { /* Realloc with actual number of unique nonzeros */
    PetscCount *jmap_new;
    PetscInt   *Aj_new;

    PetscCall(PetscMalloc1(nnz+1,&jmap_new));
    PetscCall(PetscArraycpy(jmap_new,jmap,nnz+1));
    PetscCall(PetscFree(jmap));
    jmap = jmap_new;

    PetscCall(PetscMalloc1(nnz,&Aj_new));
    PetscCall(PetscArraycpy(Aj_new,Aj,nnz));
    PetscCall(PetscFree(Aj));
    Aj   = Aj_new;
  }

  if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
    PetscCount *perm_new;

    PetscCall(PetscMalloc1(coo_n-nneg,&perm_new));
    PetscCall(PetscArraycpy(perm_new,perm+nneg,coo_n-nneg));
    PetscCall(PetscFree(perm));
    perm = perm_new;
  }

  PetscCall(MatGetRootType_Private(mat,&rtype));
  PetscCall(PetscCalloc1(nnz,&Aa)); /* Zero the matrix */
  PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF,M,N,Ai,Aj,Aa,rtype,mat));

  seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */
  seqaij->free_a       = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
  /* Record COO fields */
  seqaij->coo_n        = coo_n;
  seqaij->Atot         = coo_n-nneg; /* Annz is seqaij->nz, so no need to record that again */
  seqaij->jmap         = jmap; /* of length nnz+1 */
  seqaij->perm         = perm;
  PetscFunctionReturn(0);
}
4734b6c38306SJunchao Zhang for (j=jmap[i]; j<jmap[i+1]; j++) sum += v[perm[j]]; 4735b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES? 0.0 : Aa[i]) + sum; 4736394ed5ebSJunchao Zhang } 47379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&Aa)); 4738394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4739394ed5ebSJunchao Zhang } 4740394ed5ebSJunchao Zhang 474134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47425063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat,MatType,MatReuse,Mat*); 474302fe1965SBarry Smith #endif 47443d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47455063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat,MatType,MatReuse,Mat*); 47463d0639e7SStefano Zampini #endif 474702fe1965SBarry Smith 47488cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4749273d9f13SBarry Smith { 4750273d9f13SBarry Smith Mat_SeqAIJ *b; 475138baddfdSBarry Smith PetscMPIInt size; 4752273d9f13SBarry Smith 4753273d9f13SBarry Smith PetscFunctionBegin; 47549566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B),&size)); 475508401ef6SPierre Jolivet PetscCheck(size <= 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4756273d9f13SBarry Smith 47579566063dSJacob Faibussowitsch PetscCall(PetscNewLog(B,&b)); 47582205254eSKarl Rupp 4759b0a32e0cSBarry Smith B->data = (void*)b; 47602205254eSKarl Rupp 47619566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps))); 4762071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47632205254eSKarl Rupp 4764f4259b30SLisandro Dalcin b->row = NULL; 4765f4259b30SLisandro Dalcin b->col = NULL; 4766f4259b30SLisandro Dalcin b->icol = NULL; 4767b810aeb4SBarry Smith b->reallocs = 0; 476836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4769f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 
4770416022c9SBarry Smith b->nonew = 0; 4771f4259b30SLisandro Dalcin b->diag = NULL; 4772f4259b30SLisandro Dalcin b->solve_work = NULL; 4773f4259b30SLisandro Dalcin B->spptr = NULL; 4774f4259b30SLisandro Dalcin b->saved_values = NULL; 4775f4259b30SLisandro Dalcin b->idiag = NULL; 4776f4259b30SLisandro Dalcin b->mdiag = NULL; 4777f4259b30SLisandro Dalcin b->ssor_work = NULL; 477871f1c65dSBarry Smith b->omega = 1.0; 477971f1c65dSBarry Smith b->fshift = 0.0; 478071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4781bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4782a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 478317ab2063SBarry Smith 47849566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 4785b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 47869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ)); 47879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ)); 4788b3866ffcSBarry Smith #endif 47899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ)); 47909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ)); 47919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ)); 47929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ)); 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ)); 47949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM)); 
47959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL)); 47969779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL)); 4798191b95cbSRichard Tran Mills #endif 479934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",MatProductSetFromOptions_SeqAIJ)); 480302fe1965SBarry Smith #endif 48043d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijkokkos_C",MatConvert_SeqAIJ_SeqAIJKokkos)); 48063d0639e7SStefano Zampini #endif 48079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL)); 4808af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental)); 4810af8000cdSHong Zhang #endif 4811d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_scalapack_C",MatConvert_AIJ_ScaLAPACK)); 4813d24d4204SJose E. 
Roman #endif 481463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE)); 48169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ)); 481763c07aadSStefano Zampini #endif 48189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense)); 48199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL)); 48209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS)); 48219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ)); 48229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ)); 48239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ)); 48249566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ)); 48259566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ)); 48279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ)); 48289566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ)); 48299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJKron_C",MatSeqAIJKron_SeqAIJ)); 48319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_SeqAIJ)); 48329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_SeqAIJ)); 48339566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 48359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48363a40ed3dSBarry Smith PetscFunctionReturn(0); 483717ab2063SBarry Smith } 483817ab2063SBarry Smith 4839b24902e0SBarry Smith /* 48403893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4841b24902e0SBarry Smith */ 4842ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 484317ab2063SBarry Smith { 48442a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data,*a = (Mat_SeqAIJ*)A->data; 4845071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 484617ab2063SBarry Smith 48473a40ed3dSBarry Smith PetscFunctionBegin; 4848aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot duplicate unassembled matrix"); 4849273d9f13SBarry Smith 4850d5f3da31SBarry Smith C->factortype = A->factortype; 4851f4259b30SLisandro Dalcin c->row = NULL; 4852f4259b30SLisandro Dalcin c->col = 
NULL; 4853f4259b30SLisandro Dalcin c->icol = NULL; 48546ad4291fSHong Zhang c->reallocs = 0; 485517ab2063SBarry Smith 485669272f91SPierre Jolivet C->assembled = A->assembled; 485769272f91SPierre Jolivet C->preallocated = A->preallocated; 485817ab2063SBarry Smith 485969272f91SPierre Jolivet if (A->preallocated) { 48609566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap,&C->rmap)); 48619566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap,&C->cmap)); 4862eec197d1SBarry Smith 48639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->imax)); 48649566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt))); 48659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->ilen)); 48669566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt))); 48679566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt))); 486817ab2063SBarry Smith 486917ab2063SBarry Smith /* allocate the matrix space */ 4870f77e22a1SHong Zhang if (mallocmatspace) { 48719566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i)); 48729566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt))); 48732205254eSKarl Rupp 4874f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48752205254eSKarl Rupp 48769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i,a->i,m+1)); 487717ab2063SBarry Smith if (m > 0) { 48789566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j,a->j,a->i[m])); 4879be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48802e5835c6SStefano Zampini const PetscScalar *aa; 48812e5835c6SStefano Zampini 48829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 48839566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a,aa,a->i[m])); 48849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 
4885be6bf707SBarry Smith } else { 48869566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a,a->i[m])); 488717ab2063SBarry Smith } 488808480c60SBarry Smith } 4889f77e22a1SHong Zhang } 489017ab2063SBarry Smith 48916ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4892416022c9SBarry Smith c->roworiented = a->roworiented; 4893416022c9SBarry Smith c->nonew = a->nonew; 4894416022c9SBarry Smith if (a->diag) { 48959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&c->diag)); 48969566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt))); 48979566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt))); 4898071fcb05SBarry Smith } else c->diag = NULL; 48992205254eSKarl Rupp 4900f4259b30SLisandro Dalcin c->solve_work = NULL; 4901f4259b30SLisandro Dalcin c->saved_values = NULL; 4902f4259b30SLisandro Dalcin c->idiag = NULL; 4903f4259b30SLisandro Dalcin c->ssor_work = NULL; 4904a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4905e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4906e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49076ad4291fSHong Zhang 4908893ad86cSHong Zhang c->rmax = a->rmax; 4909416022c9SBarry Smith c->nz = a->nz; 49108ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4911754ec7b1SSatish Balay 49126ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49136ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4914cd6b891eSBarry Smith if (a->compressedrow.use) { 49156ad4291fSHong Zhang i = a->compressedrow.nrows; 49169566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex)); 49179566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1)); 49189566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i)); 491927ea64f8SHong Zhang } else { 492027ea64f8SHong 
Zhang c->compressedrow.use = PETSC_FALSE; 49210298fd71SBarry Smith c->compressedrow.i = NULL; 49220298fd71SBarry Smith c->compressedrow.rindex = NULL; 49236ad4291fSHong Zhang } 4924ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4925e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49264846f1f5SKris Buschelman 49279566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C)); 492869272f91SPierre Jolivet } 49299566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist)); 49303a40ed3dSBarry Smith PetscFunctionReturn(0); 493117ab2063SBarry Smith } 493217ab2063SBarry Smith 4933b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4934b24902e0SBarry Smith { 4935b24902e0SBarry Smith PetscFunctionBegin; 49369566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 49379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n)); 4938cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 49399566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 4940cfd3f464SBarry Smith } 49419566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 49429566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE)); 4943b24902e0SBarry Smith PetscFunctionReturn(0); 4944b24902e0SBarry Smith } 4945b24902e0SBarry Smith 4946112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4947fbdbba38SShri Abhyankar { 494852f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 494952f91c60SVaclav Hapla 495052f91c60SVaclav Hapla PetscFunctionBegin; 495152f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 495252f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4953c27b3999SVaclav Hapla /* force binary viewer to load .info file 
if it has not yet done so */ 49549566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49559566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 49569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5)); 495752f91c60SVaclav Hapla if (isbinary) { 49589566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat,viewer)); 495952f91c60SVaclav Hapla } else if (ishdf5) { 496052f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49619566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat,viewer)); 496252f91c60SVaclav Hapla #else 496352f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 496452f91c60SVaclav Hapla #endif 496552f91c60SVaclav Hapla } else { 496698921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 496752f91c60SVaclav Hapla } 496852f91c60SVaclav Hapla PetscFunctionReturn(0); 496952f91c60SVaclav Hapla } 497052f91c60SVaclav Hapla 49713ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 497252f91c60SVaclav Hapla { 49733ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 49743ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 4975fbdbba38SShri Abhyankar 4976fbdbba38SShri Abhyankar PetscFunctionBegin; 49779566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4978bbead8a2SBarry Smith 49793ea6fe3dSLisandro Dalcin /* read in matrix header */ 49809566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT)); 498108401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 
4982fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 498308401ef6SPierre Jolivet PetscCheck(M >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%" PetscInt_FMT ") in file is negative",M); 498408401ef6SPierre Jolivet PetscCheck(N >= 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%" PetscInt_FMT ") in file is negative",N); 498508401ef6SPierre Jolivet PetscCheck(nz >= 0,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 4986fbdbba38SShri Abhyankar 49873ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49889566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat,viewer)); 49893ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49903ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49913ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49923ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49933ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49949566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49959566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49963ea6fe3dSLisandro Dalcin 49973ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49989566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 4999aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50003ea6fe3dSLisandro Dalcin 5001fbdbba38SShri Abhyankar /* read in row lengths */ 50029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M,&rowlens)); 50039566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT)); 50043ea6fe3dSLisandro Dalcin /* check if 
sum(rowlens) is same as nz */ 50053ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 500608401ef6SPierre Jolivet PetscCheck(sum == nz,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT,nz,sum); 50073ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens)); 50099566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 5010aed4548fSBarry Smith PetscCheck(M == rows && N == cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50113ea6fe3dSLisandro Dalcin /* store row lengths */ 50129566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen,rowlens,M)); 50139566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5014fbdbba38SShri Abhyankar 50153ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50163ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 50173ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50189566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT)); 50193ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50209566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR)); 5021fbdbba38SShri Abhyankar 50229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY)); 50239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); 5024fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5025fbdbba38SShri Abhyankar } 5026fbdbba38SShri Abhyankar 5027ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 50287264ac53SSatish Balay { 50297264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = 
(Mat_SeqAIJ*)B->data; 5030fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 5031eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5032eeffb40dSHong Zhang PetscInt k; 5033eeffb40dSHong Zhang #endif 50347264ac53SSatish Balay 50353a40ed3dSBarry Smith PetscFunctionBegin; 5036bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5037d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 5038ca44d042SBarry Smith *flg = PETSC_FALSE; 5039ca44d042SBarry Smith PetscFunctionReturn(0); 5040bcd2baecSBarry Smith } 50417264ac53SSatish Balay 50427264ac53SSatish Balay /* if the a->i are the same */ 50439566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i,b->i,A->rmap->n+1,flg)); 5044abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50457264ac53SSatish Balay 50467264ac53SSatish Balay /* if a->j are the same */ 50479566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j,b->j,a->nz,flg)); 5048abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5049bcd2baecSBarry Smith 50509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 50519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 5052bcd2baecSBarry Smith /* if a->a are the same */ 5053eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5054eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 5055fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5056eeffb40dSHong Zhang *flg = PETSC_FALSE; 50573a40ed3dSBarry Smith PetscFunctionReturn(0); 5058eeffb40dSHong Zhang } 5059eeffb40dSHong Zhang } 5060eeffb40dSHong Zhang #else 50619566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa,ba,a->nz,flg)); 5062eeffb40dSHong Zhang #endif 50639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 50649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 5065eeffb40dSHong Zhang PetscFunctionReturn(0); 
50667264ac53SSatish Balay } 506736db0b34SBarry Smith 506805869f15SSatish Balay /*@ 506936db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 507036db0b34SBarry Smith provided by the user. 507136db0b34SBarry Smith 5072d083f849SBarry Smith Collective 507336db0b34SBarry Smith 507436db0b34SBarry Smith Input Parameters: 507536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 507636db0b34SBarry Smith . m - number of rows 507736db0b34SBarry Smith . n - number of columns 5078483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 507936db0b34SBarry Smith . j - column indices 508036db0b34SBarry Smith - a - matrix values 508136db0b34SBarry Smith 508236db0b34SBarry Smith Output Parameter: 508336db0b34SBarry Smith . mat - the matrix 508436db0b34SBarry Smith 508536db0b34SBarry Smith Level: intermediate 508636db0b34SBarry Smith 508736db0b34SBarry Smith Notes: 50880551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5089292fb18eSBarry Smith once the matrix is destroyed and not before 509036db0b34SBarry Smith 509136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 509236db0b34SBarry Smith 5093bfeeae90SHong Zhang The i and j indices are 0 based 509436db0b34SBarry Smith 5095a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5096a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50978eef79e4SBarry Smith as shown 5098a4552177SSatish Balay 50998eef79e4SBarry Smith $ 1 0 0 51008eef79e4SBarry Smith $ 2 0 3 51018eef79e4SBarry Smith $ 4 5 6 51028eef79e4SBarry Smith $ 51038eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51048eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51058eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5106a4552177SSatish Balay 5107db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 510836db0b34SBarry Smith 510936db0b34SBarry Smith @*/ 5110c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 511136db0b34SBarry Smith { 5112cbcfb4deSHong Zhang PetscInt ii; 511336db0b34SBarry Smith Mat_SeqAIJ *aij; 5114cbcfb4deSHong Zhang PetscInt jj; 511536db0b34SBarry Smith 511636db0b34SBarry Smith PetscFunctionBegin; 5117aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 51189566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 51199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 51209566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51219566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 51229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,NULL)); 5123ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 51249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->imax)); 51259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->ilen)); 5126ab93d7beSBarry Smith 512736db0b34SBarry Smith aij->i = i; 512836db0b34SBarry Smith aij->j = j; 512936db0b34SBarry Smith aij->a = a; 513036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
513136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5132e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5133e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 513436db0b34SBarry Smith 5135cbc6b225SStefano Zampini for (ii=0,aij->nonzerorowcnt=0,aij->rmax=0; ii<m; ii++) { 513636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 513776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5138aed4548fSBarry Smith PetscCheck(i[ii+1] - i[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT,ii,i[ii+1] - i[ii]); 51399985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 514008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted",jj-i[ii],j[jj],ii); 514108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry",jj-i[ii],j[jj],ii); 51429985e31cSBarry Smith } 514336db0b34SBarry Smith } 514476bd3646SJed Brown } 514576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 514636db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 514708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 5148aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 514936db0b34SBarry Smith } 515076bd3646SJed Brown } 515136db0b34SBarry Smith 51529566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 51539566063dSJacob Faibussowitsch 
PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 515436db0b34SBarry Smith PetscFunctionReturn(0); 515536db0b34SBarry Smith } 5156cbc6b225SStefano Zampini 5157f62e3866SBarry Smith /*@ 5158d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 51598a0b0e6bSVictor Minden provided by the user. 51608a0b0e6bSVictor Minden 5161d083f849SBarry Smith Collective 51628a0b0e6bSVictor Minden 51638a0b0e6bSVictor Minden Input Parameters: 51648a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51658a0b0e6bSVictor Minden . m - number of rows 51668a0b0e6bSVictor Minden . n - number of columns 51678a0b0e6bSVictor Minden . i - row indices 51688a0b0e6bSVictor Minden . j - column indices 51691230e6d1SVictor Minden . a - matrix values 51701230e6d1SVictor Minden . nz - number of nonzeros 5171f62e3866SBarry Smith - idx - if the i and j indices start with 1 use PETSC_TRUE otherwise use PETSC_FALSE 51728a0b0e6bSVictor Minden 51738a0b0e6bSVictor Minden Output Parameter: 51748a0b0e6bSVictor Minden . 
mat - the matrix 51758a0b0e6bSVictor Minden 51768a0b0e6bSVictor Minden Level: intermediate 51778a0b0e6bSVictor Minden 5178f62e3866SBarry Smith Example: 5179f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51809e99939fSJunchao Zhang .vb 51818a0b0e6bSVictor Minden 1 0 0 51828a0b0e6bSVictor Minden 2 0 3 51838a0b0e6bSVictor Minden 4 5 6 51848a0b0e6bSVictor Minden 51858a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51868a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51878a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51889e99939fSJunchao Zhang .ve 51898a0b0e6bSVictor Minden 5190db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()` 51918a0b0e6bSVictor Minden 51928a0b0e6bSVictor Minden @*/ 5193c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 51948a0b0e6bSVictor Minden { 5195d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 51968a0b0e6bSVictor Minden 51978a0b0e6bSVictor Minden PetscFunctionBegin; 51989566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m,&nnz)); 51991230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 5200c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 52011230e6d1SVictor Minden } 52029566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 52039566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 52049566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 52059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz)); 52061230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52071230e6d1SVictor Minden if (idx) { 52081230e6d1SVictor Minden row = i[ii] - 1; 52091230e6d1SVictor Minden col = j[ii] - 1; 52101230e6d1SVictor Minden } else { 52111230e6d1SVictor Minden row = i[ii]; 52121230e6d1SVictor Minden col = j[ii]; 
52138a0b0e6bSVictor Minden } 52149566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES)); 52158a0b0e6bSVictor Minden } 52169566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 52179566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 52189566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52198a0b0e6bSVictor Minden PetscFunctionReturn(0); 52208a0b0e6bSVictor Minden } 522136db0b34SBarry Smith 5222acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5223acf2f550SJed Brown { 5224acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 5225acf2f550SJed Brown 5226acf2f550SJed Brown PetscFunctionBegin; 5227acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5228acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52292205254eSKarl Rupp 52309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5231acf2f550SJed Brown PetscFunctionReturn(0); 5232acf2f550SJed Brown } 5233acf2f550SJed Brown 52349c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 52359c8f2541SHong Zhang { 52369c8f2541SHong Zhang PetscFunctionBegin; 52379566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat)); 52389c8f2541SHong Zhang PetscFunctionReturn(0); 52399c8f2541SHong Zhang } 52409c8f2541SHong Zhang 524181824310SBarry Smith /* 524253dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 524353dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 524453dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 524553dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 
524653dd7562SDmitry Karpeev */ 524753dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 524853dd7562SDmitry Karpeev { 524953dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 525053dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 525153dd7562SDmitry Karpeev PetscBool seqaij; 525253dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 525353dd7562SDmitry Karpeev PetscScalar v; 525453dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 525553dd7562SDmitry Karpeev 525653dd7562SDmitry Karpeev PetscFunctionBegin; 525753dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 525853dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 52599566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij)); 526028b400f6SJacob Faibussowitsch PetscCheck(seqaij,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 526153dd7562SDmitry Karpeev if (rowemb) { 52629566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb,&m)); 526308401ef6SPierre Jolivet PetscCheck(m == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT,m,B->rmap->n); 526453dd7562SDmitry Karpeev } else { 526508401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 526653dd7562SDmitry Karpeev } 526753dd7562SDmitry Karpeev if (colemb) { 52689566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb,&n)); 526908401ef6SPierre Jolivet PetscCheck(n == B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT,n,B->cmap->n); 527053dd7562SDmitry Karpeev } else { 527108401ef6SPierre Jolivet PetscCheck(C->cmap->n == 
B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 527253dd7562SDmitry Karpeev } 527353dd7562SDmitry Karpeev 527453dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 527553dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&nz)); 527753dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 527853dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 527953dd7562SDmitry Karpeev } 52809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C,0,nz)); 52819566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 528253dd7562SDmitry Karpeev } 528353dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 52849566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(C)); 528553dd7562SDmitry Karpeev } 528653dd7562SDmitry Karpeev count = 0; 528753dd7562SDmitry Karpeev rowindices = NULL; 528853dd7562SDmitry Karpeev colindices = NULL; 528953dd7562SDmitry Karpeev if (rowemb) { 52909566063dSJacob Faibussowitsch PetscCall(ISGetIndices(rowemb,&rowindices)); 529153dd7562SDmitry Karpeev } 529253dd7562SDmitry Karpeev if (colemb) { 52939566063dSJacob Faibussowitsch PetscCall(ISGetIndices(colemb,&colindices)); 529453dd7562SDmitry Karpeev } 529553dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 529653dd7562SDmitry Karpeev PetscInt row; 529753dd7562SDmitry Karpeev row = i; 529853dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 529953dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 530053dd7562SDmitry Karpeev PetscInt col; 530153dd7562SDmitry Karpeev col = Baij->j[count]; 530253dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 530353dd7562SDmitry Karpeev v = Baij->a[count]; 53049566063dSJacob Faibussowitsch PetscCall(MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES)); 530553dd7562SDmitry Karpeev ++count; 530653dd7562SDmitry Karpeev } 530753dd7562SDmitry Karpeev } 530853dd7562SDmitry Karpeev /* FIXME: set 
C's nonzerostate correctly. */ 530953dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 531053dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 531153dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 531253dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 531353dd7562SDmitry Karpeev PetscFunctionReturn(0); 531453dd7562SDmitry Karpeev } 531553dd7562SDmitry Karpeev 53164099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53174099cc6bSBarry Smith 53184099cc6bSBarry Smith /*@C 53194099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 53204099cc6bSBarry Smith 53214099cc6bSBarry Smith Collective on Mat 53224099cc6bSBarry Smith 53234099cc6bSBarry Smith Input Parameters: 53244099cc6bSBarry Smith + mat - the matrix object 53254099cc6bSBarry Smith - matype - matrix type 53264099cc6bSBarry Smith 53274099cc6bSBarry Smith Options Database Key: 53284099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 53294099cc6bSBarry Smith 53304099cc6bSBarry Smith Level: intermediate 53314099cc6bSBarry Smith 5332db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53334099cc6bSBarry Smith @*/ 53344099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 53354099cc6bSBarry Smith { 53364099cc6bSBarry Smith PetscBool sametype; 53375f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat,MatType,MatReuse,Mat*); 53384099cc6bSBarry Smith 53394099cc6bSBarry Smith PetscFunctionBegin; 53404099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 53419566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat,matype,&sametype)); 53424099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53434099cc6bSBarry Smith 53449566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList,matype,&r)); 53455f80ce2aSJacob Faibussowitsch PetscCheck(r,PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 53469566063dSJacob 
Faibussowitsch PetscCall((*r)(mat,matype,MAT_INPLACE_MATRIX,&mat)); 53474099cc6bSBarry Smith PetscFunctionReturn(0); 53484099cc6bSBarry Smith } 53494099cc6bSBarry Smith 53504099cc6bSBarry Smith /*@C 53514099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 53524099cc6bSBarry Smith 53534099cc6bSBarry Smith Not Collective 53544099cc6bSBarry Smith 53554099cc6bSBarry Smith Input Parameters: 53564099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 53574099cc6bSBarry Smith - function - routine to convert to subtype 53584099cc6bSBarry Smith 53594099cc6bSBarry Smith Notes: 53604099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 53614099cc6bSBarry Smith 53624099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53634099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53644099cc6bSBarry Smith 53654099cc6bSBarry Smith Level: advanced 53664099cc6bSBarry Smith 5367db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53684099cc6bSBarry Smith 53694099cc6bSBarry Smith Level: advanced 53704099cc6bSBarry Smith @*/ 5371388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 53724099cc6bSBarry Smith { 53734099cc6bSBarry Smith PetscFunctionBegin; 53749566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53759566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList,sname,function)); 53764099cc6bSBarry Smith PetscFunctionReturn(0); 53774099cc6bSBarry Smith } 53784099cc6bSBarry Smith 53794099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53804099cc6bSBarry Smith 53814099cc6bSBarry Smith /*@C 53824099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 53834099cc6bSBarry Smith 53844099cc6bSBarry Smith Not Collective 53854099cc6bSBarry Smith 
53864099cc6bSBarry Smith Level: advanced 53874099cc6bSBarry Smith 5388db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53894099cc6bSBarry Smith @*/ 53904099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 53914099cc6bSBarry Smith { 53924099cc6bSBarry Smith PetscFunctionBegin; 53934099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53944099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53954099cc6bSBarry Smith 53969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 53999779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5401485f9817SRichard Tran Mills #endif 54025063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54045063d097SStefano Zampini #endif 54055063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54075063d097SStefano Zampini #endif 54084099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54104099cc6bSBarry Smith #endif 54114099cc6bSBarry Smith PetscFunctionReturn(0); 54124099cc6bSBarry Smith } 541353dd7562SDmitry Karpeev 541453dd7562SDmitry Karpeev /* 541581824310SBarry Smith Special version for direct calls from Fortran 541681824310SBarry Smith */ 5417af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 
541881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 541981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 542081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 542181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 542281824310SBarry Smith #endif 542381824310SBarry Smith 542481824310SBarry Smith /* Change these macros so can be used in void function */ 542598921bdaSJacob Faibussowitsch 542698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54279566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54289566063dSJacob Faibussowitsch #undef PetscCall 54299566063dSJacob Faibussowitsch #define PetscCall(...) do { \ 54305f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 543198921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 543298921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr_msv_mpiaij,PETSC_ERROR_REPEAT," "); \ 543398921bdaSJacob Faibussowitsch return; \ 543498921bdaSJacob Faibussowitsch } \ 543598921bdaSJacob Faibussowitsch } while (0) 543698921bdaSJacob Faibussowitsch 543798921bdaSJacob Faibussowitsch #undef SETERRQ 543898921bdaSJacob Faibussowitsch #define SETERRQ(comm,ierr,...) 
do { \ 543998921bdaSJacob Faibussowitsch *_ierr = PetscError(comm,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr,PETSC_ERROR_INITIAL,__VA_ARGS__); \ 544098921bdaSJacob Faibussowitsch return; \ 544198921bdaSJacob Faibussowitsch } while (0) 544281824310SBarry Smith 544319caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 544481824310SBarry Smith { 544581824310SBarry Smith Mat A = *AA; 544681824310SBarry Smith PetscInt m = *mm, n = *nn; 544781824310SBarry Smith InsertMode is = *isis; 544881824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 544981824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 545081824310SBarry Smith PetscInt *imax,*ai,*ailen; 545181824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 545254f21887SBarry Smith MatScalar *ap,value,*aa; 5453ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5454ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 545581824310SBarry Smith 545681824310SBarry Smith PetscFunctionBegin; 54574994cf47SJed Brown MatCheckPreallocated(A,1); 545881824310SBarry Smith imax = a->imax; 545981824310SBarry Smith ai = a->i; 546081824310SBarry Smith ailen = a->ilen; 546181824310SBarry Smith aj = a->j; 546281824310SBarry Smith aa = a->a; 546381824310SBarry Smith 546481824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 546581824310SBarry Smith row = im[k]; 546681824310SBarry Smith if (row < 0) continue; 54675f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 546881824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 546981824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 547081824310SBarry Smith low = 0; 547181824310SBarry Smith high = nrow; 547281824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 
547381824310SBarry Smith if (in[l] < 0) continue; 54745f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 547581824310SBarry Smith col = in[l]; 54762205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 54772205254eSKarl Rupp else value = v[k + l*m]; 54782205254eSKarl Rupp 547981824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 548081824310SBarry Smith 54812205254eSKarl Rupp if (col <= lastcol) low = 0; 54822205254eSKarl Rupp else high = nrow; 548381824310SBarry Smith lastcol = col; 548481824310SBarry Smith while (high-low > 5) { 548581824310SBarry Smith t = (low+high)/2; 548681824310SBarry Smith if (rp[t] > col) high = t; 548781824310SBarry Smith else low = t; 548881824310SBarry Smith } 548981824310SBarry Smith for (i=low; i<high; i++) { 549081824310SBarry Smith if (rp[i] > col) break; 549181824310SBarry Smith if (rp[i] == col) { 549281824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 549381824310SBarry Smith else ap[i] = value; 549481824310SBarry Smith goto noinsert; 549581824310SBarry Smith } 549681824310SBarry Smith } 549781824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 549881824310SBarry Smith if (nonew == 1) goto noinsert; 54995f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 5500fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 550181824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 550281824310SBarry Smith /* shift up all the later entries in this row */ 550381824310SBarry Smith for (ii=N; ii>=i; ii--) { 550481824310SBarry Smith rp[ii+1] = rp[ii]; 550581824310SBarry Smith ap[ii+1] = ap[ii]; 550681824310SBarry Smith } 550781824310SBarry Smith rp[i] = col; 550881824310SBarry Smith ap[i] = value; 5509e56f5c9eSBarry Smith 
A->nonzerostate++; 551081824310SBarry Smith noinsert:; 551181824310SBarry Smith low = i + 1; 551281824310SBarry Smith } 551381824310SBarry Smith ailen[row] = nrow; 551481824310SBarry Smith } 551581824310SBarry Smith PetscFunctionReturnVoid(); 551681824310SBarry Smith } 551798921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 551898921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 551998921bdaSJacob Faibussowitsch * original definitions */ 55209566063dSJacob Faibussowitsch #undef PetscCall 552198921bdaSJacob Faibussowitsch #undef SETERRQ 5522